python source code of test

Project: elasticintel (GitHub Link)

elasticintel-master
- whois_lambda
  - aws_requests_auth
    - aws_auth.py
    - __init__.py
    - boto_utils.py
  - whois.py
  - requests_aws4auth-0.9.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - ipwhois-1.0.0.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - LICENSE
  - requests_aws4auth
    - aws4signingkey.py
    - exceptions.py
    - service_parameters.py
    - six.py
    - test
      - requests_aws4auth_test.py
    - __init__.py
    - aws4auth.py
  - get_null_whois.json
  - ipwhois
    - whois.py
    - exceptions.py
    - asn.py
    - hr.py
    - rdap.py
    - net.py
    - data
      - iso_3166-1.csv
      - iso_3166-1_list_en.xml
    - nir.py
    - __init__.py
    - utils.py
    - experimental.py
    - ipwhois.py
  - requests-2.9.1.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - README.rst
  - lambda_function.py
  - HISTORY.rst
  - aws_requests_auth-0.3.3.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - dns
    - rdata.py
    - tsig.py
    - renderer.py
    - hash.py
    - opcode.py
    - rdatatype.py
    - tokenizer.py
    - ipv4.py
    - ttl.py
    - update.py
    - rcode.py
    - version.py
    - dnssec.py
    - zone.py
    - tsigkeyring.py
    - ipv6.py
    - reversename.py
    - wiredata.py
    - flags.py
    - rrset.py
    - query.py
    - rdtypes
      - mxbase.py
      - IN
        NSAP_PTR.py
        IPSECKEY.py
        DHCID.py
        KX.py
        AAAA.py
        PX.py
        NSAP.py
        __init__.py
        APL.py
        NAPTR.py
        WKS.py
        SRV.py
        A.py
      - ANY
        HIP.py
        DNSKEY.py
        EUI64.py
        NSEC3PARAM.py
        GPOS.py
        TLSA.py
        CAA.py
        LOC.py
        X25.py
        SOA.py
        SSHFP.py
        CNAME.py
        RRSIG.py
        DNAME.py
        AFSDB.py
        TXT.py
        ISDN.py
        HINFO.py
        AVC.py
        NSEC.py
        CDNSKEY.py
        EUI48.py
        NS.py
        CDS.py
        CERT.py
        DS.py
        __init__.py
        RT.py
        PTR.py
        NSEC3.py
        CSYNC.py
        URI.py
        DLV.py
        SPF.py
        MX.py
        RP.py
      - nsbase.py
      - __init__.py
      - euibase.py
      - txtbase.py
      - dnskeybase.py
      - dsbase.py
    - e164.py
    - rdataset.py
    - entropy.py
    - node.py
    - message.py
    - inet.py
    - _compat.py
    - __init__.py
    - exception.py
    - rdataclass.py
    - grange.py
    - set.py
    - name.py
    - edns.py
    - resolver.py
    - namedict.py
  - dnspython-1.15.0.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
    - LICENSE.txt
  - requirements.txt
  - NOTICE
  - requests
    - exceptions.py
    - sessions.py
    - hooks.py
    - status_codes.py
    - adapters.py
    - models.py
    - api.py
    - packages
      - chardet
        euctwfreq.py
        gb2312freq.py
        chardetect.py
        charsetgroupprober.py
        sbcharsetprober.py
        langhebrewmodel.py
        codingstatemachine.py
        big5prober.py
        langhungarianmodel.py
        mbcharsetprober.py
        langgreekmodel.py
        charsetprober.py
        euctwprober.py
        eucjpprober.py
        mbcsgroupprober.py
        escprober.py
        langbulgarianmodel.py
        utf8prober.py
        euckrfreq.py
        universaldetector.py
        mbcssm.py
        sbcsgroupprober.py
        hebrewprober.py
        constants.py
        sjisprober.py
        langthaimodel.py
        cp949prober.py
        latin1prober.py
        chardistribution.py
        __init__.py
        gb2312prober.py
        escsm.py
        big5freq.py
        compat.py
        euckrprober.py
        langcyrillicmodel.py
        jisfreq.py
        jpcntx.py
      - urllib3
        fields.py
        request.py
        exceptions.py
        _collections.py
        util
        request.py
        response.py
        ssl_.py
        connection.py
        timeout.py
        __init__.py
        retry.py
        url.py
        response.py
        packages
        six.py
        ordered_dict.py
        __init__.py
        ssl_match_hostname
        _implementation.py
        __init__.py
        connection.py
        __init__.py
        poolmanager.py
        contrib
        appengine.py
        pyopenssl.py
        ntlmpool.py
        __init__.py
        connectionpool.py
        filepost.py
      - __init__.py
    - __init__.py
    - utils.py
    - auth.py
    - cookies.py
    - structures.py
    - compat.py
    - certs.py
- elasticintel.py
- helpers
  - intelparser.py
  - feed_mgr.py
  - elastic_intel_manager.py
  - lambdarunner.py
  - feed_runner.py
  - feedhelper.py
  - terraform.py
  - __init__.py
- LICENSE
- terraform
  - dev
    - sns
      - sns.tf
      - outputs.tf
      - backend.tf
      - variables.tf
    - whois_lambda
      - main.tf
      - backend.tf
      - variables.tf
    - intelbot_ssm_parameter_store
      - main.tf
      - outputs.tf
      - backend.tf
      - variables.tf
    - s3
      - s3.tf
      - outputs.tf
      - backend.tf
      - variables.tf
    - elasticsearch
      - outputs.tf
      - backend.tf
      - variables.tf
      - elasticsearch.tf
    - backend
      - main.tf
    - intelbot_api_gateway
      - main.tf
      - outputs.tf
      - backend.tf
      - variables.tf
    - lambda
      - config.json
      - lambda.tf
      - outputs.tf
      - backend.tf
      - variables.tf
    - intelbot_lambda
      - main.tf
      - outputs.tf
      - backend.tf
      - variables.tf
  - modules
    - sns
      - sns.tf
      - outputs.tf
      - variables.tf
    - whois_lambda
      - whois_lambda.tf
      - build_lambda.sh
      - outputs.tf
      - variables.tf
    - intelbot_ssm_parameter_store
      - ssm_parameter_store.tf
      - outputs.tf
      - variables.tf
    - s3
      - s3.tf
      - outputs.tf
      - variables.tf
    - elasticsearch
      - outputs.tf
      - variables.tf
      - elasticsearch.tf
    - intelbot_api_gateway
      - api_gateway.tf
      - outputs.tf
      - variables.tf
    - lambda
      - lambda.tf
      - test.sh
      - __init__.py
      - outputs.tf
      - variables.tf
    - __init__.py
    - intelbot_lambda
      - lambda.tf
      - outputs.tf
      - variables.tf
      - build.sh
- example.conf.example
- .travis.yml
- README.md
- tests
  - test_feeds
    - txt_feed.json
    - csv_feed.json
  - dummy_feed.csv
  - test_feeds.py
  - .cache
    - v
      - cache
        lastfailed
  - __init__.py
  - test_ioc_parser.py
- requirements.txt
- intelbot
  - aws_requests_auth
    - aws_auth.py
    - __init__.py
    - boto_utils.py
  - intelbot.py
  - iocsearch.py
  - manage.py
  - requests-2.9.1.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - lambda_function.py
  - __init__.py
  - aws_requests_auth-0.3.3.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - tests
    - test_bot_message.json
    - .cache
      - v
        cache
        lastfailed
    - test_lambdabot.py
    - test_user_event.json
  - iocsearch_lambda.py
  - lambdabot_config.json.example
  - requirements.txt
  - requests
    - exceptions.py
    - sessions.py
    - hooks.py
    - status_codes.py
    - adapters.py
    - models.py
    - api.py
    - packages
      - chardet
        euctwfreq.py
        gb2312freq.py
        chardetect.py
        charsetgroupprober.py
        sbcharsetprober.py
        langhebrewmodel.py
        codingstatemachine.py
        big5prober.py
        langhungarianmodel.py
        mbcharsetprober.py
        langgreekmodel.py
        charsetprober.py
        euctwprober.py
        eucjpprober.py
        mbcsgroupprober.py
        escprober.py
        langbulgarianmodel.py
        utf8prober.py
        euckrfreq.py
        universaldetector.py
        mbcssm.py
        sbcsgroupprober.py
        hebrewprober.py
        constants.py
        sjisprober.py
        langthaimodel.py
        cp949prober.py
        latin1prober.py
        chardistribution.py
        __init__.py
        gb2312prober.py
        escsm.py
        big5freq.py
        compat.py
        euckrprober.py
        langcyrillicmodel.py
        jisfreq.py
        jpcntx.py
      - urllib3
        fields.py
        request.py
        exceptions.py
        _collections.py
        util
        request.py
        response.py
        ssl_.py
        connection.py
        timeout.py
        __init__.py
        retry.py
        url.py
        response.py
        packages
        six.py
        ordered_dict.py
        __init__.py
        ssl_match_hostname
        _implementation.py
        __init__.py
        connection.py
        __init__.py
        poolmanager.py
        contrib
        appengine.py
        pyopenssl.py
        ntlmpool.py
        __init__.py
        connectionpool.py
        filepost.py
      - __init__.py
    - __init__.py
    - utils.py
    - auth.py
    - cookies.py
    - structures.py
    - compat.py
    - certs.py
- docs
  - images
  - GettingStarted.md
  - index.md
  - README.md
  - slack_bot_setup.md
- ingest_feed_lambda
  - aws_requests_auth
    - aws_auth.py
    - __init__.py
    - boto_utils.py
  - six-1.11.0.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - ioc_validators.py
  - decorator.py
  - numpy-1.13.3.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - intel_validator.py
  - six.py
  - api_feed_downloader.py
  - validators
    - ip_address.py
    - iban.py
    - length.py
    - extremes.py
    - i18n
      - fi.py
      - __init__.py
    - mac_address.py
    - slug.py
    - uuid.py
    - domain.py
    - email.py
    - __init__.py
    - utils.py
    - between.py
    - hashes.py
    - truthy.py
    - url.py
  - intel.py
  - pandas
    - testing.py
    - tseries
      - util.py
      - holiday.py
      - api.py
      - offsets.py
      - plotting.py
      - __init__.py
      - converter.py
      - frequencies.py
    - computation
      - expressions.py
      - __init__.py
    - api
      - types
        __init__.py
      - __init__.py
    - lib.py
    - _libs
      - tslibs
        __init__.py
      - __init__.py
    - compat
      - pickle_compat.py
      - numpy
        function.py
        __init__.py
      - __init__.py
      - openpyxl_compat.py
      - chainmap.py
      - chainmap_impl.py
    - util
      - testing.py
      - decorators.py
      - _depr_module.py
      - _validators.py
      - __init__.py
      - _print_versions.py
      - _doctools.py
      - _decorators.py
      - _move.cpython-36m-x86_64-linux-gnu.so
      - hashing.py
      - _tester.py
    - types
      - common.py
      - __init__.py
      - concat.py
    - io
      - feather_format.py
      - data.py
      - packers.py
      - sql.py
      - excel.py
      - date_converters.py
      - html.py
      - pickle.py
      - clipboard
        exceptions.py
        clipboards.py
        windows.py
        __init__.py
      - clipboards.py
      - stata.py
      - sas
        sas_constants.py
        sas_xport.py
        sas7bdat.py
        sasreader.py
        __init__.py
      - msgpack
        exceptions.py
        __init__.py
        _version.py
      - wb.py
      - s3.py
      - api.py
      - common.py
      - __init__.py
      - gbq.py
      - json
        table_schema.py
        normalize.py
        __init__.py
        json.py
      - parsers.py
      - parquet.py
      - pytables.py
      - formats
        excel.py
        terminal.py
        templates
        html.tpl
        printing.py
        console.py
        css.py
        common.py
        __init__.py
        format.py
        style.py
    - __init__.py
    - parser.py
    - tests
      - test_categorical.py
      - test_strings.py
      - internals
        test_external_block.py
        test_internals.py
        __init__.py
      - test_base.py
      - test_errors.py
      - sparse
        test_frame.py
        test_format.py
        test_libsparse.py
        test_combine_concat.py
        test_indexing.py
        test_reshape.py
        test_array.py
        test_groupby.py
        test_list.py
        test_arithmetics.py
        common.py
        __init__.py
        test_series.py
        test_pivot.py
      - test_algos.py
      - test_resample.py
      - tseries
        test_frequencies.py
        test_holiday.py
        test_timezones.py
        data
        cday-0.14.1.pickle
        dateoffset_0_15_2.pickle
        __init__.py
        conftest.py
      - test_window.py
      - test_compat.py
      - computation
        test_eval.py
        test_compat.py
        __init__.py
      - test_take.py
      - frame
        test_subclass.py
        test_block_internals.py
        test_query_eval.py
        test_alter_axes.py
        test_axis_select_reindex.py
        test_apply.py
        test_mutate_columns.py
        test_analytics.py
        test_combine_concat.py
        test_nonunique_indexes.py
        test_period.py
        test_indexing.py
        test_reshape.py
        test_validate.py
        test_sorting.py
        test_rank.py
        test_convert_to.py
        test_to_csv.py
        test_timeseries.py
        common.py
        __init__.py
        test_missing.py
        test_join.py
        test_constructors.py
        test_replace.py
        test_quantile.py
        test_dtypes.py
        test_api.py
        test_operators.py
        test_repr_info.py
        test_asof.py
      - test_lib.py
      - series
        test_subclass.py
        test_alter_axes.py
        test_apply.py
        test_analytics.py
        test_io.py
        test_combine_concat.py
        test_period.py
        test_indexing.py
        test_validate.py
        test_sorting.py
        test_internals.py
        test_rank.py
        test_datetime_values.py
        test_timeseries.py
        common.py
        __init__.py
        test_missing.py
        test_constructors.py
        test_replace.py
        test_quantile.py
        test_dtypes.py
        test_repr.py
        test_api.py
        test_operators.py
        test_asof.py
      - api
        test_types.py
        __init__.py
        test_api.py
      - test_multilevel.py
      - test_panel.py
      - scalar
        test_timestamp.py
        test_period.py
        test_interval.py
        test_period_asfreq.py
        __init__.py
        test_nat.py
        test_timedelta.py
      - util
        test_util.py
        test_testing.py
        __init__.py
        test_hashing.py
      - test_sorting.py
      - test_common.py
      - groupby
        test_categorical.py
        test_bin_groupby.py
        test_timegrouper.py
        test_index_as_string.py
        test_counting.py
        test_groupby.py
        test_aggregate.py
        common.py
        __init__.py
        test_nth.py
        test_value_counts.py
        test_whitelist.py
        test_transform.py
        test_filters.py
      - test_expressions.py
      - indexing
        test_categorical.py
        test_ix.py
        test_callable.py
        test_partial.py
        test_indexing.py
        test_coercion.py
        test_panel.py
        test_loc.py
        test_interval.py
        test_chaining_and_caching.py
        test_indexing_slow.py
        test_multiindex.py
        common.py
        __init__.py
        test_iloc.py
        test_datetime.py
        test_scalar.py
        test_floats.py
        test_timedelta.py
      - test_downstream.py
      - test_panelnd.py
      - data
        iris.csv
        tips.csv
      - test_config.py
      - reshape
        test_union_categoricals.py
        test_reshape.py
        test_tile.py
        test_util.py
        test_merge.py
        test_concat.py
        data
        allow_exact_matches_and_tolerance.csv
        cut_data.csv
        asof2.csv
        trades.csv
        quotes.csv
        tolerance.csv
        trades2.csv
        asof.csv
        allow_exact_matches.csv
        quotes2.csv
        __init__.py
        test_merge_ordered.py
        test_join.py
        test_merge_asof.py
        test_pivot.py
      - io
        test_feather.py
        generate_legacy_storage_files.py
        test_clipboard.py
        test_pickle.py
        test_excel.py
        test_s3.py
        test_sql.py
        sas
        test_sas.py
        test_xport.py
        test_sas7bdat.py
        data
        test14.sas7bdat
        test4.sas7bdat
        test6.sas7bdat
        test3.sas7bdat
        test16.sas7bdat
        test_12659.sas7bdat
        productsales.sas7bdat
        paxraw_d_short.xpt
        test_12659.csv
        test15.sas7bdat
        test11.sas7bdat
        paxraw_d_short.csv
        test7.sas7bdat
        SSHSV1_A.csv
        test13.sas7bdat
        productsales.csv
        test8.sas7bdat
        test9.sas7bdat
        test12.sas7bdat
        datetime.sas7bdat
        test1.sas7bdat
        test10.sas7bdat
        datetime.csv
        test2.sas7bdat
        airline.sas7bdat
        airline.csv
        SSHSV1_A.xpt
        test_sas7bdat_2.csv
        test5.sas7bdat
        test_sas7bdat_1.csv
        __init__.py
        msgpack
        test_buffer.py
        test_except.py
        test_format.py
        test_subtype.py
        test_seq.py
        test_unpack.py
        test_newspec.py
        test_read_size.py
        test_obj.py
        test_unpack_raw.py
        data
        frame.mp
        test_case.py
        common.py
        __init__.py
        test_sequnpack.py
        test_extension.py
        test_pack.py
        test_limits.py
        test_html.py
        test_common.py
        test_gbq.py
        test_stata.py
        test_packers.py
        data
        test_types.xls
        blank.xlsx
        test_multisheet.xls
        stata7_117.dta
        test1.xlsm
        test_types.xlsx
        iris.csv
        stata15.dta
        stata1_117.dta
        test1.xlsx
        banklist.html
        stata8_117.dta
        test3.xlsx
        S4_EDUC1.dta
        test_index_name_pre17.xlsm
        test5.xls
        blank_with_header.xlsm
        spam.html
        nyse_wsj.html
        blank_with_header.xlsx
        test2.xlsx
        times_1904.xlsx
        stata6_113.dta
        stata8_115.dta
        legacy_hdf
        pytables_native.h5
        datetimetz_object.h5
        pytables_native2.h5
        periodindex_0.20.1_x86_64_darwin_2.7.13.h5
        stata7_111.dta
        legacy_pickle
        0.16.0
        0.16.0_x86_64_darwin_2.7.9.pickle
        0.18.0
        0.18.0_AMD64_windows_2.7.11.pickle
        0.18.0_x86_64_darwin_2.7.11.pickle
        0.18.0_x86_64_darwin_3.5.1.pickle
        0.18.0_AMD64_windows_3.5.1.pickle
        0.14.0
        0.14.0_x86_64_darwin_2.7.6.pickle
        0.14.0_x86_64_linux_2.7.8.pickle
        0.19.2
        0.19.2_x86_64_darwin_2.7.12.pickle
        0.19.2_x86_64_darwin_2.7.14.pickle
        0.19.2_x86_64_darwin_3.6.1.pickle
        0.15.2
        0.15.2_x86_64_darwin_2.7.9.pickle
        0.18.1
        0.18.1_x86_64_darwin_2.7.12.pickle
        0.18.1_x86_64_darwin_3.5.2.pickle
        0.14.1
        0.14.1_x86_64_darwin_2.7.12.pickle
        0.14.1_x86_64_linux_2.7.8.pickle
        0.20.3
        0.20.3_x86_64_darwin_2.7.14.pickle
        0.12.0
        0.12.0_AMD64_windows_2.7.3.pickle
        0.12.0_x86_64_linux_2.7.3.pickle
        0.17.0
        0.17.0_x86_64_darwin_2.7.11.pickle
        0.17.1_AMD64_windows_2.7.11.pickle
        0.17.0_x86_64_linux_2.7.11.pickle
        0.17.0_x86_64_linux_3.4.4.pickle
        0.17.0_AMD64_windows_2.7.11.pickle
        0.17.0_AMD64_windows_3.4.4.pickle
        0.17.0_x86_64_darwin_3.5.3.pickle
        0.17.0_x86_64_darwin_3.4.4.pickle
        0.13.0
        0.13.0_x86_64_linux_2.7.8.pickle
        0.13.0_x86_64_linux_2.7.3.pickle
        0.13.0_x86_64_linux_3.3.0.pickle
        0.13.0_i686_linux_2.7.3.pickle
        0.13.0_x86_64_darwin_2.7.5.pickle
        0.13.0_i686_linux_2.6.5.pickle
        0.13.0_i686_linux_3.2.3.pickle
        0.13.0_AMD64_windows_2.7.3.pickle
        0.13.0_x86_64_darwin_2.7.6.pickle
        0.15.0
        0.15.0_x86_64_darwin_2.7.12.pickle
        0.15.0_x86_64_linux_2.7.8.pickle
        0.17.1
        0.17.1_AMD64_windows_2.7.11.pickle
        0.17.1_x86_64_darwin_2.7.11.pickle
        0.11.0
        0.11.0_x86_64_linux_3.3.0.pickle
        x86_64_linux_2.7.3.pickle
        x86_64_linux_3.3.0.pickle
        0.10.1
        x86_64_linux_2.7.3.pickle
        AMD64_windows_2.7.3.pickle
        0.16.2
        0.16.2_x86_64_linux_2.7.10.pickle
        0.16.2_x86_64_linux_3.4.3.pickle
        0.16.2_AMD64_windows_3.4.3.pickle
        0.16.2_AMD64_windows_2.7.10.pickle
        0.16.2_x86_64_darwin_2.7.10.pickle
        0.16.2_x86_64_darwin_3.4.3.pickle
        0.16.2_x86_64_darwin_2.7.9.pickle
        valid_markup.html
        gbq_fake_job.txt
        testdtype.xlsm
        testdateoverflow.xls
        stata5_115.dta
        stata4_117.dta
        times_1904.xls
        stata1_114.dta
        stata5_113.dta
        test2.xls
        testdateoverflow.xlsm
        stata12_117.dta
        stata11_115.dta
        times_1900.xlsx
        stata4_115.dta
        test_converters.xlsx
        stata4_113.dta
        blank.xls
        stata6_115.dta
        computer_sales_page.html
        test_multisheet.xlsm
        stata6.csv
        stata5_114.dta
        stata2_115.dta
        stata7_115.dta
        stata3_113.dta
        stata4_114.dta
        test_types.xlsm
        test_index_name_pre17.xlsx
        banklist.csv
        test1.xls
        stata9_115.dta
        test3.xlsm
        html_encoding
        chinese_utf-16.html
        letz_latin1.html
        chinese_utf-8.html
        chinese_utf-32.html
        testskiprows.xlsx
        stata11_117.dta
        stata6_114.dta
        blank_with_header.xls
        test2.xlsm
        test5.xlsx
        stata5_117.dta
        stata3_115.dta
        times_1904.xlsm
        testmultiindex.xls
        testmultiindex.xlsm
        testmultiindex.xlsx
        times_1900.xlsm
        categorical_0_15_2.pickle
        macau.html
        test4.xlsx
        times_1900.xls
        testdtype.xlsx
        test4.xlsm
        stata10_115.dta
        tips.csv
        stata6_117.dta
        stata2_113.dta
        testdtype.xls
        stata2_117.dta
        legacy_msgpack
        0.16.0
        0.16.0_x86_64_darwin_2.7.9.msgpack
        0.18.0
        0.18.0_x86_64_darwin_3.5.1.msgpack
        0.18.0_AMD64_windows_2.7.11.msgpack
        0.18.0_AMD64_windows_3.5.1.msgpack
        0.18.0_x86_64_darwin_2.7.11.msgpack
        0.19.2
        0.19.2_x86_64_darwin_3.6.1.msgpack
        0.19.2_x86_64_darwin_2.7.12.msgpack
        0.18.1
        0.18.1_x86_64_darwin_2.7.12.msgpack
        0.18.1_x86_64_darwin_3.5.2.msgpack
        0.17.0
        0.17.0_x86_64_darwin_2.7.11.msgpack
        0.17.1_AMD64_windows_3.5.1.msgpack
        0.17.0_x86_64_darwin_3.4.4.msgpack
        0.17.0_x86_64_linux_3.4.4.msgpack
        0.17.0_AMD64_windows_2.7.11.msgpack
        0.17.1_AMD64_windows_2.7.11.msgpack
        0.17.0_AMD64_windows_3.4.4.msgpack
        0.17.0_x86_64_linux_2.7.11.msgpack
        0.17.1
        0.17.1_x86_64_darwin_3.5.1.msgpack
        0.17.1_AMD64_windows_3.5.1.msgpack
        0.17.1_x86_64_linux_2.7.11.msgpack
        0.17.1_x86_64_darwin_2.7.11.msgpack
        0.17.1_AMD64_windows_2.7.11.msgpack
        0.17.1_x86_64_linux_3.4.4.msgpack
        0.16.2
        0.16.2_x86_64_darwin_2.7.9.msgpack
        0.16.2_AMD64_windows_3.4.3.msgpack
        0.16.2_AMD64_windows_2.7.10.msgpack
        0.16.2_x86_64_linux_2.7.10.msgpack
        0.16.2_x86_64_darwin_3.4.3.msgpack
        0.16.2_x86_64_darwin_2.7.10.msgpack
        0.16.2_x86_64_linux_3.4.3.msgpack
        stata9_117.dta
        test_multisheet.xlsx
        test_squeeze.xls
        fixed_width_format.txt
        stata5.csv
        testskiprows.xlsm
        testdateoverflow.xlsx
        wikipedia_states.html
        test_index_name_pre17.xls
        categorical_0_14_1.pickle
        stata2_114.dta
        test_mmap.csv
        test_converters.xls
        test3.xls
        stata10_117.dta
        stata3_114.dta
        stata3.csv
        testskiprows.xls
        stata3_117.dta
        test_squeeze.xlsm
        test_converters.xlsm
        stata14_118.dta
        test_squeeze.xlsx
        test1.csv
        test5.xlsm
        test4.xls
        stata8_113.dta
        blank.xlsm
        stata1_encoding.dta
        __init__.py
        json
        test_compression.py
        test_pandas.py
        test_readlines.py
        test_json_table_schema.py
        test_normalize.py
        data
        tsframe_iso_v012.json
        tsframe_v012.json
        tsframe_v012.json.zip
        __init__.py
        test_ujson.py
        test_parquet.py
        parser
        test_textreader.py
        dialect.py
        test_network.py
        multithread.py
        mangle_dupes.py
        index_col.py
        test_read_fwf.py
        parse_dates.py
        python_parser_only.py
        skiprows.py
        usecols.py
        compression.py
        comment.py
        header.py
        quoting.py
        na_values.py
        data
        iris.csv
        test2.csv
        salaries.csv.bz2
        tips.csv.gz
        tar_csv.tar.gz
        salaries.csv
        sub_char.csv
        tips.csv
        tar_csv.tar
        test1.csv.gz
        unicode_series.csv
        tips.csv.bz2
        test_mmap.csv
        sauron.SHIFT_JIS.csv
        test1.csv.bz2
        utf16_ex.txt
        test1.csv
        salaries.csv.gz
        converters.py
        test_parsers.py
        common.py
        __init__.py
        c_parser_only.py
        test_unsupported.py
        dtypes.py
        formats
        test_format.py
        test_eng_formatting.py
        test_style.py
        test_to_csv.py
        data
        unicode_series.csv
        __init__.py
        test_css.py
        test_to_html.py
        test_printing.py
        test_to_excel.py
        test_to_latex.py
      - __init__.py
      - test_panel4d.py
      - test_join.py
      - tools
        test_numeric.py
        __init__.py
      - test_nanops.py
      - plotting
        test_frame.py
        test_misc.py
        test_converter.py
        test_boxplot_method.py
        test_deprecated.py
        test_hist_method.py
        test_groupby.py
        common.py
        __init__.py
        test_datetimelike.py
        test_series.py
      - indexes
        test_base.py
        datetimelike.py
        timedeltas
        test_setops.py
        test_indexing.py
        test_ops.py
        test_construction.py
        test_timedelta_range.py
        test_astype.py
        __init__.py
        test_tools.py
        test_partial_slicing.py
        test_timedelta.py
        test_category.py
        test_numeric.py
        test_interval.py
        test_frozen.py
        data
        mindex_073.pickle
        multiindex_v1.pickle
        test_multi.py
        common.py
        __init__.py
        test_range.py
        period
        test_setops.py
        test_period.py
        test_indexing.py
        test_asfreq.py
        test_period_range.py
        test_ops.py
        test_construction.py
        __init__.py
        test_tools.py
        test_partial_slicing.py
        test_formats.py
        conftest.py
        datetimes
        test_misc.py
        test_setops.py
        test_indexing.py
        test_ops.py
        test_construction.py
        test_astype.py
        __init__.py
        test_datetimelike.py
        test_tools.py
        test_partial_slicing.py
        test_missing.py
        test_datetime.py
        test_formats.py
        test_date_range.py
      - dtypes
        test_io.py
        test_cast.py
        test_common.py
        test_inference.py
        test_concat.py
        test_generic.py
        __init__.py
        test_missing.py
        test_dtypes.py
    - _version.py
    - tools
      - plotting.py
      - __init__.py
      - merge.py
      - hashing.py
    - core
      - groupby.py
      - config_init.py
      - index.py
      - sparse
        list.py
        frame.py
        api.py
        scipy_sparse.py
        array.py
        series.py
        __init__.py
      - accessor.py
      - resample.py
      - internals.py
      - config.py
      - ops.py
      - panel.py
      - datetools.py
      - computation
        eval.py
        ops.py
        engines.py
        expressions.py
        check.py
        api.py
        scope.py
        common.py
        __init__.py
        expr.py
        align.py
        pytables.py
      - panel4d.py
      - panelnd.py
      - window.py
      - util
        __init__.py
        hashing.py
      - nanops.py
      - indexing.py
      - api.py
      - reshape
        tile.py
        pivot.py
        util.py
        api.py
        __init__.py
        concat.py
        reshape.py
        merge.py
      - missing.py
      - series.py
      - common.py
      - __init__.py
      - algorithms.py
      - strings.py
      - tools
        datetimes.py
        timedeltas.py
        __init__.py
        numeric.py
      - categorical.py
      - indexes
        range.py
        period.py
        datetimes.py
        datetimelike.py
        category.py
        frozen.py
        api.py
        timedeltas.py
        accessors.py
        multi.py
        __init__.py
        numeric.py
        interval.py
        base.py
      - dtypes
        cast.py
        generic.py
        api.py
        missing.py
        common.py
        __init__.py
        inference.py
        concat.py
        dtypes.py
      - base.py
      - sorting.py
    - tslib.py
    - stats
      - moments.py
      - api.py
      - __init__.py
    - errors
      - __init__.py
    - plotting
      - _style.py
      - _timeseries.py
      - _tools.py
      - _converter.py
      - _core.py
      - _misc.py
      - _compat.py
      - __init__.py
    - conftest.py
    - formats
      - __init__.py
      - style.py
    - json.py
  - pandas-0.21.0.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - requests-2.9.1.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - pytz-2017.3.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - zip-safe
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - validators-0.12.0.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - ingest_intel_lambda.py
  - python_dateutil-2.6.1.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - zip-safe
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - dateutil
    - _common.py
    - tz
      - win.py
      - _common.py
      - tz.py
      - __init__.py
    - rrule.py
    - __init__.py
    - parser.py
    - _version.py
    - easter.py
    - tzwin.py
    - zoneinfo
      - rebuild.py
      - dateutil-zoneinfo.tar.gz
      - __init__.py
    - relativedelta.py
  - ioc_feed_parser.py
  - numpy
    - _import_tools.py
    - _globals.py
    - .libs
    - distutils
      - log.py
      - ccompiler.py
      - line_endings.py
      - misc_util.py
      - conv_template.py
      - __version__.py
      - unixccompiler.py
      - exec_command.py
      - msvccompiler.py
      - npy_pkg_config.py
      - msvc9compiler.py
      - system_info.py
      - numpy_distribution.py
      - from_template.py
      - mingw
        gfortran_vs2003_hack.c
      - info.py
      - setup.py
      - mingw32ccompiler.py
      - pathccompiler.py
      - intelccompiler.py
      - __config__.py
      - lib2def.py
      - __init__.py
      - tests
        test_system_info.py
        test_misc_util.py
        test_fcompiler_gnu.py
        test_exec_command.py
        test_npy_pkg_config.py
        test_fcompiler_intel.py
      - core.py
      - cpuinfo.py
      - command
        build.py
        bdist_rpm.py
        install_data.py
        build_ext.py
        config.py
        install_clib.py
        build_clib.py
        egg_info.py
        config_compiler.py
        autodist.py
        build_py.py
        sdist.py
        __init__.py
        develop.py
        install_headers.py
        build_scripts.py
        install.py
        build_src.py
      - compat.py
      - extension.py
      - environment.py
      - fcompiler
        absoft.py
        nag.py
        ibm.py
        hpux.py
        vast.py
        g95.py
        intel.py
        none.py
        gnu.py
        __init__.py
        pathf95.py
        mips.py
        sun.py
        pg.py
        lahey.py
        compaq.py
    - _distributor_init.py
    - version.py
    - polynomial
      - hermite.py
      - chebyshev.py
      - polynomial.py
      - _polybase.py
      - laguerre.py
      - legendre.py
      - setup.py
      - __init__.py
      - polyutils.py
      - tests
        test_polynomial.py
        test_chebyshev.py
        test_hermite.py
        test_laguerre.py
        test_classes.py
        test_hermite_e.py
        test_printing.py
        test_legendre.py
        test_polyutils.py
      - hermite_e.py
    - compat
      - setup.py
      - __init__.py
      - _inspect.py
      - py3k.py
    - lib
      - arraypad.py
      - recfunctions.py
      - polynomial.py
      - _datasource.py
      - function_base.py
      - ufunclike.py
      - type_check.py
      - index_tricks.py
      - _iotools.py
      - financial.py
      - info.py
      - stride_tricks.py
      - setup.py
      - nanfunctions.py
      - arraysetops.py
      - shape_base.py
      - user_array.py
      - __init__.py
      - utils.py
      - tests
        test_polynomial.py
        test_mixins.py
        test_recfunctions.py
        test_index_tricks.py
        test_format.py
        test_utils.py
        test__datasource.py
        test__version.py
        test_stride_tricks.py
        test_io.py
        test_nanfunctions.py
        test_shape_base.py
        test_arraypad.py
        test_packbits.py
        test_arrayterator.py
        test_financial.py
        test_type_check.py
        test_twodim_base.py
        test_regression.py
        data
        win64python2.npy
        py3-objarr.npy
        py2-objarr.npz
        py2-objarr.npy
        py3-objarr.npz
        python3.npy
        test__iotools.py
        test_arraysetops.py
        test_ufunclike.py
        test_function_base.py
      - _version.py
      - scimath.py
      - mixins.py
      - npyio.py
      - arrayterator.py
      - twodim_base.py
      - format.py
    - fft
      - fftpack_lite.cpython-36m-x86_64-linux-gnu.so
      - info.py
      - setup.py
      - __init__.py
      - tests
        test_helper.py
        test_fftpack.py
      - helper.py
      - fftpack.py
    - ma
      - version.py
      - extras.py
      - testutils.py
      - setup.py
      - bench.py
      - __init__.py
      - mrecords.py
      - tests
        test_subclassing.py
        test_extras.py
        test_old_ma.py
        test_regression.py
        test_mrecords.py
        test_deprecations.py
        test_core.py
      - timer_comparison.py
    - ctypeslib.py
    - setup.py
    - f2py
      - src
        fortranobject.h
        fortranobject.c
      - rules.py
      - func2subr.py
      - __version__.py
      - crackfortran.py
      - f2py_testing.py
      - f90mod_rules.py
      - f2py2e.py
      - info.py
      - setup.py
      - common_rules.py
      - auxfuncs.py
      - __main__.py
      - capi_maps.py
      - __init__.py
      - use_rules.py
      - tests
        src
        assumed_shape
        foo_mod.f90
        .f2py_f2cmap
        foo_use.f90
        foo_free.f90
        precision.f90
        mixed
        foo.f
        foo_fixed.f90
        foo_free.f90
        size
        foo.f90
        parameter
        constant_real.f90
        constant_both.f90
        constant_compound.f90
        constant_non_compound.f90
        constant_integer.f90
        common
        block.f
        kind
        foo.f90
        regression
        inout.f90
        array_from_pyobj
        wrapmodule.c
        string
        char.f90
        util.py
        test_return_integer.py
        test_return_real.py
        test_array_from_pyobj.py
        test_mixed.py
        test_return_logical.py
        test_assumed_shape.py
        test_kind.py
        test_string.py
        test_parameter.py
        test_common.py
        test_regression.py
        test_return_complex.py
        test_callback.py
        test_return_character.py
        test_size.py
      - cb_rules.py
      - diagnose.py
      - cfuncs.py
    - __config__.py
    - __init__.py
    - tests
      - test_warnings.py
      - test_scripts.py
      - test_numpy_version.py
      - test_matlib.py
      - test_reloading.py
      - test_ctypeslib.py
    - random
      - info.py
      - setup.py
      - __init__.py
      - tests
        test_random.py
        test_regression.py
      - randomkit.h
    - core
      - operand_flag_tests.cpython-36m-x86_64-linux-gnu.so
      - include
        numpy
        _neighborhood_iterator_imp.h
        noprefix.h
        npy_cpu.h
        npy_3kcompat.h
        old_defines.h
        npy_os.h
        oldnumeric.h
        ndarraytypes.h
        numpyconfig.h
        __multiarray_api.h
        multiarray_api.txt
        npy_math.h
        npy_endian.h
        halffloat.h
        __ufunc_api.h
        ufuncobject.h
        utils.h
        _numpyconfig.h
        npy_common.h
        npy_no_deprecated_api.h
        npy_interrupt.h
        ufunc_api.txt
        npy_1_7_deprecated_api.h
        ndarrayobject.h
        arrayscalars.h
        arrayobject.h
      - einsumfunc.py
      - numerictypes.py
      - getlimits.py
      - machar.py
      - setup_common.py
      - _dummy.cpython-36m-x86_64-linux-gnu.so
      - function_base.py
      - fromnumeric.py
      - lib
        npy-pkg-config
        npymath.ini
        mlib.ini
      - arrayprint.py
      - umath_tests.cpython-36m-x86_64-linux-gnu.so
      - memmap.py
      - info.py
      - setup.py
      - shape_base.py
      - _internal.py
      - __init__.py
      - numeric.py
      - struct_ufunc_test.cpython-36m-x86_64-linux-gnu.so
      - defchararray.py
      - tests
        test_ufunc.py
        test_nditer.py
        test_item_selection.py
        test_defchararray.py
        test_scalarinherit.py
        test_extint128.py
        test_shape_base.py
        test_getlimits.py
        test_einsum.py
        test_scalarmath.py
        test_unicode.py
        test_indexing.py
        test_numeric.py
        test_umath_complex.py
        test_half.py
        test_longdouble.py
        test_abc.py
        test_errstate.py
        test_arrayprint.py
        test_regression.py
        data
        astype_copy.pkl
        recarray_from_file.fits
        test_memmap.py
        test_numerictypes.py
        test_print.py
        test_scalarprint.py
        test_machar.py
        test_records.py
        test_datetime.py
        test_dtype.py
        test_deprecations.py
        test_umath.py
        test_api.py
        test_function_base.py
        test_mem_overlap.py
        test_indexerrors.py
      - records.py
      - cversions.py
      - _methods.py
      - generate_numpy_api.py
    - linalg
      - info.py
      - setup.py
      - lapack_lite.cpython-36m-x86_64-linux-gnu.so
      - linalg.py
      - __init__.py
      - tests
        test_linalg.py
        test_regression.py
        test_build.py
        test_deprecations.py
    - matlib.py
    - matrixlib
      - defmatrix.py
      - setup.py
      - __init__.py
      - tests
        test_defmatrix.py
        test_numeric.py
        test_multiarray.py
        test_regression.py
    - doc
      - ufuncs.py
      - creation.py
      - misc.py
      - internals.py
      - glossary.py
      - subclassing.py
      - indexing.py
      - constants.py
      - structured_arrays.py
      - basics.py
      - __init__.py
      - byteswapping.py
      - broadcasting.py
    - dual.py
    - testing
      - nosetester.py
      - decorators.py
      - noseclasses.py
      - print_coercion_tables.py
      - setup.py
      - __init__.py
      - utils.py
      - tests
        test_utils.py
        test_decorators.py
        test_doctesting.py
  - __init__.py
  - aws_requests_auth-0.3.3.dist-info
    - METADATA
    - top_level.txt
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - decorator-4.1.2.dist-info
    - METADATA
    - top_level.txt
    - pbr.json
    - metadata.json
    - WHEEL
    - INSTALLER
    - DESCRIPTION.rst
    - RECORD
  - requirements.txt
  - es.py
  - pytz
    - lazy.py
    - exceptions.py
    - tzfile.py
    - __init__.py
    - tzinfo.py
    - reference.py
    - zoneinfo
      - MET
      - Iceland
      - CET
      - Universal
      - Cuba
      - zone.tab
      - Canada
        Eastern
        Newfoundland
        Mountain
        Saskatchewan
        Atlantic
        Central
        Yukon
        Pacific
      - Japan
      - Navajo
      - Egypt
      - MST
      - Kwajalein
      - Asia
        Yangon
        Makassar
        Kolkata
        Dushanbe
        Aqtau
        Choibalsan
        Tokyo
        Ujung_Pandang
        Phnom_Penh
        Irkutsk
        Ho_Chi_Minh
        Tehran
        Dubai
        Kathmandu
        Thimbu
        Pontianak
        Chita
        Chongqing
        Hovd
        Bangkok
        Yekaterinburg
        Magadan
        Seoul
        Chungking
        Katmandu
        Muscat
        Colombo
        Ulaanbaatar
        Hong_Kong
        Vladivostok
        Qatar
        Aqtobe
        Aden
        Jerusalem
        Dili
        Urumqi
        Baku
        Istanbul
        Macao
        Bahrain
        Calcutta
        Thimphu
        Ust-Nera
        Famagusta
        Manila
        Krasnoyarsk
        Singapore
        Tomsk
        Oral
        Qyzylorda
        Nicosia
        Ulan_Bator
        Ashkhabad
        Omsk
        Bishkek
        Kamchatka
        Yakutsk
        Kabul
        Ashgabat
        Almaty
        Amman
        Baghdad
        Riyadh
        Khandyga
        Karachi
        Brunei
        Saigon
        Tashkent
        Srednekolymsk
        Gaza
        Beirut
        Tbilisi
        Barnaul
        Dacca
        Vientiane
        Kuching
        Jakarta
        Yerevan
        Kuala_Lumpur
        Jayapura
        Pyongyang
        Hebron
        Novosibirsk
        Tel_Aviv
        Atyrau
        Anadyr
        Kashgar
        Damascus
        Shanghai
        Kuwait
        Macau
        Novokuznetsk
        Rangoon
        Sakhalin
        Taipei
        Harbin
        Dhaka
        Samarkand
      - Europe
        Jersey
        Vilnius
        Sofia
        Lisbon
        Ulyanovsk
        Minsk
        Volgograd
        Budapest
        Uzhgorod
        Zurich
        Guernsey
        Zagreb
        Berlin
        London
        Luxembourg
        Warsaw
        Samara
        Paris
        Podgorica
        Busingen
        Tirane
        Brussels
        Istanbul
        San_Marino
        Chisinau
        Kiev
        Monaco
        Nicosia
        Vaduz
        Malta
        Prague
        Rome
        Sarajevo
        Ljubljana
        Moscow
        Madrid
        Bratislava
        Kaliningrad
        Andorra
        Gibraltar
        Belfast
        Amsterdam
        Copenhagen
        Skopje
        Dublin
        Tallinn
        Riga
        Mariehamn
        Helsinki
        Isle_of_Man
        Saratov
        Tiraspol
        Bucharest
        Stockholm
        Vatican
        Vienna
        Kirov
        Belgrade
        Simferopol
        Astrakhan
        Athens
        Zaporozhye
        Oslo
      - posixrules
      - iso3166.tab
      - zone1970.tab
      - Zulu
      - PST8PDT
      - Mexico
        General
        BajaNorte
        BajaSur
      - Turkey
      - PRC
      - NZ-CHAT
      - GMT0
      - EET
      - Factory
      - Antarctica
        Syowa
        Casey
        Palmer
        McMurdo
        South_Pole
        Mawson
        DumontDUrville
        Macquarie
        Rothera
        Davis
        Troll
        Vostok
      - Poland
      - W-SU
      - ROK
      - GMT-0
      - America
        Rankin_Inlet
        North_Dakota
        Beulah
        New_Salem
        Center
        Ensenada
        Edmonton
        Virgin
        Anguilla
        Rosario
        Araguaina
        Punta_Arenas
        Rainy_River
        Caracas
        Maceio
        Martinique
        Kralendijk
        St_Barthelemy
        Fort_Wayne
        Vancouver
        Santo_Domingo
        Moncton
        Montreal
        Whitehorse
        Godthab
        Dominica
        Cambridge_Bay
        New_York
        Kentucky
        Monticello
        Louisville
        Havana
        Rio_Branco
        Antigua
        Phoenix
        St_Kitts
        St_Vincent
        Indianapolis
        Swift_Current
        Matamoros
        Montserrat
        Anchorage
        Inuvik
        Guadeloupe
        Curacao
        Panama
        Manaus
        Halifax
        Bahia
        Tijuana
        Tegucigalpa
        Costa_Rica
        Port-au-Prince
        Atka
        Creston
        Chihuahua
        Santarem
        Lima
        Thule
        Sao_Paulo
        Regina
        Denver
        Buenos_Aires
        Adak
        Danmarkshavn
        Tortola
        Shiprock
        Bahia_Banderas
        Porto_Acre
        Nome
        Scoresbysund
        Guyana
        Managua
        Recife
        Nipigon
        Resolute
        Bogota
        Blanc-Sablon
        Chicago
        Iqaluit
        Jamaica
        Cuiaba
        Indiana
        Indianapolis
        Tell_City
        Vincennes
        Vevay
        Winamac
        Knox
        Marengo
        Petersburg
        Coral_Harbour
        Jujuy
        Guatemala
        Montevideo
        Guayaquil
        Dawson_Creek
        Santiago
        Cayman
        Miquelon
        Dawson
        Cordoba
        Detroit
        Merida
        Boa_Vista
        Boise
        Glace_Bay
        Barbados
        La_Paz
        Grand_Turk
        Belem
        Aruba
        Mendoza
        El_Salvador
        Goose_Bay
        St_Lucia
        Mexico_City
        Porto_Velho
        Santa_Isabel
        Pangnirtung
        Los_Angeles
        Metlakatla
        Hermosillo
        Paramaribo
        Juneau
        Yellowknife
        Grenada
        Louisville
        Eirunepe
        Puerto_Rico
        Lower_Princes
        Campo_Grande
        Noronha
        Toronto
        St_Johns
        Argentina
        La_Rioja
        San_Juan
        Ushuaia
        Salta
        Buenos_Aires
        San_Luis
        Jujuy
        Cordoba
        ComodRivadavia
        Mendoza
        Tucuman
        Rio_Gallegos
        Catamarca
        Cayenne
        Ojinaga
        Fort_Nelson
        Marigot
        Winnipeg
        Sitka
        Asuncion
        Mazatlan
        Monterrey
        Menominee
        Fortaleza
        St_Thomas
        Port_of_Spain
        Catamarca
        Cancun
        Thunder_Bay
        Yakutat
        Knox_IN
        Atikokan
        Belize
        Nassau
      - tzdata.zi
      - Africa
        Sao_Tome
        Nouakchott
        Abidjan
        Conakry
        Mbabane
        Windhoek
        Porto-Novo
        Brazzaville
        Bamako
        Lome
        Ouagadougou
        Gaborone
        Dar_es_Salaam
        Douala
        Timbuktu
        Monrovia
        Ndjamena
        Mogadishu
        Asmera
        Kinshasa
        Kigali
        Maputo
        El_Aaiun
        Blantyre
        Lubumbashi
        Niamey
        Juba
        Kampala
        Malabo
        Casablanca
        Algiers
        Luanda
        Bangui
        Maseru
        Lagos
        Ceuta
        Tunis
        Asmara
        Johannesburg
        Bujumbura
        Tripoli
        Freetown
        Lusaka
        Harare
        Addis_Ababa
        Banjul
        Bissau
        Cairo
        Nairobi
        Dakar
        Accra
        Djibouti
        Libreville
        Khartoum
      - Israel
      - Portugal
      - Indian
        Comoro
        Mayotte
        Mahe
        Mauritius
        Cocos
        Maldives
        Kerguelen
        Reunion
        Antananarivo
        Christmas
        Chagos
      - localtime
      - EST5EDT
      - EST
      - Singapore
      - Jamaica
      - Chile
        EasterIsland
        Continental
      - US
        Eastern
        Alaska
        Mountain
        Hawaii
        Samoa
        Indiana-Starke
        Arizona
        Central
        East-Indiana
        Aleutian
        Pacific-New
        Michigan
        Pacific
      - Libya
      - Iran
      - Etc
        GMT+12
        Universal
        GMT-9
        GMT-4
        GMT-10
        GMT+9
        Zulu
        GMT+4
        GMT-3
        GMT0
        GMT-6
        GMT+2
        GMT-7
        GMT-5
        GMT-0
        GMT-11
        GMT+10
        GMT-14
        GMT-12
        GMT-2
        GMT+1
        GMT+6
        GMT+8
        UCT
        GMT+11
        GMT
        GMT-8
        GMT+3
        Greenwich
        UTC
        GMT-1
        GMT+0
        GMT+5
        GMT+7
        GMT-13
      - WET
      - UCT
      - Australia
        Perth
        Tasmania
        Queensland
        Lindeman
        Victoria
        North
        South
        Adelaide
        Sydney
        Eucla
        Yancowinna
        Melbourne
        West
        Hobart
        LHI
        Canberra
        Lord_Howe
        Broken_Hill
        NSW
        Darwin
        Brisbane
        ACT
        Currie
      - GMT
      - Atlantic
        Faeroe
        St_Helena
        Canary
        Azores
        South_Georgia
        Reykjavik
        Cape_Verde
        Bermuda
        Faroe
        Jan_Mayen
        Stanley
        Madeira
      - Hongkong
      - HST
      - Eire
      - Arctic
        Longyearbyen
      - Greenwich
      - UTC
      - CST6CDT
      - Brazil
        Acre
        West
        DeNoronha
        East
      - GMT+0
      - MST7MDT
      - GB
      - ROC
      - NZ
      - GB-Eire
      - Pacific
        Rarotonga
        Marquesas
        Chuuk
        Kwajalein
        Tongatapu
        Norfolk
        Guam
        Tahiti
        Apia
        Easter
        Wallis
        Funafuti
        Galapagos
        Pitcairn
        Guadalcanal
        Kiritimati
        Nauru
        Saipan
        Samoa
        Honolulu
        Enderbury
        Ponape
        Port_Moresby
        Johnston
        Kosrae
        Midway
        Efate
        Niue
        Auckland
        Pago_Pago
        Yap
        Palau
        Noumea
        Pohnpei
        Fakaofo
        Tarawa
        Wake
        Chatham
        Gambier
        Majuro
        Bougainville
        Fiji
        Truk
      - leapseconds
  - lambda.zip
  - requests
    - exceptions.py
    - sessions.py
    - hooks.py
    - status_codes.py
    - adapters.py
    - models.py
    - api.py
    - packages
      - chardet
        euctwfreq.py
        gb2312freq.py
        chardetect.py
        charsetgroupprober.py
        sbcharsetprober.py
        langhebrewmodel.py
        codingstatemachine.py
        big5prober.py
        langhungarianmodel.py
        mbcharsetprober.py
        langgreekmodel.py
        charsetprober.py
        euctwprober.py
        eucjpprober.py
        mbcsgroupprober.py
        escprober.py
        langbulgarianmodel.py
        utf8prober.py
        euckrfreq.py
        universaldetector.py
        mbcssm.py
        sbcsgroupprober.py
        hebrewprober.py
        constants.py
        sjisprober.py
        langthaimodel.py
        cp949prober.py
        latin1prober.py
        chardistribution.py
        __init__.py
        gb2312prober.py
        escsm.py
        big5freq.py
        compat.py
        euckrprober.py
        langcyrillicmodel.py
        jisfreq.py
        jpcntx.py
      - urllib3
        fields.py
        request.py
        exceptions.py
        _collections.py
        util
        request.py
        response.py
        ssl_.py
        connection.py
        timeout.py
        __init__.py
        retry.py
        url.py
        response.py
        packages
        six.py
        ordered_dict.py
        __init__.py
        ssl_match_hostname
        _implementation.py
        __init__.py
        connection.py
        __init__.py
        poolmanager.py
        contrib
        appengine.py
        pyopenssl.py
        ntlmpool.py
        __init__.py
        connectionpool.py
        filepost.py
      - __init__.py
    - __init__.py
    - utils.py
    - auth.py
    - cookies.py
    - structures.py
    - compat.py
    - certs.py
- feeds.d
  - malware.json
  - general.json
  - example.json.bak
  - misc_ipaddress.json
  - uce_protect.json
  - ransomware.json
  - blocklist_dot_de.json
  - bambenek.json
  - misc_domains.json
  - misc_url.json
  - threatexchange.json.bak
  - phishing.json
  - feodo.json
  - nothink.json
- feed_scheduler_lambda
  - __init__.py
  - feed_scheduler_lambda.py
  - lambda.zip

# -*- coding: utf-8 -*-
# pylint: disable-msg=E1101,W0612

from datetime import datetime, timedelta
import pytest
import re

from numpy import nan as NA
import numpy as np
from numpy.random import randint

from pandas.compat import range, u
import pandas.compat as compat
from pandas import Index, Series, DataFrame, isna, MultiIndex, notna

from pandas.util.testing import assert_series_equal
import pandas.util.testing as tm

import pandas.core.strings as strings


class TestStringMethods(object):

    def test_api(self):
        # The accessor class is reachable from Series and is what an
        # object-dtype Series of strings hands back.
        # GH 6106, GH 9322
        accessor_cls = strings.StringMethods
        assert Series.str is accessor_cls
        assert isinstance(Series(['']).str, accessor_cls)

        # GH 9184
        # a Series holding integers must refuse the accessor, and the
        # refusal has to look like a missing attribute to ``hasattr``
        numeric = Series([1])
        with tm.assert_raises_regex(AttributeError,
                                    "only use .str accessor"):
            numeric.str
        assert not hasattr(numeric, 'str')

    def test_iter(self):
        # GH3638
        words = Series(('google', 'wikimedia', 'wikipedia', 'wikitravel'))

        for column in words.str:
            # whatever the iterator produces has to be a Series ...
            assert isinstance(column, Series)

            # ... carrying the very same index as the Series being iterated
            tm.assert_index_equal(column.index, words.index)

            # ... whose entries are all either a basestring/str or nan
            assert all(isinstance(item, compat.string_types) or isna(item)
                       for item in column)

        # iteration should go on until the next step would be entirely nan,
        # hence the final Series must hold only the trailing 'l' of
        # 'wikitravel', which is the longest of the words
        assert column.dropna().values.item() == 'l'

    def test_iter_empty(self):
        empty = Series([], dtype=object)

        # sentinels that the loop would overwrite if it ran even once
        position = 100
        item = 1

        for position, item in enumerate(empty.str):
            pass

        # there is nothing to iterate over, so the loop never rebinds the
        # names and both sentinels must still hold their initial values
        assert position == 100
        assert item == 1

    def test_iter_single_element(self):
        single = Series(['a'])

        for position, column in enumerate(single.str):
            pass

        # the loop must have stopped after its first pass (index 0), and
        # what it yielded there has to equal the original Series
        assert position == 0
        assert_series_equal(single, column)

    def test_iter_object_try_string(self):
        # a Series whose elements are slice objects rather than strings
        slices = [slice(None, randint(10), randint(10, 20))
                  for _ in range(4)]
        ds = Series(slices)

        # sentinels that only survive if the loop body is never entered
        position = 100
        item = 'h'

        for position, item in enumerate(ds.str):
            pass

        assert position == 100
        assert item == 'h'

    def test_cat(self):
        first = np.array(['a', 'a', 'b', 'b', 'c', NA], dtype=np.object_)
        second = np.array(['a', NA, 'b', 'd', 'foo', NA], dtype=np.object_)

        # single array: (input, keyword arguments, expected joined string)
        scalar_cases = [
            (first, {}, 'aabbc'),
            (first, {'na_rep': 'NA'}, 'aabbcNA'),
            (first, {'na_rep': '-'}, 'aabbc-'),
            (first, {'sep': '_', 'na_rep': 'NA'}, 'a_a_b_b_c_NA'),
            (second, {'sep': '-'}, 'a-b-d-foo'),
        ]
        for arr, kwargs, expected in scalar_cases:
            assert strings.str_cat(arr, **kwargs) == expected

        # Multiple arrays: with a replacement text every slot is filled in
        filled = strings.str_cat(first, [second], na_rep='NA')
        tm.assert_numpy_array_equal(
            filled,
            np.array(['aa', 'aNA', 'bb', 'bd', 'cfoo', 'NANA'],
                     dtype=np.object_))

        # ... while without one the expected output keeps NA wherever either
        # input has it
        propagated = strings.str_cat(first, second)
        tm.assert_almost_equal(
            propagated,
            np.array(['aa', NA, 'bb', 'bd', 'cfoo', NA], dtype=np.object_))

    def test_count(self):
        def check(data, pat, counts):
            # the module-level function is compared as a plain ndarray
            tm.assert_numpy_array_equal(strings.str_count(data, pat),
                                        np.array(counts))

            # the accessor must give back a Series with the same counts
            via_accessor = Series(data).str.count(pat)
            expected = Series(counts)
            assert isinstance(via_accessor, Series)
            tm.assert_series_equal(via_accessor, expected)

        check(np.array(['foo', 'foofoo', NA, 'foooofooofommmfoo'],
                       dtype=np.object_),
              'f[o]+',
              [1, 2, NA, 4])

        # mixed
        check(['a', NA, 'b', True, datetime.today(), 'foo', None, 1, 2.],
              'a',
              [1, NA, 0, NA, NA, 0, NA, NA, NA])

        # unicode
        check([u('foo'), u('foofoo'), NA, u('foooofooofommmfoo')],
              'f[o]+',
              [1, 2, NA, 4])

    def test_contains(self):
        regex_pat = 'mmm[_]+'
        obj_values = np.array(['foo', NA, 'fooommm__foo',
                               'mmm_', 'foommm[_]+bar'], dtype=np.object_)

        # default call, where ``regex_pat`` is used as a regular expression
        tm.assert_numpy_array_equal(
            strings.str_contains(obj_values, regex_pat),
            np.array([False, NA, True, True, False], dtype=np.object_))

        # regex=False: only the element containing the literal text matches
        tm.assert_numpy_array_equal(
            strings.str_contains(obj_values, regex_pat, regex=False),
            np.array([False, NA, False, False, True], dtype=np.object_))

        # a plain list without missing values gives a boolean array
        found = strings.str_contains(
            ['foo', 'xyz', 'fooommm__foo', 'mmm_'], regex_pat)
        all_present = np.array([False, False, True, True])
        assert found.dtype == np.bool_
        tm.assert_numpy_array_equal(found, all_present)

        # case insensitive using regex
        cased = ['Foo', 'xYz', 'fOOomMm__fOo', 'MMM_']
        tm.assert_numpy_array_equal(
            strings.str_contains(cased, 'FOO|mmm', case=False),
            np.array([True, False, True, True]))

        # case insensitive without regex
        tm.assert_numpy_array_equal(
            strings.str_contains(cased, 'foo', regex=False, case=False),
            np.array([True, False, True, False]))

        # mixed
        mixed = ['a', NA, 'b', True, datetime.today(), 'foo', None, 1, 2.]
        mixed_hits = [False, NA, False, NA, NA, True, NA, NA, NA]
        tm.assert_numpy_array_equal(
            strings.str_contains(mixed, 'o'),
            np.array(mixed_hits, dtype=np.object_))

        via_accessor = Series(mixed).str.contains('o')
        mixed_expected = Series(mixed_hits)
        assert isinstance(via_accessor, Series)
        tm.assert_series_equal(via_accessor, mixed_expected)

        # unicode
        uni_values = np.array([u'foo', NA, u'fooommm__foo', u'mmm_'],
                              dtype=np.object_)
        regex_pat = 'mmm[_]+'

        tm.assert_numpy_array_equal(
            strings.str_contains(uni_values, regex_pat),
            np.array([False, np.nan, True, True], dtype=np.object_))

        # an explicit ``na`` fill value yields a plain boolean expectation
        tm.assert_numpy_array_equal(
            strings.str_contains(uni_values, regex_pat, na=False),
            np.array([False, False, True, True]))

        no_missing = np.array(['foo', 'xyz', 'fooommm__foo', 'mmm_'],
                              dtype=np.object_)
        found = strings.str_contains(no_missing, regex_pat)
        all_present = np.array([False, False, True, True])
        assert found.dtype == np.bool_
        tm.assert_numpy_array_equal(found, all_present)

        # na
        with_nan = Series(['om', 'foo', np.nan])
        filled = with_nan.str.contains('foo', na="foo")
        assert filled.loc[2] == "foo"

    def test_startswith(self):
        # expected outcome of looking for the prefix 'foo' in the inputs
        # used by the first and the unicode section
        foo_hits = [False, NA, True, False, False, NA, True]

        plain = Series(['om', NA, 'foo_nom', 'nom', 'bar_foo', NA, 'foo'])
        tm.assert_series_equal(plain.str.startswith('foo'),
                               Series(foo_hits))

        # mixed
        mixed = np.array(['a', NA, 'b', True, datetime.today(),
                          'foo', None, 1, 2.], dtype=np.object_)
        mixed_hits = [False, NA, False, NA, NA, True, NA, NA, NA]
        tm.assert_numpy_array_equal(
            strings.str_startswith(mixed, 'f'),
            np.array(mixed_hits, dtype=np.object_))

        via_accessor = Series(mixed).str.startswith('f')
        assert isinstance(via_accessor, Series)
        tm.assert_series_equal(via_accessor, Series(mixed_hits))

        # unicode
        uni = Series([u('om'), NA, u('foo_nom'), u('nom'), u('bar_foo'), NA,
                      u('foo')])
        expected = Series(foo_hits)
        tm.assert_series_equal(uni.str.startswith('foo'), expected)

        # with na=True the expectation is the same Series with its missing
        # slots filled by True and cast to bool
        tm.assert_series_equal(uni.str.startswith('foo', na=True),
                               expected.fillna(True).astype(bool))

    def test_endswith(self):
        # expected outcome of looking for the suffix 'foo' in the inputs
        # used by the first and the unicode section
        foo_hits = [False, NA, False, False, True, NA, True]

        plain = Series(['om', NA, 'foo_nom', 'nom', 'bar_foo', NA, 'foo'])
        tm.assert_series_equal(plain.str.endswith('foo'), Series(foo_hits))

        # mixed
        mixed = ['a', NA, 'b', True, datetime.today(), 'foo', None, 1, 2.]
        mixed_hits = [False, NA, False, NA, NA, False, NA, NA, NA]
        tm.assert_numpy_array_equal(
            strings.str_endswith(mixed, 'f'),
            np.array(mixed_hits, dtype=np.object_))

        via_accessor = Series(mixed).str.endswith('f')
        mixed_expected = Series(mixed_hits)
        assert isinstance(via_accessor, Series)
        tm.assert_series_equal(via_accessor, mixed_expected)

        # unicode
        uni = Series([u('om'), NA, u('foo_nom'), u('nom'), u('bar_foo'), NA,
                      u('foo')])
        expected = Series(foo_hits)
        tm.assert_series_equal(uni.str.endswith('foo'), expected)

        # with na=False the expectation is the same Series with its missing
        # slots filled by False and cast to bool
        tm.assert_series_equal(uni.str.endswith('foo', na=False),
                               expected.fillna(False).astype(bool))

    def test_title(self):
        # inputs in assorted casing; the NA entry is expected to stay NA
        plain = Series(["FOO", "BAR", NA, "Blah", "blurg"])
        tm.assert_series_equal(
            plain.str.title(),
            Series(["Foo", "Bar", NA, "Blah", "Blurg"]))

        # mixed
        # every non-string entry is expected to come back as NA
        titled = Series(["FOO", NA, "bar", True, datetime.today(), "blah",
                         None, 1, 2.]).str.title()
        tm.assert_almost_equal(
            titled,
            Series(["Foo", NA, "Bar", NA, NA, "Blah", NA, NA, NA]))

        # unicode
        uni = Series([u("FOO"), NA, u("bar"), u("Blurg")])
        tm.assert_series_equal(
            uni.str.title(),
            Series([u("Foo"), NA, u("Bar"), u("Blurg")]))

    def test_lower_upper(self):
        # Upper-casing lowercase data and lower-casing it again must
        # round-trip back to the input.
        lowered = Series(['om', NA, 'nom', 'nom'])

        uppered = lowered.str.upper()
        tm.assert_series_equal(uppered, Series(['OM', NA, 'NOM', 'NOM']))
        tm.assert_series_equal(uppered.str.lower(), lowered)

        # mixed: non-string entries are expected to end up as NA
        hetero = Series(['a', NA, 'b', True, datetime.today(), 'foo', None,
                         1, 2.])
        hetero_upper = hetero.str.upper()
        round_trip = Series(hetero_upper).str.lower()
        expected = Series(['a', NA, 'b', NA, NA, 'foo', NA, NA, NA])
        assert isinstance(round_trip, Series)
        tm.assert_series_equal(round_trip, expected)

        # unicode
        uni_lowered = Series([u('om'), NA, u('nom'), u('nom')])

        uni_uppered = uni_lowered.str.upper()
        tm.assert_series_equal(
            uni_uppered, Series([u('OM'), NA, u('NOM'), u('NOM')]))
        tm.assert_series_equal(uni_uppered.str.lower(), uni_lowered)

    def test_capitalize(self):
        # str.capitalize on plain, mixed-type and unicode data.
        plain = Series(["FOO", "BAR", NA, "Blah", "blurg"])
        expected = Series(["Foo", "Bar", NA, "Blah", "Blurg"])
        tm.assert_series_equal(plain.str.capitalize(), expected)

        # mixed: non-string entries are expected to come back as NA
        hetero = Series(["FOO", NA, "bar", True, datetime.today(), "blah",
                         None, 1, 2.])
        capitalized = hetero.str.capitalize()
        expected = Series(["Foo", NA, "Bar", NA, NA, "Blah", NA, NA, NA])
        tm.assert_almost_equal(capitalized, expected)

        # unicode
        uni = Series([u("FOO"), NA, u("bar"), u("Blurg")])
        expected = Series([u("Foo"), NA, u("Bar"), u("Blurg")])
        tm.assert_series_equal(uni.str.capitalize(), expected)

    def test_swapcase(self):
        # str.swapcase on plain, mixed-type and unicode data.
        plain = Series(["FOO", "BAR", NA, "Blah", "blurg"])
        expected = Series(["foo", "bar", NA, "bLAH", "BLURG"])
        tm.assert_series_equal(plain.str.swapcase(), expected)

        # mixed: non-string entries are expected to come back as NA
        hetero = Series(["FOO", NA, "bar", True, datetime.today(), "Blah",
                         None, 1, 2.])
        swapped = hetero.str.swapcase()
        expected = Series(["foo", NA, "BAR", NA, NA, "bLAH", NA, NA, NA])
        tm.assert_almost_equal(swapped, expected)

        # unicode
        uni = Series([u("FOO"), NA, u("bar"), u("Blurg")])
        expected = Series([u("foo"), NA, u("BAR"), u("bLURG")])
        tm.assert_series_equal(uni.str.swapcase(), expected)

    def test_casemethods(self):
        # Each vectorised case method must agree, element by element, with
        # the builtin ``str`` method of the same name.
        words = ['aaa', 'bbb', 'CCC', 'Dddd', 'eEEE']
        ser = Series(words)
        for method in ('lower', 'upper', 'title', 'capitalize', 'swapcase'):
            vectorised = getattr(ser.str, method)().tolist()
            builtin = [getattr(word, method)() for word in words]
            assert vectorised == builtin

    def test_replace(self):
        # Regex replacement, with and without a cap on substitutions.
        bad_pat = 'BAD[_]*'
        ser = Series(['fooBAD__barBAD', NA])

        tm.assert_series_equal(ser.str.replace(bad_pat, ''),
                               Series(['foobar', NA]))
        tm.assert_series_equal(ser.str.replace(bad_pat, '', n=1),
                               Series(['foobarBAD', NA]))

        # mixed
        hetero = Series(['aBAD', NA, 'bBAD', True, datetime.today(),
                         'fooBAD', None, 1, 2.])

        cleaned = Series(hetero).str.replace(bad_pat, '')
        expected = Series(['a', NA, 'b', NA, NA, 'foo', NA, NA, NA])
        assert isinstance(cleaned, Series)
        tm.assert_almost_equal(cleaned, expected)

        # unicode
        ser = Series([u('fooBAD__barBAD'), NA])

        tm.assert_series_equal(ser.str.replace(bad_pat, ''),
                               Series([u('foobar'), NA]))
        tm.assert_series_equal(ser.str.replace(bad_pat, '', n=1),
                               Series([u('foobarBAD'), NA]))

        # flags + unicode
        ser = Series([b"abcd,\xc3\xa0".decode("utf-8")])
        expected = Series([b"abcd, \xc3\xa0".decode("utf-8")])
        spaced = ser.str.replace(r"(?<=\w),(?=\w)", ", ", flags=re.UNICODE)
        tm.assert_series_equal(spaced, expected)

        # GH 13438: None, int and dict replacements must raise TypeError
        for klass in (Series, Index):
            for repl in (None, 3, {'a': 'b'}):
                for data in (['a', 'b', None], ['a', 'b', 'c', 'ad']):
                    # bind the method first so only the call is guarded
                    replace = klass(data).str.replace
                    with pytest.raises(TypeError):
                        replace('a', repl)

    def test_replace_callable(self):
        # GH 15055: ``repl`` may be a callable taking the match object.
        ser = Series(['fooBAD__barBAD', NA])

        def swap_whole_match(match):
            return match.group(0).swapcase()

        swapped = ser.str.replace('[a-z][A-Z]{2}', swap_whole_match, n=2)
        tm.assert_series_equal(swapped, Series(['foObaD__baRbaD', NA]))

        # A callable with the wrong arity must surface the interpreter's
        # TypeError; the message wording differs between Python 2 and 3.
        if not compat.PY2:
            p_err = (r'((takes)|(missing)) (?(2)from \d+ to )?\d+ '
                     r'(?(3)required )positional arguments?')
        else:
            p_err = r'takes (no|(exactly|at (least|most)) ?\d+) arguments?'

        wrong_arity = (
            lambda: None,
            lambda m, x: None,
            lambda m, x, y=None: None,
        )
        for repl in wrong_arity:
            with tm.assert_raises_regex(TypeError, p_err):
                ser.str.replace('a', repl)

        # test regex named groups
        def swap_middle(match):
            return match.group('middle').swapcase()

        names = Series(['Foo Bar Baz', NA])
        pat = r"(?P<first>\w+) (?P<middle>\w+) (?P<last>\w+)"
        tm.assert_series_equal(names.str.replace(pat, swap_middle),
                               Series(['bAR', NA]))

    def test_replace_compiled_regex(self):
        # GH 15446: ``pat`` may be a pre-compiled regular expression.
        bad_pat = re.compile(r'BAD[_]*')

        ser = Series(['fooBAD__barBAD', NA])
        tm.assert_series_equal(ser.str.replace(bad_pat, ''),
                               Series(['foobar', NA]))

        # mixed
        hetero = Series(['aBAD', NA, 'bBAD', True, datetime.today(),
                         'fooBAD', None, 1, 2.])

        cleaned = Series(hetero).str.replace(bad_pat, '')
        expected = Series(['a', NA, 'b', NA, NA, 'foo', NA, NA, NA])
        assert isinstance(cleaned, Series)
        tm.assert_almost_equal(cleaned, expected)

        # unicode
        ser = Series([u('fooBAD__barBAD'), NA])

        tm.assert_series_equal(ser.str.replace(bad_pat, ''),
                               Series([u('foobar'), NA]))
        tm.assert_series_equal(ser.str.replace(bad_pat, '', n=1),
                               Series([u('foobarBAD'), NA]))

        # flags + unicode
        ser = Series([b"abcd,\xc3\xa0".decode("utf-8")])
        expected = Series([b"abcd, \xc3\xa0".decode("utf-8")])
        comma_pat = re.compile(r"(?<=\w),(?=\w)", flags=re.UNICODE)
        tm.assert_series_equal(ser.str.replace(comma_pat, ", "), expected)

        # Passing case or flags together with a compiled pattern is
        # expected to raise ValueError.
        ser = Series(['fooBAD__barBAD__bad', NA])
        bad_pat = re.compile(r'BAD[_]*')
        conflicting_kwargs = (
            {'flags': re.IGNORECASE},
            {'case': False},
            {'case': True},
        )
        for extra in conflicting_kwargs:
            with tm.assert_raises_regex(ValueError,
                                        "case and flags cannot be"):
                ser.str.replace(bad_pat, '', **extra)

        # test with callable
        def swap_whole_match(match):
            return match.group(0).swapcase()

        ser = Series(['fooBAD__barBAD', NA])
        pair_pat = re.compile('[a-z][A-Z]{2}')
        swapped = ser.str.replace(pair_pat, swap_whole_match, n=2)
        tm.assert_series_equal(swapped, Series(['foObaD__baRbaD', NA]))

    def test_repeat(self):
        # str.repeat with a scalar count and with one count per element.
        letters = Series(['a', 'b', NA, 'c', NA, 'd'])

        tripled = letters.str.repeat(3)
        tm.assert_series_equal(
            tripled, Series(['aaa', 'bbb', NA, 'ccc', NA, 'ddd']))

        stepped = letters.str.repeat([1, 2, 3, 4, 5, 6])
        tm.assert_series_equal(
            stepped, Series(['a', 'bb', NA, 'cccc', NA, 'dddddd']))

        # mixed: non-string entries are expected to come back as NA
        hetero = Series(['a', NA, 'b', True, datetime.today(), 'foo', None,
                         1, 2.])

        tripled = Series(hetero).str.repeat(3)
        expected = Series(['aaa', NA, 'bbb', NA, NA, 'foofoofoo', NA, NA, NA])
        assert isinstance(tripled, Series)
        tm.assert_series_equal(tripled, expected)

        # unicode
        uni = Series([u('a'), u('b'), NA, u('c'), NA, u('d')])

        tripled = uni.str.repeat(3)
        expected = Series([u('aaa'), u('bbb'), NA, u('ccc'), NA, u('ddd')])
        tm.assert_series_equal(tripled, expected)

        stepped = uni.str.repeat([1, 2, 3, 4, 5, 6])
        expected = Series([u('a'), u('bb'), NA, u('cccc'), NA, u('dddddd')])
        tm.assert_series_equal(stepped, expected)

    def test_match(self):
        # New match behavior introduced in 0.13
        grouped_pat = '.*(BAD[_]+).*(BAD)'
        plain_pat = '.*BAD[_]+.*BAD'
        expected = Series([True, NA, False])

        ser = Series(['fooBAD__barBAD', NA, 'foo'])
        tm.assert_series_equal(ser.str.match(grouped_pat), expected)

        ser = Series(['fooBAD__barBAD', NA, 'foo'])
        tm.assert_series_equal(ser.str.match(plain_pat), expected)

        # test passing as_indexer still works but is ignored
        ser = Series(['fooBAD__barBAD', NA, 'foo'])
        with tm.assert_produces_warning(FutureWarning):
            hits = ser.str.match(plain_pat, as_indexer=True)
        tm.assert_series_equal(hits, expected)
        with tm.assert_produces_warning(FutureWarning):
            hits = ser.str.match(plain_pat, as_indexer=False)
        tm.assert_series_equal(hits, expected)
        with tm.assert_produces_warning(FutureWarning):
            hits = ser.str.match(grouped_pat, as_indexer=True)
        tm.assert_series_equal(hits, expected)
        # capture groups combined with as_indexer=False must raise;
        # bind the method first so only the call itself is guarded
        match = ser.str.match
        with pytest.raises(ValueError):
            match(grouped_pat, as_indexer=False)

        # mixed
        hetero = Series(['aBAD_BAD', NA, 'BAD_b_BAD', True, datetime.today(),
                         'foo', None, 1, 2.])
        hetero_hits = Series(hetero).str.match(grouped_pat)
        hetero_expected = Series([True, NA, True, NA, NA, False, NA, NA, NA])
        assert isinstance(hetero_hits, Series)
        tm.assert_series_equal(hetero_hits, hetero_expected)

        # unicode
        uni = Series([u('fooBAD__barBAD'), NA, u('foo')])
        tm.assert_series_equal(uni.str.match(grouped_pat), expected)

        # na GH #6609
        filled = Series(['a', 0, np.nan]).str.match('a', na=False)
        assert_series_equal(Series([True, False, False]), filled)
        unfilled = Series(['a', 0, np.nan]).str.match('a')
        assert_series_equal(Series([True, np.nan, np.nan]), unfilled)

    def test_extract_expand_None(self):
        # Passing expand=None explicitly is expected to emit FutureWarning.
        pattern = '.*(BAD[_]+).*(BAD)'
        ser = Series(['fooBAD__barBAD', NA, 'foo'])
        with tm.assert_produces_warning(FutureWarning):
            ser.str.extract(pattern, expand=None)

    def test_extract_expand_unspecified(self):
        # Omitting ``expand`` altogether is expected to emit FutureWarning.
        pattern = '.*(BAD[_]+).*(BAD)'
        ser = Series(['fooBAD__barBAD', NA, 'foo'])
        with tm.assert_produces_warning(FutureWarning):
            ser.str.extract(pattern)

    def test_extract_expand_False(self):
        # Contains tests like those in test_match and some others.
        bad_pat = '.*(BAD[_]+).*(BAD)'
        blank = [NA, NA]  # row expected where nothing matched

        ser = Series(['fooBAD__barBAD', NA, 'foo'])
        got = ser.str.extract(bad_pat, expand=False)
        want = DataFrame([['BAD__', 'BAD'], blank, blank])
        tm.assert_frame_equal(got, want)

        # mixed
        hetero = Series(['aBAD_BAD', NA, 'BAD_b_BAD', True, datetime.today(),
                         'foo', None, 1, 2.])

        got = Series(hetero).str.extract(bad_pat, expand=False)
        hit = ['BAD_', 'BAD']
        want = DataFrame([hit, blank, hit] + [blank] * 6)
        tm.assert_frame_equal(got, want)

        # unicode
        uni = Series([u('fooBAD__barBAD'), NA, u('foo')])

        got = uni.str.extract(bad_pat, expand=False)
        want = DataFrame([[u('BAD__'), u('BAD')], blank, blank])
        tm.assert_frame_equal(got, want)

        # GH9980
        # Index only works with one regex group since
        # multi-group would expand to a frame
        labels = Index(['A1', 'A2', 'A3', 'A4', 'B5'])
        with tm.assert_raises_regex(ValueError, "supported"):
            labels.str.extract('([AB])([123])', expand=False)

        # these should work for both Series and Index
        for klass in [Series, Index]:
            s_or_idx = klass(['A1', 'B2', 'C3'])

            # no groups
            with pytest.raises(ValueError):
                s_or_idx.str.extract('[ABC][123]', expand=False)

            # only non-capturing groups
            with pytest.raises(ValueError):
                s_or_idx.str.extract('(?:[AB]).*', expand=False)

            # single group renames series/index properly
            s_or_idx = klass(['A1', 'A2'])
            got = s_or_idx.str.extract(r'(?P<uno>A)\d', expand=False)
            assert got.name == 'uno'

            want = klass(['A', 'A'], name='uno')
            if klass == Series:
                assert_equal = tm.assert_series_equal
            else:
                assert_equal = tm.assert_index_equal
            assert_equal(got, want)

        ser = Series(['A1', 'B2', 'C3'])

        # one group, no matches
        got = ser.str.extract('(_)', expand=False)
        tm.assert_series_equal(got, Series([NA, NA, NA], dtype=object))

        # two groups, no matches
        got = ser.str.extract('(_)(_)', expand=False)
        want = DataFrame([[NA, NA], [NA, NA], [NA, NA]], dtype=object)
        tm.assert_frame_equal(got, want)

        # one group, some matches
        got = ser.str.extract('([AB])[123]', expand=False)
        tm.assert_series_equal(got, Series(['A', 'B', NA]))

        # two groups, some matches
        got = ser.str.extract('([AB])([123])', expand=False)
        want = DataFrame([['A', '1'], ['B', '2'], [NA, NA]])
        tm.assert_frame_equal(got, want)

        # one named group
        got = ser.str.extract('(?P<letter>[AB])', expand=False)
        tm.assert_series_equal(got, Series(['A', 'B', NA], name='letter'))

        # two named groups
        got = ser.str.extract('(?P<letter>[AB])(?P<number>[123])',
                              expand=False)
        want = DataFrame([['A', '1'], ['B', '2'], [NA, NA]],
                         columns=['letter', 'number'])
        tm.assert_frame_equal(got, want)

        # mix named and unnamed groups
        got = ser.str.extract('([AB])(?P<number>[123])', expand=False)
        want = DataFrame([['A', '1'], ['B', '2'], [NA, NA]],
                         columns=[0, 'number'])
        tm.assert_frame_equal(got, want)

        # one normal group, one non-capturing group
        got = ser.str.extract('([AB])(?:[123])', expand=False)
        tm.assert_series_equal(got, Series(['A', 'B', NA]))

        # two normal groups, one non-capturing group
        doubled = Series(['A11', 'B22', 'C33'])
        got = doubled.str.extract('([AB])([123])(?:[123])', expand=False)
        want = DataFrame([['A', '1'], ['B', '2'], [NA, NA]])
        tm.assert_frame_equal(got, want)

        # one optional group followed by one normal group
        got = Series(['A1', 'B2', '3']).str.extract(
            '(?P<letter>[AB])?(?P<number>[123])', expand=False)
        want = DataFrame([['A', '1'], ['B', '2'], [NA, '3']],
                         columns=['letter', 'number'])
        tm.assert_frame_equal(got, want)

        # one normal group followed by one optional group
        got = Series(['A1', 'B2', 'C']).str.extract(
            '(?P<letter>[ABC])(?P<number>[123])?', expand=False)
        want = DataFrame([['A', '1'], ['B', '2'], ['C', NA]],
                         columns=['letter', 'number'])
        tm.assert_frame_equal(got, want)

        # GH6348
        # not passing index to the extractor
        def check_index(index):
            # The subject's index must be carried over to the result.
            data = ['A1', 'B2', 'C']
            index = index[:len(data)]

            digits = Series(data, index=index).str.extract(
                r'(\d)', expand=False)
            tm.assert_series_equal(
                digits, Series(['1', '2', NA], index=index))

            pairs = Series(data, index=index).str.extract(
                r'(?P<letter>\D)(?P<number>\d)?', expand=False)
            rows = [['A', '1'], ['B', '2'], ['C', NA]]
            want_pairs = DataFrame(rows, columns=['letter', 'number'],
                                   index=index)
            tm.assert_frame_equal(pairs, want_pairs)

        index_makers = [
            tm.makeStringIndex, tm.makeUnicodeIndex, tm.makeIntIndex,
            tm.makeDateIndex, tm.makePeriodIndex, tm.makeRangeIndex
        ]
        for make_index in index_makers:
            check_index(make_index())

        # single_series_name_is_preserved.
        named = Series(['a3', 'b3', 'c2'], name='bob')
        got = named.str.extract(r'(?P<sue>[a-z])', expand=False)
        want = Series(['a', 'b', 'c'], name='sue')
        tm.assert_series_equal(got, want)
        assert got.name == want.name

    def test_extract_expand_True(self):
        # Contains tests like those in test_match and some others.
        bad_pat = '.*(BAD[_]+).*(BAD)'
        blank = [NA, NA]  # row expected where nothing matched

        ser = Series(['fooBAD__barBAD', NA, 'foo'])
        got = ser.str.extract(bad_pat, expand=True)
        want = DataFrame([['BAD__', 'BAD'], blank, blank])
        tm.assert_frame_equal(got, want)

        # mixed
        hetero = Series(['aBAD_BAD', NA, 'BAD_b_BAD', True, datetime.today(),
                         'foo', None, 1, 2.])

        got = Series(hetero).str.extract(bad_pat, expand=True)
        hit = ['BAD_', 'BAD']
        want = DataFrame([hit, blank, hit] + [blank] * 6)
        tm.assert_frame_equal(got, want)

        # unicode
        uni = Series([u('fooBAD__barBAD'), NA, u('foo')])

        got = uni.str.extract(bad_pat, expand=True)
        want = DataFrame([[u('BAD__'), u('BAD')], blank, blank])
        tm.assert_frame_equal(got, want)

        # these should work for both Series and Index
        for klass in [Series, Index]:
            s_or_idx = klass(['A1', 'B2', 'C3'])

            # no groups
            with pytest.raises(ValueError):
                s_or_idx.str.extract('[ABC][123]', expand=True)

            # only non-capturing groups
            with pytest.raises(ValueError):
                s_or_idx.str.extract('(?:[AB]).*', expand=True)

            # single group: a frame whose only column is the group name
            s_or_idx = klass(['A1', 'A2'])
            frame = s_or_idx.str.extract(r'(?P<uno>A)\d', expand=True)
            assert isinstance(frame, DataFrame)
            column = frame['uno']
            assert_series_equal(column, Series(['A', 'A'], name='uno'))

    def test_extract_series(self):
        # extract should give the same result whether or not the
        # series has a name.
        partial_rows = [
            ['A', '1'],
            ['B', '2'],
            [NA, NA]
        ]
        for series_name in (None, "series_name"):
            ser = Series(['A1', 'B2', 'C3'], name=series_name)

            # one group, no matches
            got = ser.str.extract('(_)', expand=True)
            tm.assert_frame_equal(
                got, DataFrame([NA, NA, NA], dtype=object))

            # two groups, no matches
            got = ser.str.extract('(_)(_)', expand=True)
            want = DataFrame([[NA, NA], [NA, NA], [NA, NA]], dtype=object)
            tm.assert_frame_equal(got, want)

            # one group, some matches
            got = ser.str.extract('([AB])[123]', expand=True)
            tm.assert_frame_equal(got, DataFrame(['A', 'B', NA]))

            # two groups, some matches
            got = ser.str.extract('([AB])([123])', expand=True)
            want = DataFrame([['A', '1'], ['B', '2'], [NA, NA]])
            tm.assert_frame_equal(got, want)

            # one named group
            got = ser.str.extract('(?P<letter>[AB])', expand=True)
            tm.assert_frame_equal(
                got, DataFrame({"letter": ['A', 'B', NA]}))

            # two named groups
            got = ser.str.extract(
                '(?P<letter>[AB])(?P<number>[123])', expand=True)
            want = DataFrame(partial_rows, columns=['letter', 'number'])
            tm.assert_frame_equal(got, want)

            # mix named and unnamed groups
            got = ser.str.extract('([AB])(?P<number>[123])', expand=True)
            want = DataFrame(partial_rows, columns=[0, 'number'])
            tm.assert_frame_equal(got, want)

            # one normal group, one non-capturing group
            got = ser.str.extract('([AB])(?:[123])', expand=True)
            tm.assert_frame_equal(got, DataFrame(['A', 'B', NA]))

    def test_extract_optional_groups(self):
        # extract(expand=True) with non-capturing and optional groups.

        # two normal groups, one non-capturing group
        doubled = Series(['A11', 'B22', 'C33'])
        got = doubled.str.extract('([AB])([123])(?:[123])', expand=True)
        want = DataFrame([['A', '1'], ['B', '2'], [NA, NA]])
        tm.assert_frame_equal(got, want)

        # one optional group followed by one normal group
        got = Series(['A1', 'B2', '3']).str.extract(
            '(?P<letter>[AB])?(?P<number>[123])', expand=True)
        want = DataFrame([['A', '1'], ['B', '2'], [NA, '3']],
                         columns=['letter', 'number'])
        tm.assert_frame_equal(got, want)

        # one normal group followed by one optional group
        got = Series(['A1', 'B2', 'C']).str.extract(
            '(?P<letter>[ABC])(?P<number>[123])?', expand=True)
        want = DataFrame([['A', '1'], ['B', '2'], ['C', NA]],
                         columns=['letter', 'number'])
        tm.assert_frame_equal(got, want)

        # GH6348
        # not passing index to the extractor
        def check_index(index):
            # The subject's index must be carried over to the result.
            data = ['A1', 'B2', 'C']
            index = index[:len(data)]

            digits = Series(data, index=index).str.extract(
                r'(\d)', expand=True)
            tm.assert_frame_equal(
                digits, DataFrame(['1', '2', NA], index=index))

            pairs = Series(data, index=index).str.extract(
                r'(?P<letter>\D)(?P<number>\d)?', expand=True)
            rows = [['A', '1'], ['B', '2'], ['C', NA]]
            want_pairs = DataFrame(rows, columns=['letter', 'number'],
                                   index=index)
            tm.assert_frame_equal(pairs, want_pairs)

        index_makers = [
            tm.makeStringIndex, tm.makeUnicodeIndex, tm.makeIntIndex,
            tm.makeDateIndex, tm.makePeriodIndex, tm.makeRangeIndex
        ]
        for make_index in index_makers:
            check_index(make_index())

    def test_extract_single_group_returns_frame(self):
        # GH11386 extract should always return DataFrame, even when
        # there is only one group. Prior to v0.18.0, extract returned
        # Series when there was only one group in the regex.
        named = Series(['a3', 'b3', 'c2'], name='series_name')
        got = named.str.extract(r'(?P<letter>[a-z])', expand=True)
        want = DataFrame({"letter": ['a', 'b', 'c']})
        tm.assert_frame_equal(got, want)

    def test_extractall(self):
        # extractall should return a DataFrame with one row for each
        # match, indexed by the subject from which the match came.
        subjects = [
            'dave@google.com',
            'tdhock5@gmail.com',
            'maudelaperriere@gmail.com',
            'rob@gmail.com some text steve@gmail.com',
            'a@b.com some text c@d.com and e@f.com',
            np.nan,
            "",
        ]
        match_rows = [
            ("dave", "google", "com"),
            ("tdhock5", "gmail", "com"),
            ("maudelaperriere", "gmail", "com"),
            ("rob", "gmail", "com"),
            ("steve", "gmail", "com"),
            ("a", "b", "com"),
            ("c", "d", "com"),
            ("e", "f", "com"),
        ]
        email_pat = r"""
        (?P<user>[a-z0-9]+)
        @
        (?P<domain>[a-z]+)
        \.
        (?P<tld>[a-z]{2,4})
        """
        group_names = ["user", "domain", "tld"]

        # Subject with the default integer index.
        plain = Series(subjects)
        want_index = MultiIndex.from_tuples(
            [(0, 0), (1, 0), (2, 0), (3, 0), (3, 1), (4, 0), (4, 1), (4, 2)],
            names=(None, "match"))
        want = DataFrame(match_rows, want_index, group_names)
        got = plain.str.extractall(email_pat, re.VERBOSE)
        tm.assert_frame_equal(got, want)

        # The index of the input Series should be used to construct
        # the index of the output DataFrame:
        subject_index = MultiIndex.from_tuples([
            ("single", "Dave"),
            ("single", "Toby"),
            ("single", "Maude"),
            ("multiple", "robAndSteve"),
            ("multiple", "abcdef"),
            ("none", "missing"),
            ("none", "empty"),
        ])
        indexed = Series(subjects, subject_index)
        want_index = MultiIndex.from_tuples([
            ("single", "Dave", 0),
            ("single", "Toby", 0),
            ("single", "Maude", 0),
            ("multiple", "robAndSteve", 0),
            ("multiple", "robAndSteve", 1),
            ("multiple", "abcdef", 0),
            ("multiple", "abcdef", 1),
            ("multiple", "abcdef", 2),
        ], names=(None, None, "match"))
        want = DataFrame(match_rows, want_index, group_names)
        got = indexed.str.extractall(email_pat, re.VERBOSE)
        tm.assert_frame_equal(got, want)

        # MultiIndexed subject with names.  Both the subject's index and
        # the expected index are renamed in place before comparing.
        named = Series(subjects, subject_index)
        named.index.names = ("matches", "description")
        want_index.names = ("matches", "description", "match")
        want = DataFrame(match_rows, want_index, group_names)
        got = named.str.extractall(email_pat, re.VERBOSE)
        tm.assert_frame_equal(got, want)

        # optional groups.
        subjects = ['', 'A1', '32']
        optional_rows = [
            ('A', '1'),
            (NA, '3'),
            (NA, '2'),
        ]
        got = Series(subjects).str.extractall(
            '(?P<letter>[AB])?(?P<number>[123])')
        want_index = MultiIndex.from_tuples(
            [(1, 0), (2, 0), (2, 1)], names=(None, "match"))
        want = DataFrame(optional_rows, want_index,
                         columns=['letter', 'number'])
        tm.assert_frame_equal(got, want)

        # only one of two groups has a name.
        got = Series(subjects).str.extractall('([AB])?(?P<number>[123])')
        want = DataFrame(optional_rows, want_index, columns=[0, 'number'])
        tm.assert_frame_equal(got, want)

    def test_extractall_single_group(self):
        # A single capture group still yields a one-column DataFrame.
        ser = Series(['a3', 'b3', 'd4c2'], name='series_name')
        want_index = MultiIndex.from_tuples(
            [(0, 0), (1, 0), (2, 0), (2, 1)], names=(None, "match"))

        # extractall(one named group) returns DataFrame with one named
        # column.
        got = ser.str.extractall(r'(?P<letter>[a-z])')
        want = DataFrame({"letter": ['a', 'b', 'd', 'c']}, want_index)
        tm.assert_frame_equal(got, want)

        # extractall(one un-named group) returns DataFrame with one
        # un-named column.
        got = ser.str.extractall(r'([a-z])')
        want = DataFrame(['a', 'b', 'd', 'c'], want_index)
        tm.assert_frame_equal(got, want)

    def test_extractall_single_group_with_quantifier(self):
        # extractall(one un-named group with quantifier) returns
        # DataFrame with one un-named column (GH13382).
        ser = Series(['ab3', 'abc3', 'd4cd2'], name='series_name')
        got = ser.str.extractall(r'([a-z]+)')

        want_index = MultiIndex.from_tuples(
            [(0, 0), (1, 0), (2, 0), (2, 1)], names=(None, "match"))
        want = DataFrame(['ab', 'abc', 'd', 'cd'], want_index)
        tm.assert_frame_equal(got, want)

    def test_extractall_no_matches(self):
        # When nothing matches, the result is compared against an empty
        # frame that has one column per capture group.
        ser = Series(['a3', 'b3', 'd4c2'], name='series_name')
        cases = [
            # one un-named group.
            ('(z)', [0]),
            # two un-named groups.
            ('(z)(z)', [0, 1]),
            # one named group.
            ('(?P<first>z)', ["first"]),
            # two named groups.
            ('(?P<first>z)(?P<second>z)', ["first", "second"]),
            # one named, one un-named.
            ('(z)(?P<second>z)', [0, "second"]),
        ]
        for pattern, columns in cases:
            got = ser.str.extractall(pattern)
            want = DataFrame(columns=columns)
            tm.assert_frame_equal(got, want)

    def test_extractall_stringindex(self):
        # extractall on a named Series, on an Index, and on a Series that
        # carries a named string index.
        digit_pat = r"[ab](?P<digit>\d)"
        data = ["a1a2", "b1", "c1"]

        got = Series(data, name='xxx').str.extractall(digit_pat)
        want_index = MultiIndex.from_tuples([(0, 0), (0, 1), (1, 0)],
                                            names=[None, 'match'])
        want = DataFrame({'digit': ["1", "2", "1"]}, index=want_index)
        tm.assert_frame_equal(got, want)

        # An Index should give the same result as the default-indexed
        # Series above; the Index's own name does not affect the result.
        for idx in [Index(["a1a2", "b1", "c1"]),
                    Index(["a1a2", "b1", "c1"], name='xxx')]:
            tm.assert_frame_equal(idx.str.extractall(digit_pat), want)

        # a named subject index becomes the first level of the result
        labelled = Series(data, name='s_name',
                          index=Index(["XX", "yy", "zz"], name='idx_name'))
        got = labelled.str.extractall(digit_pat)
        want_index = MultiIndex.from_tuples(
            [("XX", 0), ("XX", 1), ("yy", 0)], names=["idx_name", 'match'])
        want = DataFrame({'digit': ["1", "2", "1"]}, index=want_index)
        tm.assert_frame_equal(got, want)

    def test_extractall_errors(self):
        # Does not make sense to use extractall with a regex that has
        # no capture groups. (it returns DataFrame with one column for
        # each capture group)
        groupless_pat = r'[a-z]'
        ser = Series(['a3', 'b3', 'd4c2'], name='series_name')
        with tm.assert_raises_regex(ValueError, "no capture groups"):
            ser.str.extractall(groupless_pat)

    def test_extract_index_one_two_groups(self):
        s = Series(['a3', 'b3', 'd4c2'], index=["A3", "B3", "D4"],
                   name='series_name')
        r = s.index.str.extract(r'([A-Z])', expand=True)
        e = DataFrame(['A', "B", "D"])
        tm.assert_frame_equal(r, e)

        # Prior to v0.18.0, index.str.extract(regex with one group)
        # returned Index. With more than one group, extract raised an
        # error (GH9980). Now extract always returns DataFrame.
        r = s.index.str.extract(
            r'(?P<letter>[A-Z])(?P<digit>[0-9])', expand=True)
        e_list = [
            ("A", "3"),
            ("B", "3"),
            ("D", "4"),
        ]
        e = DataFrame(e_list, columns=["letter", "digit"])
        tm.assert_frame_equal(r, e)

    def test_extractall_same_as_extract(self):
        s = Series(['a3', 'b3', 'c2'], name='series_name')

        pattern_two_noname = r'([a-z])([0-9])'
        extract_two_noname = s.str.extract(pattern_two_noname, expand=True)
        has_multi_index = s.str.extractall(pattern_two_noname)
        no_multi_index = has_multi_index.xs(0, level="match")
        tm.assert_frame_equal(extract_two_noname, no_multi_index)

        pattern_two_named = r'(?P<letter>[a-z])(?P<digit>[0-9])'
        extract_two_named = s.str.extract(pattern_two_named, expand=True)
        has_multi_index = s.str.extractall(pattern_two_named)
        no_multi_index = has_multi_index.xs(0, level="match")
        tm.assert_frame_equal(extract_two_named, no_multi_index)

        pattern_one_named = r'(?P<group_name>[a-z])'
        extract_one_named = s.str.extract(pattern_one_named, expand=True)
        has_multi_index = s.str.extractall(pattern_one_named)
        no_multi_index = has_multi_index.xs(0, level="match")
        tm.assert_frame_equal(extract_one_named, no_multi_index)

        pattern_one_noname = r'([a-z])'
        extract_one_noname = s.str.extract(pattern_one_noname, expand=True)
        has_multi_index = s.str.extractall(pattern_one_noname)
        no_multi_index = has_multi_index.xs(0, level="match")
        tm.assert_frame_equal(extract_one_noname, no_multi_index)

    def test_extractall_same_as_extract_subject_index(self):
        # same as above tests, but s has an MultiIndex.
        i = MultiIndex.from_tuples([
            ("A", "first"),
            ("B", "second"),
            ("C", "third"),
        ], names=("capital", "ordinal"))
        s = Series(['a3', 'b3', 'c2'], i, name='series_name')

        pattern_two_noname = r'([a-z])([0-9])'
        extract_two_noname = s.str.extract(pattern_two_noname, expand=True)
        has_match_index = s.str.extractall(pattern_two_noname)
        no_match_index = has_match_index.xs(0, level="match")
        tm.assert_frame_equal(extract_two_noname, no_match_index)

        pattern_two_named = r'(?P<letter>[a-z])(?P<digit>[0-9])'
        extract_two_named = s.str.extract(pattern_two_named, expand=True)
        has_match_index = s.str.extractall(pattern_two_named)
        no_match_index = has_match_index.xs(0, level="match")
        tm.assert_frame_equal(extract_two_named, no_match_index)

        pattern_one_named = r'(?P<group_name>[a-z])'
        extract_one_named = s.str.extract(pattern_one_named, expand=True)
        has_match_index = s.str.extractall(pattern_one_named)
        no_match_index = has_match_index.xs(0, level="match")
        tm.assert_frame_equal(extract_one_named, no_match_index)

        pattern_one_noname = r'([a-z])'
        extract_one_noname = s.str.extract(pattern_one_noname, expand=True)
        has_match_index = s.str.extractall(pattern_one_noname)
        no_match_index = has_match_index.xs(0, level="match")
        tm.assert_frame_equal(extract_one_noname, no_match_index)

    def test_empty_str_methods(self):
        """Each .str method on an empty Series gives the expected empty result."""
        # ``no_strings`` and ``subject`` are the same empty object Series:
        # one name is used as the expected value, the other as the input.
        no_strings = subject = Series(dtype=object)
        no_ints = Series(dtype=int)
        no_bools = Series(dtype=bool)
        no_bytes = Series(dtype=object)

        # GH7241
        # (extract) on empty series

        tm.assert_series_equal(no_strings, subject.str.cat(subject))
        assert '' == subject.str.cat()
        tm.assert_series_equal(no_strings, subject.str.title())
        tm.assert_series_equal(no_ints, subject.str.count('a'))
        for name in ('contains', 'startswith', 'endswith'):
            tm.assert_series_equal(no_bools, getattr(subject.str, name)('a'))
        for name in ('lower', 'upper'):
            tm.assert_series_equal(no_strings, getattr(subject.str, name)())
        tm.assert_series_equal(no_strings, subject.str.replace('a', 'b'))
        tm.assert_series_equal(no_strings, subject.str.repeat(3))
        tm.assert_series_equal(no_bools, subject.str.match('^a'))

        # extract: one group / two groups, expanded and not expanded
        tm.assert_frame_equal(DataFrame(columns=[0], dtype=str),
                              subject.str.extract('()', expand=True))
        tm.assert_frame_equal(DataFrame(columns=[0, 1], dtype=str),
                              subject.str.extract('()()', expand=True))
        tm.assert_series_equal(no_strings,
                               subject.str.extract('()', expand=False))
        tm.assert_frame_equal(DataFrame(columns=[0, 1], dtype=str),
                              subject.str.extract('()()', expand=False))

        tm.assert_frame_equal(DataFrame(dtype=str),
                              subject.str.get_dummies())
        tm.assert_series_equal(no_strings, no_strings.str.join(''))
        tm.assert_series_equal(no_ints, subject.str.len())
        tm.assert_series_equal(no_strings, no_strings.str.findall('a'))
        for name in ('find', 'rfind'):
            tm.assert_series_equal(no_ints, getattr(subject.str, name)('a'))
        for name in ('pad', 'center'):
            tm.assert_series_equal(no_strings,
                                   getattr(subject.str, name)(42))
        for name in ('split', 'rsplit'):
            tm.assert_series_equal(no_strings,
                                   getattr(subject.str, name)('a'))
        for name in ('partition', 'rpartition'):
            tm.assert_series_equal(
                no_strings, getattr(subject.str, name)('a', expand=False))
        tm.assert_series_equal(no_strings, subject.str.slice(stop=1))
        tm.assert_series_equal(no_strings, subject.str.slice(step=1))
        for name in ('strip', 'lstrip', 'rstrip'):
            tm.assert_series_equal(no_strings, getattr(subject.str, name)())
        tm.assert_series_equal(no_strings, subject.str.wrap(42))
        tm.assert_series_equal(no_strings, subject.str.get(0))
        tm.assert_series_equal(no_strings, no_bytes.str.decode('ascii'))
        tm.assert_series_equal(no_bytes, subject.str.encode('ascii'))
        for name in ('isalnum', 'isalpha', 'isdigit', 'isspace', 'islower',
                     'isupper', 'istitle', 'isnumeric', 'isdecimal'):
            tm.assert_series_equal(no_strings, getattr(subject.str, name)())
        for name in ('capitalize', 'swapcase'):
            tm.assert_series_equal(no_strings, getattr(subject.str, name)())
        tm.assert_series_equal(no_strings, subject.str.normalize('NFC'))

        # The translation-table factory lives in a different place on
        # Python 2 and Python 3.
        if not compat.PY3:
            import string
            table = string.maketrans('a', 'b')
        else:
            table = str.maketrans('a', 'b')
        tm.assert_series_equal(no_strings, subject.str.translate(table))

    def test_empty_str_methods_to_frame(self):
        """partition/rpartition on an empty Series equal an empty DataFrame."""
        subject = Series(dtype=str)
        no_frame = DataFrame([])
        for name in ('partition', 'rpartition'):
            tm.assert_frame_equal(no_frame, getattr(subject.str, name)('a'))

    def test_ismethods(self):
        values = ['A', 'b', 'Xy', '4', '3A', '', 'TT', '55', '-', '  ']
        str_s = Series(values)
        alnum_e = [True, True, True, True, True, False, True, True, False,
                   False]
        alpha_e = [True, True, True, False, False, False, True, False, False,
                   False]
        digit_e = [False, False, False, True, False, False, False, True, False,
                   False]

        # TODO: unused
        num_e = [False, False, False, True, False, False,  # noqa
                 False, True, False, False]

        space_e = [False, False, False, False, False, False, False, False,
                   False, True]
        lower_e = [False, True, False, False, False, False, False, False,
                   False, False]
        upper_e = [True, False, False, False, True, False, True, False, False,
                   False]
        title_e = [True, False, True, False, True, False, False, False, False,
                   False]

        tm.assert_series_equal(str_s.str.isalnum(), Series(alnum_e))
        tm.assert_series_equal(str_s.str.isalpha(), Series(alpha_e))
        tm.assert_series_equal(str_s.str.isdigit(), Series(digit_e))
        tm.assert_series_equal(str_s.str.isspace(), Series(space_e))
        tm.assert_series_equal(str_s.str.islower(), Series(lower_e))
        tm.assert_series_equal(str_s.str.isupper(), Series(upper_e))
        tm.assert_series_equal(str_s.str.istitle(), Series(title_e))

        assert str_s.str.isalnum().tolist() == [v.isalnum() for v in values]
        assert str_s.str.isalpha().tolist() == [v.isalpha() for v in values]
        assert str_s.str.isdigit().tolist() == [v.isdigit() for v in values]
        assert str_s.str.isspace().tolist() == [v.isspace() for v in values]
        assert str_s.str.islower().tolist() == [v.islower() for v in values]
        assert str_s.str.isupper().tolist() == [v.isupper() for v in values]
        assert str_s.str.istitle().tolist() == [v.istitle() for v in values]

    def test_isnumeric(self):
        # 0x00bc: ¼ VULGAR FRACTION ONE QUARTER
        # 0x2605: ★ not number
        # 0x1378: ፸ ETHIOPIC NUMBER SEVENTY
        # 0xFF13: ３ Em 3
        values = ['A', '3', u'¼', u'★', u'፸', u'３', 'four']
        s = Series(values)
        numeric_e = [False, True, True, False, True, True, False]
        decimal_e = [False, True, False, False, False, True, False]
        tm.assert_series_equal(s.str.isnumeric(), Series(numeric_e))
        tm.assert_series_equal(s.str.isdecimal(), Series(decimal_e))

        unicodes = [u'A', u'3', u'¼', u'★', u'፸', u'３', u'four']
        assert s.str.isnumeric().tolist() == [v.isnumeric() for v in unicodes]
        assert s.str.isdecimal().tolist() == [v.isdecimal() for v in unicodes]

        values = ['A', np.nan, u'¼', u'★', np.nan, u'３', 'four']
        s = Series(values)
        numeric_e = [False, np.nan, True, False, np.nan, True, False]
        decimal_e = [False, np.nan, False, False, np.nan, True, False]
        tm.assert_series_equal(s.str.isnumeric(), Series(numeric_e))
        tm.assert_series_equal(s.str.isdecimal(), Series(decimal_e))

    def test_get_dummies(self):
        s = Series(['a|b', 'a|c', np.nan])
        result = s.str.get_dummies('|')
        expected = DataFrame([[1, 1, 0], [1, 0, 1], [0, 0, 0]],
                             columns=list('abc'))
        tm.assert_frame_equal(result, expected)

        s = Series(['a;b', 'a', 7])
        result = s.str.get_dummies(';')
        expected = DataFrame([[0, 1, 1], [0, 1, 0], [1, 0, 0]],
                             columns=list('7ab'))
        tm.assert_frame_equal(result, expected)

        # GH9980, GH8028
        idx = Index(['a|b', 'a|c', 'b|c'])
        result = idx.str.get_dummies('|')

        expected = MultiIndex.from_tuples([(1, 1, 0), (1, 0, 1),
                                           (0, 1, 1)], names=('a', 'b', 'c'))
        tm.assert_index_equal(result, expected)

    def test_get_dummies_with_name_dummy(self):
        # GH 12180
        # Dummies named 'name' should work as expected
        s = Series(['a', 'b,name', 'b'])
        result = s.str.get_dummies(',')
        expected = DataFrame([[1, 0, 0], [0, 1, 1], [0, 1, 0]],
                             columns=['a', 'b', 'name'])
        tm.assert_frame_equal(result, expected)

        idx = Index(['a|b', 'name|c', 'b|name'])
        result = idx.str.get_dummies('|')

        expected = MultiIndex.from_tuples([(1, 1, 0, 0), (0, 0, 1, 1),
                                           (0, 1, 0, 1)],
                                          names=('a', 'b', 'c', 'name'))
        tm.assert_index_equal(result, expected)

    def test_join(self):
        """Splitting on '_' then joining with '_' reproduces the strings."""

        def _split_then_join(subject):
            return subject.str.split('_').str.join('_')

        plain = Series(['a_b_c', 'c_d_e', np.nan, 'f_g_h'])
        round_tripped = _split_then_join(plain)
        tm.assert_series_equal(plain, round_tripped)

        # mixed: every non-string entry is expected to come back as NA
        mixed = Series(['a_b', NA, 'asdf_cas_asdf', True, datetime.today(),
                        'foo', None, 1, 2.])

        rs = _split_then_join(Series(mixed))
        xp = Series(['a_b', NA, 'asdf_cas_asdf', NA, NA, 'foo', NA, NA, NA])

        assert isinstance(rs, Series)
        tm.assert_almost_equal(rs, xp)

        # unicode
        uni = Series([u('a_b_c'), u('c_d_e'), np.nan, u('f_g_h')])
        round_tripped = _split_then_join(uni)
        tm.assert_series_equal(uni, round_tripped)

    def test_len(self):
        """str.len gives each string's length and NA for anything else."""

        def _length_or_na(value):
            if notna(value):
                return len(value)
            return NA

        plain = Series(['foo', 'fooo', 'fooooo', np.nan, 'fooooooo'])

        lengths = plain.str.len()
        wanted = plain.map(_length_or_na)
        tm.assert_series_equal(lengths, wanted)

        # mixed
        mixed = Series(['a_b', NA, 'asdf_cas_asdf', True, datetime.today(),
                        'foo', None, 1, 2.])

        rs = Series(mixed).str.len()
        xp = Series([3, NA, 13, NA, NA, 3, NA, NA, NA])

        assert isinstance(rs, Series)
        tm.assert_almost_equal(rs, xp)

        # unicode
        uni = Series([u('foo'), u('fooo'), u('fooooo'), np.nan,
                      u('fooooooo')])

        lengths = uni.str.len()
        wanted = uni.map(_length_or_na)
        tm.assert_series_equal(lengths, wanted)

    def test_findall(self):
        """findall returns a list of matches per string, NA for non-strings."""
        pattern = 'BAD[_]*'

        plain = Series(['fooBAD__barBAD', NA, 'foo', 'BAD'])

        found = plain.str.findall(pattern)
        wanted = Series([['BAD__', 'BAD'], NA, [], ['BAD']])
        tm.assert_almost_equal(found, wanted)

        # mixed
        mixed = Series(['fooBAD__barBAD', NA, 'foo', True, datetime.today(),
                        'BAD', None, 1, 2.])

        rs = Series(mixed).str.findall(pattern)
        xp = Series([['BAD__', 'BAD'], NA, [], NA, NA, ['BAD'], NA, NA, NA])

        assert isinstance(rs, Series)
        tm.assert_almost_equal(rs, xp)

        # unicode
        uni = Series([u('fooBAD__barBAD'), NA, u('foo'), u('BAD')])

        found = uni.str.findall(pattern)
        wanted = Series([[u('BAD__'), u('BAD')], NA, [], [u('BAD')]])
        tm.assert_almost_equal(found, wanted)

    def test_find(self):
        """find/rfind agree with builtin str.find/str.rfind, bounds included."""
        values = Series(['ABCDEFG', 'BCDEFEF', 'DEFGHIJEF', 'EFGHEF', 'XXXX'])

        # (method name, positional arguments, expected positions)
        cases = [
            ('find', ('EF',), [4, 3, 1, 0, -1]),
            ('rfind', ('EF',), [4, 5, 7, 4, -1]),
            ('find', ('EF', 3), [4, 3, 7, 4, -1]),
            ('rfind', ('EF', 3), [4, 5, 7, 4, -1]),
            ('find', ('EF', 3, 6), [4, 3, -1, 4, -1]),
            ('rfind', ('EF', 3, 6), [4, 3, -1, 4, -1]),
        ]
        for name, args, positions in cases:
            result = getattr(values.str, name)(*args)
            tm.assert_series_equal(result, Series(positions))
            # Cross-check against the same-named builtin str method.
            expected = np.array(
                [getattr(v, name)(*args) for v in values.values],
                dtype=np.int64)
            tm.assert_numpy_array_equal(result.values, expected)

        # A non-string substring is rejected by both methods.
        for name in ('find', 'rfind'):
            with tm.assert_raises_regex(TypeError,
                                        "expected a string object, not int"):
                getattr(values.str, name)(0)

    def test_find_nan(self):
        values = Series(['ABCDEFG', np.nan, 'DEFGHIJEF', np.nan, 'XXXX'])
        result = values.str.find('EF')
        tm.assert_series_equal(result, Series([4, np.nan, 1, np.nan, -1]))

        result = values.str.rfind('EF')
        tm.assert_series_equal(result, Series([4, np.nan, 7, np.nan, -1]))

        result = values.str.find('EF', 3)
        tm.assert_series_equal(result, Series([4, np.nan, 7, np.nan, -1]))

        result = values.str.rfind('EF', 3)
        tm.assert_series_equal(result, Series([4, np.nan, 7, np.nan, -1]))

        result = values.str.find('EF', 3, 6)
        tm.assert_series_equal(result, Series([4, np.nan, -1, np.nan, -1]))

        result = values.str.rfind('EF', 3, 6)
        tm.assert_series_equal(result, Series([4, np.nan, -1, np.nan, -1]))

    def test_index(self):
        """index/rindex agree with builtin str.index/rindex on Series and Index."""

        def _assert_same(result, expected):
            # Pick the comparison that fits the container type.
            if not isinstance(result, Series):
                tm.assert_index_equal(result, expected)
            else:
                tm.assert_series_equal(result, expected)

        # (method name, positional arguments, expected positions)
        cases = [
            ('index', ('EF',), [4, 3, 1, 0]),
            ('rindex', ('EF',), [4, 5, 7, 4]),
            ('index', ('EF', 3), [4, 3, 7, 4]),
            ('rindex', ('EF', 3), [4, 5, 7, 4]),
            ('index', ('E', 4, 8), [4, 5, 7, 4]),
            ('rindex', ('E', 0, 5), [4, 3, 1, 4]),
        ]

        for klass in (Series, Index):
            s = klass(['ABCDEFG', 'BCDEFEF', 'DEFGHIJEF', 'EFGHEF'])

            for name, args, positions in cases:
                result = getattr(s.str, name)(*args)
                _assert_same(result, klass(positions))
                # Cross-check against the same-named builtin str method.
                expected = np.array(
                    [getattr(v, name)(*args) for v in s.values],
                    dtype=np.int64)
                tm.assert_numpy_array_equal(result.values, expected)

            # Unlike find, index raises when the substring is absent.
            with tm.assert_raises_regex(ValueError, "substring not found"):
                s.str.index('DE')

            with tm.assert_raises_regex(
                    TypeError, "expected a string object, not int"):
                s.str.index(0)

        # test with nan
        with_nan = Series(['abcb', 'ab', 'bcbe', np.nan])
        first = with_nan.str.index('b')
        tm.assert_series_equal(first, Series([1, 1, 0, np.nan]))
        last = with_nan.str.rindex('b')
        tm.assert_series_equal(last, Series([3, 1, 2, np.nan]))

    def test_pad(self):
        """pad fills to width 5 on the chosen side; non-strings give NA."""
        subject = Series(['a', 'b', NA, 'c', NA, 'eeeeee'])
        padded_by_side = [
            ('left', ['    a', '    b', NA, '    c', NA, 'eeeeee']),
            ('right', ['a    ', 'b    ', NA, 'c    ', NA, 'eeeeee']),
            ('both', ['  a  ', '  b  ', NA, '  c  ', NA, 'eeeeee']),
        ]
        for side, padded in padded_by_side:
            result = subject.str.pad(5, side=side)
            tm.assert_almost_equal(result, Series(padded))

        # mixed
        mixed_by_side = [
            ('left', ['    a', NA, '    b', NA, NA, '   ee', NA, NA, NA]),
            ('right', ['a    ', NA, 'b    ', NA, NA, 'ee   ', NA, NA, NA]),
            ('both', ['  a  ', NA, '  b  ', NA, NA, '  ee ', NA, NA, NA]),
        ]
        for side, padded in mixed_by_side:
            # The mixed input is rebuilt for every side.
            mixed = Series(['a', NA, 'b', True, datetime.today(), 'ee',
                            None, 1, 2.])

            rs = Series(mixed).str.pad(5, side=side)
            xp = Series(padded)

            assert isinstance(rs, Series)
            tm.assert_almost_equal(rs, xp)

        # unicode
        subject = Series([u('a'), u('b'), NA, u('c'), NA, u('eeeeee')])
        unicode_by_side = [
            ('left',
             [u('    a'), u('    b'), NA, u('    c'), NA, u('eeeeee')]),
            ('right',
             [u('a    '), u('b    '), NA, u('c    '), NA, u('eeeeee')]),
            ('both',
             [u('  a  '), u('  b  '), NA, u('  c  '), NA, u('eeeeee')]),
        ]
        for side, padded in unicode_by_side:
            result = subject.str.pad(5, side=side)
            tm.assert_almost_equal(result, Series(padded))

    def test_pad_fillchar(self):
        """pad uses the given fill character and validates its type."""
        subject = Series(['a', 'b', NA, 'c', NA, 'eeeeee'])

        padded_by_side = [
            ('left', ['XXXXa', 'XXXXb', NA, 'XXXXc', NA, 'eeeeee']),
            ('right', ['aXXXX', 'bXXXX', NA, 'cXXXX', NA, 'eeeeee']),
            ('both', ['XXaXX', 'XXbXX', NA, 'XXcXX', NA, 'eeeeee']),
        ]
        for side, padded in padded_by_side:
            result = subject.str.pad(5, side=side, fillchar='X')
            tm.assert_almost_equal(result, Series(padded))

        # A fill value that is longer than one character, or not a string
        # at all, must be rejected.
        invalid = [
            ('XY', "fillchar must be a character, not str"),
            (5, "fillchar must be a character, not int"),
        ]
        for bad_fill, message in invalid:
            with tm.assert_raises_regex(TypeError, message):
                subject.str.pad(5, fillchar=bad_fill)

    def test_pad_width(self):
        """Every padding method rejects a non-integer width with TypeError."""
        # GH 13598
        s = Series(['1', '22', 'a', 'bb'])

        # The width passed below is the str 'f', so the message is expected
        # to name ``str``.  A pattern ending in "not*" would, read as a
        # regex, only require "no" followed by any number of "t" and so
        # would never check the reported type name.
        for f in ['center', 'ljust', 'rjust', 'zfill', 'pad']:
            with tm.assert_raises_regex(TypeError,
                                        "width must be of "
                                        "integer type, not str"):
                getattr(s.str, f)('f')

    def test_translate(self):
        """translate applies a character table on both Series and Index."""

        def _assert_same(result, expected):
            # Pick the comparison that fits the container type.
            if not isinstance(result, Series):
                tm.assert_index_equal(result, expected)
            else:
                tm.assert_series_equal(result, expected)

        # The table is the same for every container and is needed again
        # after the loop, so it is built once up front.
        if compat.PY3:
            table = str.maketrans('abc', 'cde')
        else:
            import string
            table = string.maketrans('abc', 'cde')

        for klass in (Series, Index):
            s = klass(['abcdefg', 'abcc', 'cdddfg', 'cdefggg'])
            translated = s.str.translate(table)
            _assert_same(translated,
                         klass(['cdedefg', 'cdee', 'edddfg', 'edefggg']))

            # use of deletechars is python 2 only
            if compat.PY3:
                with tm.assert_raises_regex(
                        ValueError, "deletechars is not a valid argument"):
                    s.str.translate(table, deletechars='fg')
            else:
                translated = s.str.translate(table, deletechars='fg')
                _assert_same(translated,
                             klass(['cdede', 'cdee', 'eddd', 'ede']))

                translated = s.str.translate(None, deletechars='fg')
                _assert_same(translated,
                             klass(['abcde', 'abcc', 'cddd', 'cde']))

        # Series with non-string values
        with_float = Series(['a', 'b', 'c', 1.2])
        wanted = Series(['c', 'd', 'e', np.nan])
        translated = with_float.str.translate(table)
        tm.assert_series_equal(translated, wanted)

    def test_center_ljust_rjust(self):
        """center/ljust/rjust pad to width 5; non-strings give NA."""
        subject = Series(['a', 'b', NA, 'c', NA, 'eeeeee'])
        padded_by_method = [
            ('center', ['  a  ', '  b  ', NA, '  c  ', NA, 'eeeeee']),
            ('ljust', ['a    ', 'b    ', NA, 'c    ', NA, 'eeeeee']),
            ('rjust', ['    a', '    b', NA, '    c', NA, 'eeeeee']),
        ]
        for name, padded in padded_by_method:
            result = getattr(subject.str, name)(5)
            tm.assert_almost_equal(result, Series(padded))

        # mixed
        mixed = Series(['a', NA, 'b', True, datetime.today(), 'c', 'eee', None,
                        1, 2.])
        mixed_by_method = [
            ('center',
             ['  a  ', NA, '  b  ', NA, NA, '  c  ', ' eee ', NA, NA, NA]),
            ('ljust',
             ['a    ', NA, 'b    ', NA, NA, 'c    ', 'eee  ', NA, NA, NA]),
            ('rjust',
             ['    a', NA, '    b', NA, NA, '    c', '  eee', NA, NA, NA]),
        ]
        for name, padded in mixed_by_method:
            rs = getattr(Series(mixed).str, name)(5)
            xp = Series(padded)
            assert isinstance(rs, Series)
            tm.assert_almost_equal(rs, xp)

        # unicode
        subject = Series([u('a'), u('b'), NA, u('c'), NA, u('eeeeee')])
        unicode_by_method = [
            ('center',
             [u('  a  '), u('  b  '), NA, u('  c  '), NA, u('eeeeee')]),
            ('ljust',
             [u('a    '), u('b    '), NA, u('c    '), NA, u('eeeeee')]),
            ('rjust',
             [u('    a'), u('    b'), NA, u('    c'), NA, u('eeeeee')]),
        ]
        for name, padded in unicode_by_method:
            result = getattr(subject.str, name)(5)
            tm.assert_almost_equal(result, Series(padded))

    def test_center_ljust_rjust_fillchar(self):
        """center/ljust/rjust use the given fillchar and validate its type."""
        values = Series(['a', 'bb', 'cccc', 'ddddd', 'eeeeee'])

        filled_by_method = [
            ('center', ['XXaXX', 'XXbbX', 'Xcccc', 'ddddd', 'eeeeee']),
            ('ljust', ['aXXXX', 'bbXXX', 'ccccX', 'ddddd', 'eeeeee']),
            ('rjust', ['XXXXa', 'XXXbb', 'Xcccc', 'ddddd', 'eeeeee']),
        ]
        for name, filled in filled_by_method:
            result = getattr(values.str, name)(5, fillchar='X')
            tm.assert_series_equal(result, Series(filled))
            # Cross-check against the same-named builtin str method.
            expected = np.array(
                [getattr(v, name)(5, 'X') for v in values.values],
                dtype=np.object_)
            tm.assert_numpy_array_equal(result.values, expected)

        # If fillchar is not a character, normal str raises TypeError
        # 'aaa'.ljust(5, 'XY')
        # TypeError: must be char, not str
        invalid = [
            ('XY', "fillchar must be a character, not str"),
            (1, "fillchar must be a character, not int"),
        ]
        for bad_fill, message in invalid:
            for name in ('center', 'ljust', 'rjust'):
                with tm.assert_raises_regex(TypeError, message):
                    getattr(values.str, name)(5, fillchar=bad_fill)

    def test_zfill(self):
        values = Series(['1', '22', 'aaa', '333', '45678'])

        result = values.str.zfill(5)
        expected = Series(['00001', '00022', '00aaa', '00333', '45678'])
        tm.assert_series_equal(result, expected)
        expected = np.array([v.zfill(5) for v in values.values],
                            dtype=np.object_)
        tm.assert_numpy_array_equal(result.values, expected)

        result = values.str.zfill(3)
        expected = Series(['001', '022', 'aaa', '333', '45678'])
        tm.assert_series_equal(result, expected)
        expected = np.array([v.zfill(3) for v in values.values],
                            dtype=np.object_)
        tm.assert_numpy_array_equal(result.values, expected)

        values = Series(['1', np.nan, 'aaa', np.nan, '45678'])
        result = values.str.zfill(5)
        expected = Series(['00001', np.nan, '00aaa', np.nan, '45678'])
        tm.assert_series_equal(result, expected)

    def test_split(self):
        """split breaks strings on a separator; non-strings give NA."""
        subject = Series(['a_b_c', 'c_d_e', NA, 'f_g_h'])

        pieces = subject.str.split('_')
        exp = Series([['a', 'b', 'c'], ['c', 'd', 'e'], NA, ['f', 'g', 'h']])
        tm.assert_series_equal(pieces, exp)

        # more than one char: same expected pieces as for the single '_'
        subject = Series(['a__b__c', 'c__d__e', NA, 'f__g__h'])
        pieces = subject.str.split('__')
        tm.assert_series_equal(pieces, exp)

        pieces = subject.str.split('__', expand=False)
        tm.assert_series_equal(pieces, exp)

        # mixed
        mixed = Series(['a_b_c', NA, 'd_e_f', True, datetime.today(), None, 1,
                        2.])
        pieces = mixed.str.split('_')
        exp = Series(
            [['a', 'b', 'c'], NA, ['d', 'e', 'f'], NA, NA, NA, NA, NA])
        assert isinstance(pieces, Series)
        tm.assert_almost_equal(pieces, exp)

        pieces = mixed.str.split('_', expand=False)
        assert isinstance(pieces, Series)
        tm.assert_almost_equal(pieces, exp)

        # unicode
        subject = Series([u('a_b_c'), u('c_d_e'), NA, u('f_g_h')])

        pieces = subject.str.split('_')
        exp = Series([[u('a'), u('b'), u('c')],
                      [u('c'), u('d'), u('e')],
                      NA,
                      [u('f'), u('g'), u('h')]])
        tm.assert_series_equal(pieces, exp)

        pieces = subject.str.split('_', expand=False)
        tm.assert_series_equal(pieces, exp)

        # regex split
        subject = Series([u('a,b_c'), u('c_d,e'), NA, u('f,g,h')])
        pieces = subject.str.split('[,_]')
        exp = Series([[u('a'), u('b'), u('c')],
                      [u('c'), u('d'), u('e')],
                      NA,
                      [u('f'), u('g'), u('h')]])
        tm.assert_series_equal(pieces, exp)

    def test_rsplit(self):
        """Check list-returning ``str.rsplit`` for several kinds of input."""
        pieces = Series([['a', 'b', 'c'], ['c', 'd', 'e'], NA,
                         ['f', 'g', 'h']])

        single = Series(['a_b_c', 'c_d_e', NA, 'f_g_h'])
        tm.assert_series_equal(single.str.rsplit('_'), pieces)

        # more than one char
        double = Series(['a__b__c', 'c__d__e', NA, 'f__g__h'])
        for kwargs in ({}, {'expand': False}):
            tm.assert_series_equal(double.str.rsplit('__', **kwargs), pieces)

        # mixed: the expected output holds NA for every non-string entry
        mixed = Series(['a_b_c', NA, 'd_e_f', True, datetime.today(), None, 1,
                        2.])
        mixed_pieces = Series([['a', 'b', 'c'], NA, ['d', 'e', 'f'],
                               NA, NA, NA, NA, NA])
        for kwargs in ({}, {'expand': False}):
            got = mixed.str.rsplit('_', **kwargs)
            assert isinstance(got, Series)
            tm.assert_almost_equal(got, mixed_pieces)

        # unicode
        upieces = Series([[u('a'), u('b'), u('c')], [u('c'), u('d'), u('e')],
                          NA, [u('f'), u('g'), u('h')]])
        utext = Series([u('a_b_c'), u('c_d_e'), NA, u('f_g_h')])
        for kwargs in ({}, {'expand': False}):
            tm.assert_series_equal(utext.str.rsplit('_', **kwargs), upieces)

        # regex split is not supported by rsplit: the pattern is expected to
        # be taken literally, so nothing is split
        regex_text = Series([u('a,b_c'), u('c_d,e'), NA, u('f,g,h')])
        unsplit = Series([[u('a,b_c')], [u('c_d,e')], NA, [u('f,g,h')]])
        tm.assert_series_equal(regex_text.str.rsplit('[,_]'), unsplit)

        # setting max number of splits, make sure it's from reverse
        limited = Series(['a_b_c', 'c_d_e', NA, 'f_g_h']).str.rsplit('_', n=1)
        tail_split = Series([['a_b', 'c'], ['c_d', 'e'], NA, ['f_g', 'h']])
        tm.assert_series_equal(limited, tail_split)

    def test_split_noargs(self):
        """``split``/``rsplit`` called without arguments (#1859)."""
        names = Series(['Wes McKinney', 'Travis  Oliphant'])
        # the doubled space must not produce an empty piece
        wanted = ['Travis', 'Oliphant']

        forward = names.str.split()
        assert forward[1] == wanted

        backward = names.str.rsplit()
        assert backward[1] == wanted

    def test_split_maxsplit(self):
        """``n=-1`` and ``n=0`` must both give the same result as no ``n``."""
        # re.split 0, str.split -1
        text = Series(['bd asdf jfg', 'kjasdflqw asdfnfk'])

        # first without a pattern, then with an explicit one
        for pat_args in ((), ('asdf',)):
            unlimited = text.str.split(*pat_args)
            for limit in (-1, 0):
                limited = text.str.split(*pat_args, n=limit)
                tm.assert_series_equal(limited, unlimited)

    def test_split_no_pat_with_nonzero_n(self):
        """``split(n=1)`` without a pattern performs exactly one split."""
        phrases = Series(['split once', 'split once too!'])
        wanted = Series({0: ['split', 'once'], 1: ['split', 'once too!']})

        got = phrases.str.split(n=1)

        # the dict-built expectation may carry a different index type
        tm.assert_series_equal(wanted, got, check_index_type=False)

    def test_split_to_dataframe(self):
        """``Series.str.split(expand=True)`` is compared against DataFrames."""
        # separator absent: a single column is expected
        text = Series(['nosplit', 'alsonosplit'])
        frame = DataFrame({0: Series(['nosplit', 'alsonosplit'])})
        tm.assert_frame_equal(text.str.split('_', expand=True), frame)

        # every row yields the same number of pieces
        text = Series(['some_equal_splits', 'with_no_nans'])
        frame = DataFrame({0: ['some', 'with'],
                           1: ['equal', 'no'],
                           2: ['splits', 'nans']})
        tm.assert_frame_equal(text.str.split('_', expand=True), frame)

        # rows of different length: the shorter row is expected to be
        # filled with NA in the trailing columns
        text = Series(['some_unequal_splits', 'one_of_these_things_is_not'])
        frame = DataFrame({0: ['some', 'one'],
                           1: ['unequal', 'of'],
                           2: ['splits', 'these'],
                           3: [NA, 'things'],
                           4: [NA, 'is'],
                           5: [NA, 'not']})
        tm.assert_frame_equal(text.str.split('_', expand=True), frame)

        # the input's index labels are expected on the output
        text = Series(['some_splits', 'with_index'], index=['preserve', 'me'])
        frame = DataFrame({0: ['some', 'with'], 1: ['splits', 'index']},
                          index=['preserve', 'me'])
        tm.assert_frame_equal(text.str.split('_', expand=True), frame)

        # a non-boolean ``expand`` must raise
        with tm.assert_raises_regex(ValueError, "expand must be"):
            text.str.split('_', expand="not_a_boolean")

    def test_split_to_multiindex_expand(self):
        """``Index.str.split(expand=True)`` is compared level by level."""
        # separator absent: the result must equal the input, with one level
        labels = Index(['nosplit', 'alsonosplit'])
        got = labels.str.split('_', expand=True)
        tm.assert_index_equal(got, labels)
        assert got.nlevels == 1

        # equal number of pieces per label
        labels = Index(['some_equal_splits', 'with_no_nans'])
        got = labels.str.split('_', expand=True)
        wanted = MultiIndex.from_tuples([('some', 'equal', 'splits'),
                                         ('with', 'no', 'nans')])
        tm.assert_index_equal(got, wanted)
        assert got.nlevels == 3

        # unequal number of pieces: the shorter tuple is padded with NA
        labels = Index(['some_unequal_splits', 'one_of_these_things_is_not'])
        got = labels.str.split('_', expand=True)
        wanted = MultiIndex.from_tuples(
            [('some', 'unequal', 'splits', NA, NA, NA),
             ('one', 'of', 'these', 'things', 'is', 'not')])
        tm.assert_index_equal(got, wanted)
        assert got.nlevels == 6

        # a non-boolean ``expand`` must raise
        with tm.assert_raises_regex(ValueError, "expand must be"):
            labels.str.split('_', expand="not_a_boolean")

    def test_rsplit_to_dataframe_expand(self):
        """``Series.str.rsplit(expand=True)`` is compared against frames."""
        # separator absent: a single column is expected
        text = Series(['nosplit', 'alsonosplit'])
        frame = DataFrame({0: Series(['nosplit', 'alsonosplit'])})
        tm.assert_frame_equal(text.str.rsplit('_', expand=True), frame)

        text = Series(['some_equal_splits', 'with_no_nans'])

        # no limit, and a limit of two, are both expected to split fully
        for kwargs in ({}, {'n': 2}):
            got = text.str.rsplit('_', expand=True, **kwargs)
            frame = DataFrame({0: ['some', 'with'],
                               1: ['equal', 'no'],
                               2: ['splits', 'nans']})
            tm.assert_frame_equal(got, frame)

        # a limit of one only splits off the last piece
        got = text.str.rsplit('_', expand=True, n=1)
        frame = DataFrame({0: ['some_equal', 'with_no'],
                           1: ['splits', 'nans']})
        tm.assert_frame_equal(got, frame)

        # the input's index labels are expected on the output
        text = Series(['some_splits', 'with_index'], index=['preserve', 'me'])
        got = text.str.rsplit('_', expand=True)
        frame = DataFrame({0: ['some', 'with'], 1: ['splits', 'index']},
                          index=['preserve', 'me'])
        tm.assert_frame_equal(got, frame)

    def test_rsplit_to_multiindex_expand(self):
        """``Index.str.rsplit(expand=True)`` is compared level by level."""
        # separator absent: the result must equal the input, with one level
        labels = Index(['nosplit', 'alsonosplit'])
        got = labels.str.rsplit('_', expand=True)
        tm.assert_index_equal(got, labels)
        assert got.nlevels == 1

        # no limit: three levels
        labels = Index(['some_equal_splits', 'with_no_nans'])
        got = labels.str.rsplit('_', expand=True)
        wanted = MultiIndex.from_tuples([('some', 'equal', 'splits'),
                                         ('with', 'no', 'nans')])
        tm.assert_index_equal(got, wanted)
        assert got.nlevels == 3

        # limit of one: only the last piece is split off, two levels
        labels = Index(['some_equal_splits', 'with_no_nans'])
        got = labels.str.rsplit('_', expand=True, n=1)
        wanted = MultiIndex.from_tuples([('some_equal', 'splits'),
                                         ('with_no', 'nans')])
        tm.assert_index_equal(got, wanted)
        assert got.nlevels == 2

    def test_split_with_name(self):
        """Name handling of ``str.split`` on Series and Index (GH 12617)."""
        named = Series(['a,b', 'c,d'], name='xxx')

        # should preserve name
        got = named.str.split(',')
        wanted = Series([['a', 'b'], ['c', 'd']], name='xxx')
        tm.assert_series_equal(got, wanted)

        # expanded result is compared with an unnamed two-column frame
        got = named.str.split(',', expand=True)
        wanted = DataFrame([['a', 'b'], ['c', 'd']])
        tm.assert_frame_equal(got, wanted)

        labels = Index(['a,b', 'c,d'], name='xxx')

        # unexpanded Index result keeps one level and the name
        got = labels.str.split(',')
        wanted = Index([['a', 'b'], ['c', 'd']], name='xxx')
        assert got.nlevels == 1
        tm.assert_index_equal(got, wanted)

        # expanded Index result is compared with an unnamed MultiIndex
        got = labels.str.split(',', expand=True)
        wanted = MultiIndex.from_tuples([('a', 'b'), ('c', 'd')])
        assert got.nlevels == 2
        tm.assert_index_equal(got, wanted)

    def test_partition_series(self):
        """Check tuple-returning ``partition``/``rpartition`` on a Series."""
        # each case: input data, positional separator arguments, expected
        # ``partition`` tuples, expected ``rpartition`` tuples
        cases = [
            # single-character separator
            (['a_b_c', 'c_d_e', NA, 'f_g_h'], ('_',),
             [('a', '_', 'b_c'), ('c', '_', 'd_e'), NA, ('f', '_', 'g_h')],
             [('a_b', '_', 'c'), ('c_d', '_', 'e'), NA, ('f_g', '_', 'h')]),
            # more than one char
            (['a__b__c', 'c__d__e', NA, 'f__g__h'], ('__',),
             [('a', '__', 'b__c'), ('c', '__', 'd__e'), NA,
              ('f', '__', 'g__h')],
             [('a__b', '__', 'c'), ('c__d', '__', 'e'), NA,
              ('f__g', '__', 'h')]),
            # None: no separator passed
            (['a b c', 'c d e', NA, 'f g h'], (),
             [('a', ' ', 'b c'), ('c', ' ', 'd e'), NA, ('f', ' ', 'g h')],
             [('a b', ' ', 'c'), ('c d', ' ', 'e'), NA, ('f g', ' ', 'h')]),
            # separator not present in the strings
            (['abc', 'cde', NA, 'fgh'], ('_',),
             [('abc', '', ''), ('cde', '', ''), NA, ('fgh', '', '')],
             [('', '', 'abc'), ('', '', 'cde'), NA, ('', '', 'fgh')]),
            # unicode
            ([u'a_b_c', u'c_d_e', NA, u'f_g_h'], ('_',),
             [(u'a', u'_', u'b_c'), (u'c', u'_', u'd_e'),
              NA, (u'f', u'_', u'g_h')],
             [(u'a_b', u'_', u'c'), (u'c_d', u'_', u'e'),
              NA, (u'f_g', u'_', u'h')]),
        ]
        for data, sep_args, forward, backward in cases:
            values = Series(data)

            got = values.str.partition(*sep_args, expand=False)
            tm.assert_series_equal(got, Series(forward))

            got = values.str.rpartition(*sep_args, expand=False)
            tm.assert_series_equal(got, Series(backward))

        # compare to standard lib
        values = Series(['A_B_C', 'B_C_D', 'E_F_G', 'EFGHEF'])
        as_list = values.str.partition('_', expand=False).tolist()
        assert as_list == [item.partition('_') for item in values]
        as_list = values.str.rpartition('_', expand=False).tolist()
        assert as_list == [item.rpartition('_') for item in values]

    def test_partition_index(self):
        """Check ``partition``/``rpartition`` on an Index, both expand modes."""
        labels = Index(['a_b_c', 'c_d_e', 'f_g_h'])
        forward = [('a', '_', 'b_c'), ('c', '_', 'd_e'), ('f', '_', 'g_h')]
        backward = [('a_b', '_', 'c'), ('c_d', '_', 'e'), ('f_g', '_', 'h')]

        # expand=False: a single-level result
        got = labels.str.partition('_', expand=False)
        tm.assert_index_equal(got, Index(np.array(forward)))
        assert got.nlevels == 1

        got = labels.str.rpartition('_', expand=False)
        tm.assert_index_equal(got, Index(np.array(backward)))
        assert got.nlevels == 1

        # default: a three-level MultiIndex
        got = labels.str.partition('_')
        tm.assert_index_equal(got, Index(forward))
        assert isinstance(got, MultiIndex)
        assert got.nlevels == 3

        got = labels.str.rpartition('_')
        tm.assert_index_equal(got, Index(backward))
        assert isinstance(got, MultiIndex)
        assert got.nlevels == 3

    def test_partition_to_dataframe(self):
        """``partition``/``rpartition`` on a Series give three-column frames."""
        # the default and an explicit ``expand=True`` must behave the same
        for kwargs in ({}, {'expand': True}):
            values = Series(['a_b_c', 'c_d_e', NA, 'f_g_h'])

            got = values.str.partition('_', **kwargs)
            wanted = DataFrame({0: ['a', 'c', np.nan, 'f'],
                                1: ['_', '_', np.nan, '_'],
                                2: ['b_c', 'd_e', np.nan, 'g_h']})
            tm.assert_frame_equal(got, wanted)

            got = values.str.rpartition('_', **kwargs)
            wanted = DataFrame({0: ['a_b', 'c_d', np.nan, 'f_g'],
                                1: ['_', '_', np.nan, '_'],
                                2: ['c', 'e', np.nan, 'h']})
            tm.assert_frame_equal(got, wanted)

    def test_partition_with_name(self):
        """Name handling of ``str.partition`` on Series/Index (GH 12617)."""
        named = Series(['a,b', 'c,d'], name='xxx')

        # expanded result is compared with an unnamed frame
        got = named.str.partition(',')
        wanted = DataFrame({0: ['a', 'c'], 1: [',', ','], 2: ['b', 'd']})
        tm.assert_frame_equal(got, wanted)

        # should preserve name
        got = named.str.partition(',', expand=False)
        wanted = Series([('a', ',', 'b'), ('c', ',', 'd')], name='xxx')
        tm.assert_series_equal(got, wanted)

        labels = Index(['a,b', 'c,d'], name='xxx')

        # expanded Index result is compared with an unnamed MultiIndex
        got = labels.str.partition(',')
        wanted = MultiIndex.from_tuples([('a', ',', 'b'), ('c', ',', 'd')])
        assert got.nlevels == 3
        tm.assert_index_equal(got, wanted)

        # should preserve name
        got = labels.str.partition(',', expand=False)
        wanted = Index(np.array([('a', ',', 'b'), ('c', ',', 'd')]),
                       name='xxx')
        assert got.nlevels == 1
        tm.assert_index_equal(got, wanted)

    def test_pipe_failures(self):
        """A literal ``|`` works as pattern for split and replace (#2119)."""
        piped = Series(['A|B|C'])

        pieces = piped.str.split('|')
        tm.assert_series_equal(pieces, Series([['A', 'B', 'C']]))

        spaced = piped.str.replace('|', ' ')
        tm.assert_series_equal(spaced, Series(['A B C']))

    def test_slice(self):
        """Check ``str.slice`` on plain, mixed-type and unicode Series."""
        values = Series(['aafootwo', 'aabartwo', NA, 'aabazqux'])

        result = values.str.slice(2, 5)
        exp = Series(['foo', 'bar', NA, 'baz'])
        tm.assert_series_equal(result, exp)

        # compare with Python's own slicing for several start/stop/step
        # combinations, including negative steps
        for start, stop, step in [(0, 3, -1), (None, None, -1), (3, 10, 2),
                                  (3, 0, -1)]:
            try:
                result = values.str.slice(start, stop, step)
                expected = Series([s[start:stop:step] if not isna(s) else NA
                                   for s in values])
                tm.assert_series_equal(result, expected)
            except Exception:
                # report the failing combination, then let the error surface
                print('failed on %s:%s:%s' % (start, stop, step))
                raise

        # mixed
        mixed = Series(['aafootwo', NA, 'aabartwo', True, datetime.today(),
                        None, 1, 2.])

        rs = Series(mixed).str.slice(2, 5)
        xp = Series(['foo', NA, 'bar', NA, NA, NA, NA, NA])

        assert isinstance(rs, Series)
        tm.assert_almost_equal(rs, xp)

        # Reversed slice on mixed data.  With a negative step the start must
        # lie to the right of the stop: [4:1:-1] walks indices 4, 3, 2 and so
        # yields the reversed 'foo' / 'bar'.  (A [2:5:-1] slice would select
        # nothing.)
        rs = Series(mixed).str.slice(4, 1, -1)
        xp = Series(['oof', NA, 'rab', NA, NA, NA, NA, NA])

        assert isinstance(rs, Series)
        tm.assert_almost_equal(rs, xp)

        # unicode
        values = Series([u('aafootwo'), u('aabartwo'), NA, u('aabazqux')])

        result = values.str.slice(2, 5)
        exp = Series([u('foo'), u('bar'), NA, u('baz')])
        tm.assert_series_equal(result, exp)

        result = values.str.slice(0, -1, 2)
        exp = Series([u('afow'), u('abrw'), NA, u('abzu')])
        tm.assert_series_equal(result, exp)

    def test_slice_replace(self):
        """Table-driven check of ``str.slice_replace``."""
        values = Series(['short', 'a bit longer', 'evenlongerthanthat', '', NA
                         ])

        # (positional arguments, expected values)
        cases = [
            # no replacement text given: the slice is simply removed
            ((2, 3),
             ['shrt', 'a it longer', 'evnlongerthanthat', '', NA]),
            ((2, 3, 'z'),
             ['shzrt', 'a zit longer', 'evznlongerthanthat', 'z', NA]),
            # empty slice: the text is inserted
            ((2, 2, 'z'),
             ['shzort', 'a zbit longer', 'evzenlongerthanthat', 'z', NA]),
            # stop before start gives the same result as the empty slice
            ((2, 1, 'z'),
             ['shzort', 'a zbit longer', 'evzenlongerthanthat', 'z', NA]),
            ((-1, None, 'z'),
             ['shorz', 'a bit longez', 'evenlongerthanthaz', 'z', NA]),
            ((None, -2, 'z'),
             ['zrt', 'zer', 'zat', 'z', NA]),
            ((6, 8, 'z'),
             ['shortz', 'a bit znger', 'evenlozerthanthat', 'z', NA]),
            ((-10, 3, 'z'),
             ['zrt', 'a zit longer', 'evenlongzerthanthat', 'z', NA]),
        ]
        for args, wanted in cases:
            got = values.str.slice_replace(*args)
            tm.assert_series_equal(got, Series(wanted))

    def test_strip_lstrip_rstrip(self):
        """Whitespace stripping on both sides, the left and the right."""
        padded = Series(['  aa   ', ' bb \n', NA, 'cc  '])
        cases = [('strip', ['aa', 'bb', NA, 'cc']),
                 ('lstrip', ['aa   ', 'bb \n', NA, 'cc  ']),
                 ('rstrip', ['  aa', ' bb', NA, 'cc'])]

        for method, wanted in cases:
            got = getattr(padded.str, method)()
            tm.assert_series_equal(got, Series(wanted))

    def test_strip_lstrip_rstrip_mixed(self):
        """Stripping a mixed-type Series: non-strings are expected as NA."""
        # mixed
        mixed = Series(['  aa  ', NA, ' bb \t\n', True, datetime.today(), None,
                        1, 2.])
        cases = [('strip', ['aa', NA, 'bb', NA, NA, NA, NA, NA]),
                 ('lstrip', ['aa  ', NA, 'bb \t\n', NA, NA, NA, NA, NA]),
                 ('rstrip', ['  aa', NA, ' bb', NA, NA, NA, NA, NA])]

        for method, wanted in cases:
            got = getattr(Series(mixed).str, method)()
            assert isinstance(got, Series)
            tm.assert_almost_equal(got, Series(wanted))

    def test_strip_lstrip_rstrip_unicode(self):
        """Whitespace stripping on unicode input."""
        # unicode
        padded = Series([u('  aa   '), u(' bb \n'), NA, u('cc  ')])
        cases = [('strip', [u('aa'), u('bb'), NA, u('cc')]),
                 ('lstrip', [u('aa   '), u('bb \n'), NA, u('cc  ')]),
                 ('rstrip', [u('  aa'), u(' bb'), NA, u('cc')])]

        for method, wanted in cases:
            got = getattr(padded.str, method)()
            tm.assert_series_equal(got, Series(wanted))

    def test_strip_lstrip_rstrip_args(self):
        """Stripping an explicit character instead of whitespace."""
        wrapped = Series(['xxABCxx', 'xx BNSD', 'LDFJH xx'])
        cases = [('strip', ['ABC', ' BNSD', 'LDFJH ']),
                 ('lstrip', ['ABCxx', ' BNSD', 'LDFJH xx']),
                 ('rstrip', ['xxABC', 'xx BNSD', 'LDFJH '])]

        for method, wanted in cases:
            got = getattr(wrapped.str, method)('x')
            assert_series_equal(got, Series(wanted))

    def test_strip_lstrip_rstrip_args_unicode(self):
        """Stripping an explicit unicode character from unicode input."""
        wrapped = Series([u('xxABCxx'), u('xx BNSD'), u('LDFJH xx')])
        cases = [('strip', ['ABC', ' BNSD', 'LDFJH ']),
                 ('lstrip', ['ABCxx', ' BNSD', 'LDFJH xx']),
                 ('rstrip', ['xxABC', 'xx BNSD', 'LDFJH '])]

        for method, wanted in cases:
            got = getattr(wrapped.str, method)(u('x'))
            assert_series_equal(got, Series(wanted))

    def test_wrap(self):
        """Check ``str.wrap`` at width 12 and with padded/NaN/non-ASCII data."""
        # inputs, in order: two words shorter than / equal to / longer than
        # the width, one word shorter than / equal to / longer than the
        # width, multiple tokens with trailing whitespace equal to the
        # width, the same tokens with one extra character, and a lone tab
        inputs = Series([u('hello world'),
                         u('hello world!'),
                         u('hello world!!'),
                         u('abcdefabcde'),
                         u('abcdefabcdef'),
                         u('abcdefabcdefa'),
                         u('ab ab ab ab '),
                         u('ab ab ab ab a'),
                         u('\t')])

        # expected values
        wrapped = Series([u('hello world'),
                          u('hello world!'),
                          u('hello\nworld!!'),
                          u('abcdefabcde'),
                          u('abcdefabcdef'),
                          u('abcdefabcdef\na'),
                          u('ab ab ab ab'),
                          u('ab ab ab ab\na'),
                          u('')])

        got = inputs.str.wrap(12, break_long_words=True)
        assert_series_equal(got, wrapped)

        # test with pre and post whitespace (non-unicode), NaN, and non-ascii
        # Unicode
        inputs = Series(['  pre  ', np.nan,
                         u('\xac\u20ac\U00008000 abadcafe')])
        wrapped = Series(['  pre', NA, u('\xac\u20ac\U00008000 ab\nadcafe')])
        got = inputs.str.wrap(6)
        assert_series_equal(got, wrapped)

    def test_get(self):
        """Check ``str.get`` on the lists produced by ``str.split``."""
        text = Series(['a_b_c', 'c_d_e', np.nan, 'f_g_h'])
        second = text.str.split('_').str.get(1)
        tm.assert_series_equal(second, Series(['b', 'd', np.nan, 'g']))

        # mixed: non-string entries are expected as NA
        mixed = Series(['a_b_c', NA, 'c_d_e', True, datetime.today(), None, 1,
                        2.])
        second = Series(mixed).str.split('_').str.get(1)
        wanted = Series(['b', NA, 'd', NA, NA, NA, NA, NA])
        assert isinstance(second, Series)
        tm.assert_almost_equal(second, wanted)

        # unicode
        text = Series([u('a_b_c'), u('c_d_e'), np.nan, u('f_g_h')])
        second = text.str.split('_').str.get(1)
        wanted = Series([u('b'), u('d'), np.nan, u('g')])
        tm.assert_series_equal(second, wanted)

        # bounds testing: the last row has only two pieces, so both a
        # positive and a negative index fall outside it and NaN is expected
        text = Series(['1_2_3_4_5', '6_7_8_9_10', '11_12'])
        for position in (2, -3):
            picked = text.str.split('_').str.get(position)
            tm.assert_series_equal(picked, Series(['3', '8', np.nan]))

    def test_more_contains(self):
        """Table-driven check of ``str.contains`` with/without ``case``."""
        # PR #1179
        words = Series(['A', 'B', 'C', 'Aaba', 'Baca', '', NA,
                        'CABA', 'dog', 'cat'])

        # (pattern, keyword arguments, expected flags)
        cases = [
            ('a', {},
             [False, False, False, True, True, False, np.nan,
              False, False, True]),
            ('a', {'case': False},
             [True, False, False, True, True, False, np.nan, True,
              False, True]),
            ('Aa', {},
             [False, False, False, True, False, False, np.nan,
              False, False, False]),
            ('ba', {},
             [False, False, False, True, False, False, np.nan,
              False, False, False]),
            ('ba', {'case': False},
             [False, False, False, True, True, False, np.nan,
              True, False, False]),
        ]
        for pattern, kwargs, flags in cases:
            got = words.str.contains(pattern, **kwargs)
            assert_series_equal(got, Series(flags))

    def test_contains_nan(self):
        """``str.contains`` on an all-NaN Series for several ``na`` values."""
        # PR #14171
        all_missing = Series([np.nan, np.nan, np.nan], dtype=np.object_)

        # (keyword arguments, expected values, expected dtype)
        cases = [
            ({'na': False}, [False, False, False], np.bool_),
            ({'na': True}, [True, True, True], np.bool_),
            ({'na': "foo"}, ["foo", "foo", "foo"], np.object_),
            # without ``na`` the missing values stay missing
            ({}, [np.nan, np.nan, np.nan], np.object_),
        ]
        for kwargs, fill, dtype in cases:
            got = all_missing.str.contains('foo', **kwargs)
            assert_series_equal(got, Series(fill, dtype=dtype))

    def test_more_replace(self):
        """Table-driven check of ``str.replace`` with/without ``case``."""
        # PR #1179
        words = Series(['A', 'B', 'C', 'Aaba', 'Baca', '', NA, 'CABA',
                        'dog', 'cat'])

        # (pattern, replacement, keyword arguments, expected values)
        cases = [
            ('A', 'YYY', {},
             ['YYY', 'B', 'C', 'YYYaba', 'Baca', '', NA,
              'CYYYBYYY', 'dog', 'cat']),
            ('A', 'YYY', {'case': False},
             ['YYY', 'B', 'C', 'YYYYYYbYYY', 'BYYYcYYY', '', NA,
              'CYYYBYYY', 'dog', 'cYYYt']),
            ('^.a|dog', 'XX-XX ', {'case': False},
             ['A', 'B', 'C', 'XX-XX ba', 'XX-XX ca', '', NA,
              'XX-XX BA', 'XX-XX ', 'XX-XX t']),
        ]
        for pattern, repl, kwargs, wanted in cases:
            got = words.str.replace(pattern, repl, **kwargs)
            assert_series_equal(got, Series(wanted))

    def test_string_slice_get_syntax(self):
        """Indexing ``.str[...]`` must match ``str.get``/``str.slice``."""
        words = Series(['YYY', 'B', 'C', 'YYYYYYbYYY', 'BYYYcYYY', NA,
                        'CYYYBYYY', 'dog', 'cYYYt'])

        # integer index <-> get
        assert_series_equal(words.str[0], words.str.get(0))

        # slice with only a stop <-> slice(stop=...)
        assert_series_equal(words.str[:3], words.str.slice(stop=3))

        # slice with start and negative step <-> slice(start=..., step=...)
        assert_series_equal(words.str[2::-1],
                            words.str.slice(start=2, step=-1))

    def test_string_slice_out_of_bounds(self):
        """``.str[1]`` on elements that are too short is expected as NaN."""
        # tuples of different length
        tuples = Series([(1, 2), (1, ), (3, 4, 5)])
        assert_series_equal(tuples.str[1], Series([2, np.nan, 4]))

        # strings of different length
        words = Series(['foo', 'b', 'ba'])
        assert_series_equal(words.str[1], Series(['o', np.nan, 'a']))

    def test_match_findall_flags(self):
        """The ``flags`` argument is honoured by the regex-based methods."""
        emails = Series({'Dave': 'dave@google.com',
                         'Steve': 'steve@gmail.com',
                         'Rob': 'rob@gmail.com',
                         'Wes': np.nan})

        # the pattern is upper-case only, so the lower-case data can only
        # match when IGNORECASE is applied
        pat = r'([A-Z0-9._%+-]+)@([A-Z0-9.-]+)\.([A-Z]{2,4})'

        extracted = emails.str.extract(pat, flags=re.IGNORECASE, expand=True)
        assert extracted.iloc[0].tolist() == ['dave', 'google', 'com']

        matched = emails.str.match(pat, flags=re.IGNORECASE)
        assert matched[0]

        found = emails.str.findall(pat, flags=re.IGNORECASE)
        assert found[0][0] == ('dave', 'google', 'com')

        counted = emails.str.count(pat, flags=re.IGNORECASE)
        assert counted[0] == 1

        # ``contains`` is expected to emit a UserWarning for this pattern
        with tm.assert_produces_warning(UserWarning):
            contained = emails.str.contains(pat, flags=re.IGNORECASE)
        assert contained[0]

    def test_encode_decode(self):
        """``str.decode`` must agree with mapping ``.decode`` per element."""
        def decode_utf8(raw):
            return raw.decode('utf-8')

        text = Series([u('a'), u('b'), u('a\xe4')])
        encoded = text.str.encode('utf-8')

        decoded = encoded.str.decode('utf-8')
        wanted = encoded.map(decode_utf8)

        tm.assert_series_equal(decoded, wanted)

    def test_encode_decode_errors(self):
        """Error handling of ``str.encode``/``str.decode`` with cp1252."""
        def encode_ignoring(text):
            return text.encode('cp1252', 'ignore')

        def decode_ignoring(raw):
            return raw.decode('cp1252', 'ignore')

        # encoding: the default error mode must raise ...
        to_encode = Series([u('a'), u('b'), u('a\x9d')])
        with pytest.raises(UnicodeEncodeError):
            to_encode.str.encode('cp1252')

        # ... while 'ignore' must match the element-wise builtin call
        encoded = to_encode.str.encode('cp1252', 'ignore')
        tm.assert_series_equal(encoded, to_encode.map(encode_ignoring))

        # decoding: same two checks on bytes input
        to_decode = Series([b'a', b'b', b'a\x9d'])
        with pytest.raises(UnicodeDecodeError):
            to_decode.str.decode('cp1252')

        decoded = to_decode.str.decode('cp1252', 'ignore')
        tm.assert_series_equal(decoded, to_decode.map(decode_ignoring))

    def test_normalize(self):
        """Check ``str.normalize`` for NFKC, NFC and an invalid form."""
        labels = ['a', 'b', 'c', 'd', 'e']
        s = Series(['ABC', u'ＡＢＣ', u'１２３', np.nan, u'ｱｲｴ'], index=labels)

        # NFKC: the expected values replace the wide letters/digits and the
        # narrow kana of the input with their regular counterparts
        nfkc = Series([u'ABC', u'ABC', u'123', np.nan, u'アイエ'],
                      index=labels)
        tm.assert_series_equal(s.str.normalize('NFKC'), nfkc)

        # NFC: the expected values are the same characters as the input
        nfc = Series([u'ABC', u'ＡＢＣ', u'１２３', np.nan, u'ｱｲｴ'],
                     index=labels)
        tm.assert_series_equal(s.str.normalize('NFC'), nfc)

        # an unknown form must raise
        with tm.assert_raises_regex(ValueError,
                                    "invalid normalization form"):
            s.str.normalize('xxx')

        # the same NFKC check on an Index
        idx = Index([u'ＡＢＣ', u'１２３', u'ｱｲｴ'])
        wanted = Index([u'ABC', u'123', u'アイエ'])
        tm.assert_index_equal(idx.str.normalize('NFKC'), wanted)

    def test_cat_on_filtered_index(self):
        """``str.cat`` on Series whose index has gaps after filtering."""
        grid = MultiIndex.from_product([[2011, 2012], [1, 2, 3]],
                                       names=['year', 'month'])
        frame = DataFrame(index=grid).reset_index()

        # dropping month == 1 leaves an index that no longer starts at 0
        frame = frame[frame.month > 1]

        years = frame.year.astype('str')
        months = frame.month.astype('str')

        joined = years.str.cat(months, sep=' ')
        assert joined.loc[1] == '2011 2'

        joined_twice = years.str.cat([months, months], sep=' ')
        assert joined_twice.loc[1] == '2011 2 2'

    def test_str_cat_raises_intuitive_error(self):
        """Passing a separator positionally to ``str.cat`` gives a hint."""
        # https://github.com/pandas-dev/pandas/issues/11334
        letters = Series(['a', 'b', 'c', 'd'])
        hint = "Did you mean to supply a `sep` keyword?"

        for separator in ('|', '    '):
            with tm.assert_raises_regex(ValueError, hint):
                letters.str.cat(separator)

    def test_index_str_accessor_visibility(self):
        """Check which Series/Index contents expose the ``.str`` accessor.

        Values inferred as string or mixed must give a ``StringMethods``
        accessor. Floating, datetime64 and timedelta64 values, as well as
        any MultiIndex, must raise ``AttributeError``.
        """
        from pandas.core.strings import StringMethods

        # the inferred type of text data differs between Python 2 and 3
        if not compat.PY3:
            cases = [(['a', 'b'], 'string'), (['a', u('b')], 'mixed'),
                     ([u('a'), u('b')], 'unicode'),
                     (['a', 'b', 1], 'mixed-integer'),
                     (['a', 'b', 1.3], 'mixed'),
                     (['a', 'b', 1.3, 1], 'mixed-integer'),
                     (['aa', datetime(2011, 1, 1)], 'mixed')]
        else:
            cases = [(['a', 'b'], 'string'), (['a', u('b')], 'string'),
                     ([u('a'), u('b')], 'string'),
                     (['a', 'b', 1], 'mixed-integer'),
                     (['a', 'b', 1.3], 'mixed'),
                     (['a', 'b', 1.3, 1], 'mixed-integer'),
                     (['aa', datetime(2011, 1, 1)], 'mixed')]
        # accessor available on both Series and Index for these values
        for values, tp in cases:
            idx = Index(values)
            assert isinstance(Series(values).str, StringMethods)
            assert isinstance(idx.str, StringMethods)
            assert idx.inferred_type == tp

        # accessor refused for non-string data
        cases = [([1, np.nan], 'floating'),
                 ([datetime(2011, 1, 1)], 'datetime64'),
                 ([timedelta(1)], 'timedelta64')]
        for values, tp in cases:
            idx = Index(values)
            message = 'Can only use .str accessor with string values'
            with tm.assert_raises_regex(AttributeError, message):
                Series(values).str
            with tm.assert_raises_regex(AttributeError, message):
                idx.str
            assert idx.inferred_type == tp

        # MultiIndex has mixed dtype, but not allow to use accessor
        idx = MultiIndex.from_tuples([('a', 'b'), ('a', 'b')])
        assert idx.inferred_type == 'mixed'
        message = 'Can only use .str accessor with Index, not MultiIndex'
        with tm.assert_raises_regex(AttributeError, message):
            idx.str

    def test_str_accessor_no_new_attributes(self):
        """Setting an unknown attribute on the ``.str`` accessor must fail.

        See https://github.com/pandas-dev/pandas/issues/10673
        """
        letters = Series(list('aabbcde'))
        expected_msg = "You cannot add any new attribute"
        with tm.assert_raises_regex(AttributeError, expected_msg):
            letters.str.xlabel = "a"

    def test_method_on_bytes(self):
        """Check ``str.cat`` on object Series holding byte strings.

        On Python 3 the call is expected to raise ``TypeError``; otherwise
        the element-wise concatenation of the two Series is expected.
        """
        left = Series(np.array(list('abc'), dtype='S1').astype(object))
        right = Series(np.array(list('def'), dtype='S1').astype(object))

        if compat.PY3:
            # Resolve the bound method first so only the call itself is
            # covered by the ``raises`` check.
            cat = left.str.cat
            with pytest.raises(TypeError):
                cat(right)
            return

        combined = left.str.cat(right)
        expected = Series(
            np.array(['ad', 'be', 'cf'], dtype='S2').astype(object))
        tm.assert_series_equal(combined, expected)