# -*- coding: utf-8 -*-

"""
test where we are determining what we are grouping, or getting groups
"""

import numpy as np
import pytest

from pandas.compat import long, lrange

import pandas as pd
from pandas import (
    CategoricalIndex, DataFrame, Index, MultiIndex, Series, Timestamp,
    compat, date_range)
from pandas.core.groupby.grouper import Grouping
import pandas.util.testing as tm
from pandas.util.testing import (
    assert_almost_equal, assert_frame_equal, assert_panel_equal,
    assert_series_equal)

# selection
# --------------------------------


class TestSelection(object):

    def test_select_bad_cols(self):
        df = DataFrame([[1, 2]], columns=['A', 'B'])
        g = df.groupby('A')
        with pytest.raises(KeyError, match='"Columns not found: \'C\'"'):
            g[['C']]

        with pytest.raises(KeyError, match='^[^A]+$'):
            # A should not be referenced as a bad column...
            # will have to rethink regex if you change message!
            g[['A', 'C']]

    def test_groupby_duplicated_column_errormsg(self):
        # GH7511
        df = DataFrame(columns=['A', 'B', 'A', 'C'],
                       data=[range(4), range(2, 6), range(0, 8, 2)])

        msg = "Grouper for 'A' not 1-dimensional"
        with pytest.raises(ValueError, match=msg):
            df.groupby('A')
        with pytest.raises(ValueError, match=msg):
            df.groupby(['A', 'B'])

        grouped = df.groupby('B')
        c = grouped.count()
        assert c.columns.nlevels == 1
        assert c.columns.size == 3

    def test_column_select_via_attr(self, df):
        result = df.groupby('A').C.sum()
        expected = df.groupby('A')['C'].sum()
        assert_series_equal(result, expected)

        df['mean'] = 1.5
        result = df.groupby('A').mean()
        expected = df.groupby('A').agg(np.mean)
        assert_frame_equal(result, expected)

    def test_getitem_list_of_columns(self):
        df = DataFrame(
            {'A': ['foo', 'bar', 'foo', 'bar', 'foo', 'bar', 'foo', 'foo'],
             'B': ['one', 'one', 'two', 'three', 'two', 'two', 'one',
                   'three'],
             'C': np.random.randn(8),
             'D': np.random.randn(8),
             'E': np.random.randn(8)})

        result = df.groupby('A')[['C', 'D']].mean()
        result2 = df.groupby('A')['C', 'D'].mean()
        result3 = df.groupby('A')[df.columns[2:4]].mean()

        expected = df.loc[:, ['A', 'C', 'D']].groupby('A').mean()

        assert_frame_equal(result, expected)
        assert_frame_equal(result2, expected)
        assert_frame_equal(result3, expected)

    def test_getitem_numeric_column_names(self):
        # GH #13731
        df = DataFrame({0: list('abcd') * 2,
                        2: np.random.randn(8),
                        4: np.random.randn(8),
                        6: np.random.randn(8)})
        result = df.groupby(0)[df.columns[1:3]].mean()
        result2 = df.groupby(0)[2, 4].mean()
        result3 = df.groupby(0)[[2, 4]].mean()

        expected = df.loc[:, [0, 2, 4]].groupby(0).mean()

        assert_frame_equal(result, expected)
        assert_frame_equal(result2, expected)
        assert_frame_equal(result3, expected)


# grouping
# --------------------------------

class TestGrouping():

    def test_grouper_index_types(self):
        # related GH5375
        # groupby misbehaving when using a Floatlike index
        df = DataFrame(np.arange(10).reshape(5, 2), columns=list('AB'))
        for index in [tm.makeFloatIndex, tm.makeStringIndex,
                      tm.makeUnicodeIndex, tm.makeIntIndex, tm.makeDateIndex,
                      tm.makePeriodIndex]:

            df.index = index(len(df))
            df.groupby(list('abcde')).apply(lambda x: x)

            df.index = list(reversed(df.index.tolist()))
            df.groupby(list('abcde')).apply(lambda x: x)

    def test_grouper_multilevel_freq(self):

        # GH 7885
        # with level and freq specified in a pd.Grouper
        from datetime import date, timedelta
        d0 = date.today() - timedelta(days=14)
        dates = date_range(d0, date.today())
        date_index = pd.MultiIndex.from_product(
            [dates, dates], names=['foo', 'bar'])
        df = pd.DataFrame(np.random.randint(0, 100, 225), index=date_index)

        # Check string level
        expected = df.reset_index().groupby([pd.Grouper(
            key='foo', freq='W'), pd.Grouper(key='bar', freq='W')]).sum()
        # reset index changes columns dtype to object
        expected.columns = pd.Index([0], dtype='int64')

        result = df.groupby([pd.Grouper(level='foo', freq='W'), pd.Grouper(
            level='bar', freq='W')]).sum()
        assert_frame_equal(result, expected)

        # Check integer level
        result = df.groupby([pd.Grouper(level=0, freq='W'), pd.Grouper(
            level=1, freq='W')]).sum()
        assert_frame_equal(result, expected)

    def test_grouper_creation_bug(self):

        # GH 8795
        df = DataFrame({'A': [0, 0, 1, 1, 2, 2], 'B': [1, 2, 3, 4, 5, 6]})
        g = df.groupby('A')
        expected = g.sum()

        g = df.groupby(pd.Grouper(key='A'))
        result = g.sum()
        assert_frame_equal(result, expected)

        result = g.apply(lambda x: x.sum())
        assert_frame_equal(result, expected)

        g = df.groupby(pd.Grouper(key='A', axis=0))
        result = g.sum()
        assert_frame_equal(result, expected)

        # GH14334
        # pd.Grouper(key=...) may be passed in a list
        df = DataFrame({'A': [0, 0, 0, 1, 1, 1],
                        'B': [1, 1, 2, 2, 3, 3],
                        'C': [1, 2, 3, 4, 5, 6]})
        # Group by single column
        expected = df.groupby('A').sum()
        g = df.groupby([pd.Grouper(key='A')])
        result = g.sum()
        assert_frame_equal(result, expected)

        # Group by two columns
        # using a combination of strings and Grouper objects
        expected = df.groupby(['A', 'B']).sum()

        # Group with two Grouper objects
        g = df.groupby([pd.Grouper(key='A'), pd.Grouper(key='B')])
        result = g.sum()
        assert_frame_equal(result, expected)

        # Group with a string and a Grouper object
        g = df.groupby(['A', pd.Grouper(key='B')])
        result = g.sum()
        assert_frame_equal(result, expected)

        # Group with a Grouper object and a string
        g = df.groupby([pd.Grouper(key='A'), 'B'])
        result = g.sum()
        assert_frame_equal(result, expected)

        # GH8866
        s = Series(np.arange(8, dtype='int64'),
                   index=pd.MultiIndex.from_product(
                       [list('ab'), range(2),
                        date_range('20130101', periods=2)],
                       names=['one', 'two', 'three']))
        result = s.groupby(pd.Grouper(level='three', freq='M')).sum()
        expected = Series([28], index=Index(
            [Timestamp('2013-01-31')], freq='M', name='three'))
        assert_series_equal(result, expected)

        # just specifying a level breaks
        result = s.groupby(pd.Grouper(level='one')).sum()
        expected = s.groupby(level='one').sum()
        assert_series_equal(result, expected)

    def test_grouper_column_and_index(self):
        # GH 14327

        # Grouping a multi-index frame by a column and an index level should
        # be equivalent to resetting the index and grouping by two columns
        idx = pd.MultiIndex.from_tuples([('a', 1), ('a', 2), ('a', 3),
                                         ('b', 1), ('b', 2), ('b', 3)])
        idx.names = ['outer', 'inner']
        df_multi = pd.DataFrame({"A": np.arange(6),
                                 'B': ['one', 'one', 'two',
                                       'two', 'one', 'one']},
                                index=idx)
        result = df_multi.groupby(['B', pd.Grouper(level='inner')]).mean()
        expected = df_multi.reset_index().groupby(['B', 'inner']).mean()
        assert_frame_equal(result, expected)

        # Test the reverse grouping order
        result = df_multi.groupby([pd.Grouper(level='inner'), 'B']).mean()
        expected = df_multi.reset_index().groupby(['inner', 'B']).mean()
        assert_frame_equal(result, expected)

        # Grouping a single-index frame by a column and the index should
        # be equivalent to resetting the index and grouping by two columns
        df_single = df_multi.reset_index('outer')
        result = df_single.groupby(['B', pd.Grouper(level='inner')]).mean()
        expected = df_single.reset_index().groupby(['B', 'inner']).mean()
        assert_frame_equal(result, expected)

        # Test the reverse grouping order
        result = df_single.groupby([pd.Grouper(level='inner'), 'B']).mean()
        expected = df_single.reset_index().groupby(['inner', 'B']).mean()
        assert_frame_equal(result, expected)

    def test_groupby_levels_and_columns(self):
        # GH9344, GH9049
        idx_names = ['x', 'y']
        idx = pd.MultiIndex.from_tuples(
            [(1, 1), (1, 2), (3, 4), (5, 6)], names=idx_names)
        df = pd.DataFrame(np.arange(12).reshape(-1, 3), index=idx)

        by_levels = df.groupby(level=idx_names).mean()
        # reset_index changes columns dtype to object
        by_columns = df.reset_index().groupby(idx_names).mean()

        tm.assert_frame_equal(by_levels, by_columns, check_column_type=False)

        by_columns.columns = pd.Index(by_columns.columns, dtype=np.int64)
        tm.assert_frame_equal(by_levels, by_columns)

    def test_groupby_categorical_index_and_columns(self, observed):
        # GH18432
        columns = ['A', 'B', 'A', 'B']
        categories = ['B', 'A']
        data = np.ones((5, 4), int)
        cat_columns = CategoricalIndex(columns,
                                       categories=categories,
                                       ordered=True)
        df = DataFrame(data=data, columns=cat_columns)
        result = df.groupby(axis=1, level=0, observed=observed).sum()
        expected_data = 2 * np.ones((5, 2), int)

        if observed:
            # if we are not-observed we undergo a reindex
            # so need to adjust the output as our expected sets us up
            # to be non-observed
            expected_columns = CategoricalIndex(['A', 'B'],
                                                categories=categories,
                                                ordered=True)
        else:
            expected_columns = CategoricalIndex(categories,
                                                categories=categories,
                                                ordered=True)
        expected = DataFrame(data=expected_data, columns=expected_columns)
        assert_frame_equal(result, expected)

        # test transposed version
        df = DataFrame(data.T, index=cat_columns)
        result = df.groupby(axis=0, level=0, observed=observed).sum()
        expected = DataFrame(data=expected_data.T, index=expected_columns)
        assert_frame_equal(result, expected)

    def test_grouper_getting_correct_binner(self):

        # GH 10063
        # using a non-time-based grouper and a time-based grouper
        # and specifying levels
        df = DataFrame({'A': 1}, index=pd.MultiIndex.from_product(
            [list('ab'), date_range('20130101', periods=80)],
            names=['one', 'two']))
        result = df.groupby([pd.Grouper(level='one'), pd.Grouper(
            level='two', freq='M')]).sum()
        expected = DataFrame({'A': [31, 28, 21, 31, 28, 21]},
                             index=MultiIndex.from_product(
                                 [list('ab'),
                                  date_range('20130101', freq='M',
                                             periods=3)],
                                 names=['one', 'two']))
        assert_frame_equal(result, expected)

    def test_grouper_iter(self, df):
        assert sorted(df.groupby('A').grouper) == ['bar', 'foo']

    def test_empty_groups(self, df):
        # see gh-1048
        with pytest.raises(ValueError, match="No group keys passed!"):
            df.groupby([])

    def test_groupby_grouper(self, df):
        grouped = df.groupby('A')

        result = df.groupby(grouped.grouper).mean()
        expected = grouped.mean()
        tm.assert_frame_equal(result, expected)

    def test_groupby_dict_mapping(self):
        # GH #679
        from pandas import Series
        s = Series({'T1': 5})
        result = s.groupby({'T1': 'T2'}).agg(sum)
        expected = s.groupby(['T2']).agg(sum)
        assert_series_equal(result, expected)

        s = Series([1., 2., 3., 4.], index=list('abcd'))
        mapping = {'a': 0, 'b': 0, 'c': 1, 'd': 1}

        result = s.groupby(mapping).mean()
        result2 = s.groupby(mapping).agg(np.mean)
        expected = s.groupby([0, 0, 1, 1]).mean()
        expected2 = s.groupby([0, 0, 1, 1]).mean()
        assert_series_equal(result, expected)
        assert_series_equal(result, result2)
        assert_series_equal(result, expected2)

    def test_groupby_grouper_f_sanity_checked(self):
        dates = date_range('01-Jan-2013', periods=12, freq='MS')
        ts = Series(np.random.randn(12), index=dates)

        # GH3035
        # index.map is used to apply grouper to the index
        # if it fails on the elements, map tries it on the entire index as
        # a sequence. That can yield invalid results that cause trouble
        # down the line.
        # the surprise comes from using key[0:6] rather then str(key)[0:6]
        # when the elements are Timestamp.
        # the result is Index[0:6], very confusing.

        msg = r"Grouper result violates len\(labels\) == len\(data\)"
        with pytest.raises(AssertionError, match=msg):
            ts.groupby(lambda key: key[0:6])

    def test_grouping_error_on_multidim_input(self, df):
        msg = ("Grouper for '<class 'pandas.core.frame.DataFrame'>'"
               " not 1-dimensional")
        with pytest.raises(ValueError, match=msg):
            Grouping(df.index, df[['A', 'A']])

    def test_multiindex_passthru(self):

        # GH 7997
        # regression from 0.14.1
        df = pd.DataFrame([[1, 2, 3], [4, 5, 6], [7, 8, 9]])
        df.columns = pd.MultiIndex.from_tuples([(0, 1), (1, 1), (2, 1)])

        result = df.groupby(axis=1, level=[0, 1]).first()
        assert_frame_equal(result, df)

    def test_multiindex_negative_level(self, mframe):
        # GH 13901
        result = mframe.groupby(level=-1).sum()
        expected = mframe.groupby(level='second').sum()
        assert_frame_equal(result, expected)

        result = mframe.groupby(level=-2).sum()
        expected = mframe.groupby(level='first').sum()
        assert_frame_equal(result, expected)

        result = mframe.groupby(level=[-2, -1]).sum()
        expected = mframe
        assert_frame_equal(result, expected)

        result = mframe.groupby(level=[-1, 'first']).sum()
        expected = mframe.groupby(level=['second', 'first']).sum()
        assert_frame_equal(result, expected)

    def test_multifunc_select_col_integer_cols(self, df):
        df.columns = np.arange(len(df.columns))

        # it works!
        df.groupby(1, as_index=False)[2].agg({'Q': np.mean})

    def test_multiindex_columns_empty_level(self):
        lst = [['count', 'values'], ['to filter', '']]
        midx = MultiIndex.from_tuples(lst)

        df = DataFrame([[long(1), 'A']], columns=midx)

        grouped = df.groupby('to filter').groups
        assert grouped['A'] == [0]

        grouped = df.groupby([('to filter', '')]).groups
        assert grouped['A'] == [0]

        df = DataFrame([[long(1), 'A'], [long(2), 'B']], columns=midx)

        expected = df.groupby('to filter').groups
        result = df.groupby([('to filter', '')]).groups
        assert result == expected

        df = DataFrame([[long(1), 'A'], [long(2), 'A']], columns=midx)

        expected = df.groupby('to filter').groups
        result = df.groupby([('to filter', '')]).groups
        tm.assert_dict_equal(result, expected)

    def test_groupby_multiindex_tuple(self):
        # GH 17979
        df = pd.DataFrame([[1, 2, 3, 4], [3, 4, 5, 6], [1, 4, 2, 3]],
                          columns=pd.MultiIndex.from_arrays(
                              [['a', 'b', 'b', 'c'],
                               [1, 1, 2, 2]]))
        expected = df.groupby([('b', 1)]).groups
        result = df.groupby(('b', 1)).groups
        tm.assert_dict_equal(expected, result)

        df2 = pd.DataFrame(df.values,
                           columns=pd.MultiIndex.from_arrays(
                               [['a', 'b', 'b', 'c'],
                                ['d', 'd', 'e', 'e']]))
        expected = df2.groupby([('b', 'd')]).groups
        result = df.groupby(('b', 1)).groups
        tm.assert_dict_equal(expected, result)

        df3 = pd.DataFrame(df.values,
                           columns=[('a', 'd'), ('b', 'd'), ('b', 'e'), 'c'])
        expected = df3.groupby([('b', 'd')]).groups
        result = df.groupby(('b', 1)).groups
        tm.assert_dict_equal(expected, result)

    @pytest.mark.parametrize('sort', [True, False])
    def test_groupby_level(self, sort, mframe, df):
        # GH 17537
        frame = mframe
        deleveled = frame.reset_index()

        result0 = frame.groupby(level=0, sort=sort).sum()
        result1 = frame.groupby(level=1, sort=sort).sum()

        expected0 = frame.groupby(deleveled['first'].values, sort=sort).sum()
        expected1 = frame.groupby(deleveled['second'].values, sort=sort).sum()
        expected0.index.name = 'first'
        expected1.index.name = 'second'

        assert result0.index.name == 'first'
        assert result1.index.name == 'second'

        assert_frame_equal(result0, expected0)
        assert_frame_equal(result1, expected1)
        assert result0.index.name == frame.index.names[0]
        assert result1.index.name == frame.index.names[1]

        # groupby level name
        result0 = frame.groupby(level='first', sort=sort).sum()
        result1 = frame.groupby(level='second', sort=sort).sum()
        assert_frame_equal(result0, expected0)
        assert_frame_equal(result1, expected1)

        # axis=1
        result0 = frame.T.groupby(level=0, axis=1, sort=sort).sum()
        result1 = frame.T.groupby(level=1, axis=1, sort=sort).sum()
        assert_frame_equal(result0, expected0.T)
        assert_frame_equal(result1, expected1.T)

        # raise exception for non-MultiIndex
        msg = "level > 0 or level < -1 only valid with MultiIndex"
        with pytest.raises(ValueError, match=msg):
            df.groupby(level=1)

    def test_groupby_level_index_names(self):
        # GH4014 this used to raise ValueError since 'exp'>1 (in py2)
        df = DataFrame({'exp': ['A'] * 3 + ['B'] * 3,
                        'var1': lrange(6), }).set_index('exp')
        df.groupby(level='exp')
        msg = "level name foo is not the name of the index"
        with pytest.raises(ValueError, match=msg):
            df.groupby(level='foo')

    @pytest.mark.parametrize('sort', [True, False])
    def test_groupby_level_with_nas(self, sort):
        # GH 17537
        index = MultiIndex(levels=[[1, 0], [0, 1, 2, 3]],
                           codes=[[1, 1, 1, 1, 0, 0, 0, 0],
                                  [0, 1, 2, 3, 0, 1, 2, 3]])

        # factorizing doesn't confuse things
        s = Series(np.arange(8.), index=index)
        result = s.groupby(level=0, sort=sort).sum()
        expected = Series([6., 22.], index=[0, 1])
        assert_series_equal(result, expected)

        index = MultiIndex(levels=[[1, 0], [0, 1, 2, 3]],
                           codes=[[1, 1, 1, 1, -1, 0, 0, 0],
                                  [0, 1, 2, 3, 0, 1, 2, 3]])

        # factorizing doesn't confuse things
        s = Series(np.arange(8.), index=index)
        result = s.groupby(level=0, sort=sort).sum()
        expected = Series([6., 18.], index=[0.0, 1.0])
        assert_series_equal(result, expected)

    def test_groupby_args(self, mframe):
        # PR8618 and issue 8015
        frame = mframe

        msg = "You have to supply one of 'by' and 'level'"
        with pytest.raises(TypeError, match=msg):
            frame.groupby()

        msg = "You have to supply one of 'by' and 'level'"
        with pytest.raises(TypeError, match=msg):
            frame.groupby(by=None, level=None)

    @pytest.mark.parametrize('sort,labels', [
        [True, [2, 2, 2, 0, 0, 1, 1, 3, 3, 3]],
        [False, [0, 0, 0, 1, 1, 2, 2, 3, 3, 3]]
    ])
    def test_level_preserve_order(self, sort, labels, mframe):
        # GH 17537
        grouped = mframe.groupby(level=0, sort=sort)
        exp_labels = np.array(labels, np.intp)
        assert_almost_equal(grouped.grouper.labels[0], exp_labels)

    def test_grouping_labels(self, mframe):
        grouped = mframe.groupby(mframe.index.get_level_values(0))
        exp_labels = np.array([2, 2, 2, 0, 0, 1, 1, 3, 3, 3], dtype=np.intp)
        assert_almost_equal(grouped.grouper.labels[0], exp_labels)

    def test_list_grouper_with_nat(self):
        # GH 14715
        df = pd.DataFrame({'date': pd.date_range('1/1/2011',
                                                 periods=365, freq='D')})
        df.iloc[-1] = pd.NaT
        grouper = pd.Grouper(key='date', freq='AS')

        # Grouper in a list grouping
        result = df.groupby([grouper])
        expected = {pd.Timestamp('2011-01-01'): pd.Index(list(range(364)))}
        tm.assert_dict_equal(result.groups, expected)

        # Test case without a list
        result = df.groupby(grouper)
        expected = {pd.Timestamp('2011-01-01'): 365}
        tm.assert_dict_equal(result.groups, expected)


# get_group
# --------------------------------

class TestGetGroup():

    @pytest.mark.filterwarnings("ignore:\\nPanel:FutureWarning")
    def test_get_group(self):
        wp = tm.makePanel()
        grouped = wp.groupby(lambda x: x.month, axis='major')

        gp = grouped.get_group(1)
        expected = wp.reindex(
            major=[x for x in wp.major_axis if x.month == 1])
        assert_panel_equal(gp, expected)

        # GH 5267
        # be datelike friendly
        df = DataFrame({'DATE': pd.to_datetime(
            ['10-Oct-2013', '10-Oct-2013', '10-Oct-2013', '11-Oct-2013',
             '11-Oct-2013', '11-Oct-2013']),
            'label': ['foo', 'foo', 'bar', 'foo', 'foo', 'bar'],
            'VAL': [1, 2, 3, 4, 5, 6]})

        g = df.groupby('DATE')
        key = list(g.groups)[0]
        result1 = g.get_group(key)
        result2 = g.get_group(Timestamp(key).to_pydatetime())
        result3 = g.get_group(str(Timestamp(key)))
        assert_frame_equal(result1, result2)
        assert_frame_equal(result1, result3)

        g = df.groupby(['DATE', 'label'])

        key = list(g.groups)[0]
        result1 = g.get_group(key)
        result2 = g.get_group((Timestamp(key[0]).to_pydatetime(), key[1]))
        result3 = g.get_group((str(Timestamp(key[0])), key[1]))
        assert_frame_equal(result1, result2)
        assert_frame_equal(result1, result3)

        # must pass a same-length tuple with multiple keys
        msg = "must supply a tuple to get_group with multiple grouping keys"
        with pytest.raises(ValueError, match=msg):
            g.get_group('foo')
        with pytest.raises(ValueError, match=msg):
            g.get_group(('foo'))
        msg = ("must supply a same-length tuple to get_group with multiple"
               " grouping keys")
        with pytest.raises(ValueError, match=msg):
            g.get_group(('foo', 'bar', 'baz'))

    def test_get_group_empty_bins(self, observed):

        d = pd.DataFrame([3, 1, 7, 6])
        bins = [0, 5, 10, 15]
        g = d.groupby(pd.cut(d[0], bins), observed=observed)

        # TODO: should prob allow a str of Interval work as well
        # IOW '(0, 5]'
        result = g.get_group(pd.Interval(0, 5))
        expected = DataFrame([3, 1], index=[0, 1])
        assert_frame_equal(result, expected)

        msg = r"Interval\(10, 15, closed='right'\)"
        with pytest.raises(KeyError, match=msg):
            g.get_group(pd.Interval(10, 15))

    def test_get_group_grouped_by_tuple(self):
        # GH 8121
        df = DataFrame([[(1, ), (1, 2), (1, ), (1, 2)]],
                       index=['ids']).T
        gr = df.groupby('ids')
        expected = DataFrame({'ids': [(1, ), (1, )]}, index=[0, 2])
        result = gr.get_group((1, ))
        assert_frame_equal(result, expected)

        dt = pd.to_datetime(['2010-01-01', '2010-01-02', '2010-01-01',
                             '2010-01-02'])
        df = DataFrame({'ids': [(x, ) for x in dt]})
        gr = df.groupby('ids')
        result = gr.get_group(('2010-01-01', ))
        expected = DataFrame({'ids': [(dt[0], ), (dt[0], )]}, index=[0, 2])
        assert_frame_equal(result, expected)

    def test_groupby_with_empty(self):
        index = pd.DatetimeIndex(())
        data = ()
        series = pd.Series(data, index)
        grouper = pd.Grouper(freq='D')
        grouped = series.groupby(grouper)
        assert next(iter(grouped), None) is None

    def test_groupby_with_single_column(self):
        df = pd.DataFrame({'a': list('abssbab')})
        tm.assert_frame_equal(df.groupby('a').get_group('a'), df.iloc[[0, 5]])
        # GH 13530
        exp = pd.DataFrame([], index=pd.Index(['a', 'b', 's'], name='a'))
        tm.assert_frame_equal(df.groupby('a').count(), exp)
        tm.assert_frame_equal(df.groupby('a').sum(), exp)
        tm.assert_frame_equal(df.groupby('a').nth(1), exp)

    def test_gb_key_len_equal_axis_len(self):
        # GH16843
        # test ensures that index and column keys are recognized correctly
        # when number of keys equals axis length of groupby
        df = pd.DataFrame([['foo', 'bar', 'B', 1],
                           ['foo', 'bar', 'B', 2],
                           ['foo', 'baz', 'C', 3]],
                          columns=['first', 'second', 'third', 'one'])
        df = df.set_index(['first', 'second'])
        df = df.groupby(['first', 'second', 'third']).size()
        assert df.loc[('foo', 'bar', 'B')] == 2
        assert df.loc[('foo', 'baz', 'C')] == 1


# groups & iteration
# --------------------------------

class TestIteration():

    def test_groups(self, df):
        grouped = df.groupby(['A'])
        groups = grouped.groups
        assert groups is grouped.groups  # caching works

        for k, v in compat.iteritems(grouped.groups):
            assert (df.loc[v]['A'] == k).all()

        grouped = df.groupby(['A', 'B'])
        groups = grouped.groups
        assert groups is grouped.groups  # caching works

        for k, v in compat.iteritems(grouped.groups):
            assert (df.loc[v]['A'] == k[0]).all()
            assert (df.loc[v]['B'] == k[1]).all()

    def test_grouping_is_iterable(self, tsframe):
        # this code path isn't used anywhere else
        # not sure it's useful
        grouped = tsframe.groupby([lambda x: x.weekday(), lambda x: x.year])

        # test it works
        for g in grouped.grouper.groupings[0]:
            pass

    def test_multi_iter(self):
        s = Series(np.arange(6))
        k1 = np.array(['a', 'a', 'a', 'b', 'b', 'b'])
        k2 = np.array(['1', '2', '1', '2', '1', '2'])

        grouped = s.groupby([k1, k2])

        iterated = list(grouped)
        expected = [('a', '1', s[[0, 2]]), ('a', '2', s[[1]]),
                    ('b', '1', s[[4]]), ('b', '2', s[[3, 5]])]
        for i, ((one, two), three) in enumerate(iterated):
            e1, e2, e3 = expected[i]
            assert e1 == one
            assert e2 == two
            assert_series_equal(three, e3)

    def test_multi_iter_frame(self, three_group):
        k1 = np.array(['b', 'b', 'b', 'a', 'a', 'a'])
        k2 = np.array(['1', '2', '1', '2', '1', '2'])
        df = DataFrame({'v1': np.random.randn(6),
                        'v2': np.random.randn(6),
                        'k1': k1, 'k2': k2},
                       index=['one', 'two', 'three', 'four', 'five', 'six'])

        grouped = df.groupby(['k1', 'k2'])

        # things get sorted!
        iterated = list(grouped)
        idx = df.index
        expected = [('a', '1', df.loc[idx[[4]]]),
                    ('a', '2', df.loc[idx[[3, 5]]]),
                    ('b', '1', df.loc[idx[[0, 2]]]),
                    ('b', '2', df.loc[idx[[1]]])]
        for i, ((one, two), three) in enumerate(iterated):
            e1, e2, e3 = expected[i]
            assert e1 == one
            assert e2 == two
            assert_frame_equal(three, e3)

        # don't iterate through groups with no data
        df['k1'] = np.array(['b', 'b', 'b', 'a', 'a', 'a'])
        df['k2'] = np.array(['1', '1', '1', '2', '2', '2'])
        grouped = df.groupby(['k1', 'k2'])
        groups = {key: gp for key, gp in grouped}
        assert len(groups) == 2

        # axis = 1
        three_levels = three_group.groupby(['A', 'B', 'C']).mean()
        grouped = three_levels.T.groupby(axis=1, level=(1, 2))
        for key, group in grouped:
            pass

    @pytest.mark.filterwarnings("ignore:\\nPanel:FutureWarning")
    def test_multi_iter_panel(self):
        wp = tm.makePanel()
        grouped = wp.groupby([lambda x: x.month, lambda x: x.weekday()],
                             axis=1)

        for (month, wd), group in grouped:
            exp_axis = [x for x in wp.major_axis
                        if x.month == month and x.weekday() == wd]
            expected = wp.reindex(major=exp_axis)
            assert_panel_equal(group, expected)

    def test_dictify(self, df):
        dict(iter(df.groupby('A')))
        dict(iter(df.groupby(['A', 'B'])))
        dict(iter(df['C'].groupby(df['A'])))
        dict(iter(df['C'].groupby([df['A'], df['B']])))
        dict(iter(df.groupby('A')['C']))
        dict(iter(df.groupby(['A', 'B'])['C']))

    def test_groupby_with_small_elem(self):
        # GH 8542
        # length=2
        df = pd.DataFrame({'event': ['start', 'start'],
                           'change': [1234, 5678]},
                          index=pd.DatetimeIndex(['2014-09-10',
                                                  '2013-10-10']))
        grouped = df.groupby([pd.Grouper(freq='M'), 'event'])
        assert len(grouped.groups) == 2
        assert grouped.ngroups == 2
        assert (pd.Timestamp('2014-09-30'), 'start') in grouped.groups
        assert (pd.Timestamp('2013-10-31'), 'start') in grouped.groups

        res = grouped.get_group((pd.Timestamp('2014-09-30'), 'start'))
        tm.assert_frame_equal(res, df.iloc[[0], :])
        res = grouped.get_group((pd.Timestamp('2013-10-31'), 'start'))
        tm.assert_frame_equal(res, df.iloc[[1], :])

        df = pd.DataFrame({'event': ['start', 'start', 'start'],
                           'change': [1234, 5678, 9123]},
                          index=pd.DatetimeIndex(['2014-09-10', '2013-10-10',
                                                  '2014-09-15']))
        grouped = df.groupby([pd.Grouper(freq='M'), 'event'])
        assert len(grouped.groups) == 2
        assert grouped.ngroups == 2
        assert (pd.Timestamp('2014-09-30'), 'start') in grouped.groups
        assert (pd.Timestamp('2013-10-31'), 'start') in grouped.groups

        res = grouped.get_group((pd.Timestamp('2014-09-30'), 'start'))
        tm.assert_frame_equal(res, df.iloc[[0, 2], :])
        res = grouped.get_group((pd.Timestamp('2013-10-31'), 'start'))
        tm.assert_frame_equal(res, df.iloc[[1], :])

        # length=3
        df = pd.DataFrame({'event': ['start', 'start', 'start'],
                           'change': [1234, 5678, 9123]},
                          index=pd.DatetimeIndex(['2014-09-10', '2013-10-10',
                                                  '2014-08-05']))
        grouped = df.groupby([pd.Grouper(freq='M'), 'event'])
        assert len(grouped.groups) == 3
        assert grouped.ngroups == 3
        assert (pd.Timestamp('2014-09-30'), 'start') in grouped.groups
        assert (pd.Timestamp('2013-10-31'), 'start') in grouped.groups
        assert (pd.Timestamp('2014-08-31'), 'start') in grouped.groups

        res = grouped.get_group((pd.Timestamp('2014-09-30'), 'start'))
        tm.assert_frame_equal(res, df.iloc[[0], :])
        res = grouped.get_group((pd.Timestamp('2013-10-31'), 'start'))
        tm.assert_frame_equal(res, df.iloc[[1], :])
        res = grouped.get_group((pd.Timestamp('2014-08-31'), 'start'))
        tm.assert_frame_equal(res, df.iloc[[2], :])

    def test_grouping_string_repr(self):
        # GH 13394
        mi = MultiIndex.from_arrays([list("AAB"), list("aba")])
        df = DataFrame([[1, 2, 3]], columns=mi)
        gr = df.groupby(df[('A', 'a')])

        result = gr.grouper.groupings[0].__repr__()
        expected = "Grouping(('A', 'a'))"
        assert result == expected