from copy import deepcopy
from typing import List, Optional
from collections import deque

import numpy as np

from sklearn.preprocessing import normalize

from skmultiflow.core import BaseSKMObject, ClassifierMixin, MetaEstimatorMixin, clone
from skmultiflow.drift_detection.base_drift_detector import BaseDriftDetector
from skmultiflow.trees import HoeffdingTreeClassifier
from skmultiflow.drift_detection import ADWIN
from skmultiflow.utils import check_random_state, get_dimensions
from skmultiflow.metrics import ClassificationPerformanceEvaluator


class StreamingRandomPatchesClassifier(BaseSKMObject, ClassifierMixin, MetaEstimatorMixin):
    """ Streaming Random Patches ensemble classifier.

    Parameters
    ----------
    base_estimator: BaseSKMObject or sklearn.base.BaseEstimator, \
        (default=HoeffdingTreeClassifier)
        The base estimator.

    n_estimators: int, (default=100)
        Number of members in the ensemble.

    subspace_mode: str, (default='percentage')
        | Indicates how ``m``, defined by subspace_size, is interpreted.
          ``M``  represents the total number of features.
        | Only applies when training method is random subspaces or
          random patches.
        | 'm' - Specified value
        | 'sqrtM1' - ``sqrt(M)+1``
        | 'MsqrtM1' - ``M-(sqrt(M)+1)``
        | 'percentage' - Percentage

    subspace_size: int, (default=60)
        Number of features per subset for each classifier.
        A negative value is interpreted relative to the total number of
        features ``M``: ``M + subspace_size`` features are used (or
        ``100 + subspace_size`` percent in 'percentage' mode).

    training_method: str, (default='randompatches')
        | The training method to use.
        | 'randomsubspaces' - Random subspaces
        | 'resampling' - Resampling (bagging)
        | 'randompatches' - Random patches

    lam: float, (default=6.0)
        Lambda value of the Poisson distribution used to simulate
        online bagging (resampling).

    drift_detection_method: BaseDriftDetector, (default=ADWIN(delta=1e-5))
        Drift detection method.

    warning_detection_method: BaseDriftDetector, (default=ADWIN(delta=1e-4))
        Warning detection method.

    disable_weighted_vote: bool (default=False)
        If True, disables weighted voting.

    disable_drift_detection: bool (default=False)
        If True, disables drift detection and background learner.

    disable_background_learner: bool (default=False)
        If True, disables the background learner; ensemble members are
        reset immediately when drift is detected.

    nominal_attributes: list, optional
        List of nominal attributes (feature indexes). If empty or None,
        all attributes are assumed to be numerical.

    random_state: int, RandomState instance or None, optional (default=None)
       If int, random_state is the seed used by the random number generator;
       If RandomState instance, random_state is the random number generator;
       If None, the random number generator is the RandomState instance used
       by `np.random`.

    Notes
    -----
    The Streaming Random Patches (SRP) [1]_ ensemble method simulates bagging
    or random subspaces. The default algorithm uses both bagging and random
    subspaces, namely Random Patches. The default base estimator is a
    Hoeffding Tree, but any other base estimator can be used (unlike random
    forest variations, which are bound to a specific tree learner). Pure
    online bagging corresponds to ``training_method='resampling'`` and pure
    random subspaces to ``training_method='randomsubspaces'``.

    References
    ----------
    .. [1] Heitor Murilo Gomes, Jesse Read, Albert Bifet.
       Streaming Random Patches for Evolving Data Stream Classification.
       IEEE International Conference on Data Mining (ICDM), 2019.

    Examples
    --------
    >>> from skmultiflow.data import AGRAWALGenerator
    >>> from skmultiflow.meta import StreamingRandomPatchesClassifier
    >>>
    >>> stream = AGRAWALGenerator(random_state=1)
    >>> srp = StreamingRandomPatchesClassifier(random_state=1,
    >>>                                              n_estimators=3)
    >>>
    >>> # Variables to control loop and track performance
    >>> n_samples = 0
    >>> correct_cnt = 0
    >>> max_samples = 200
    >>>
    >>> # Run test-then-train loop for max_samples
    >>> # or while there is data in the stream
    >>> while n_samples < max_samples and stream.has_more_samples():
    >>>     X, y = stream.next_sample()
    >>>     y_pred = srp.predict(X)
    >>>     if y[0] == y_pred[0]:
    >>>         correct_cnt += 1
    >>>     srp.partial_fit(X, y)
    >>>     n_samples += 1
    >>>
    >>> print('{} samples analyzed.'.format(n_samples))
    >>> print('Accuracy: {}'.format(correct_cnt / n_samples))

    """

    _TRAIN_RANDOM_SUBSPACES = "randomsubspaces"
    _TRAIN_RESAMPLING = "resampling"
    _TRAIN_RANDOM_PATCHES = "randompatches"

    _FEATURES_M = 'm'
    _FEATURES_SQRT = "sqrtM1"
    _FEATURES_SQRT_INV = "MsqrtM1"
    _FEATURES_PERCENT = "percentage"

    def __init__(self, base_estimator=HoeffdingTreeClassifier(grace_period=50,
                                                              split_confidence=0.01),
                 n_estimators: int = 100,
                 subspace_mode: str = "percentage",
                 subspace_size: int = 60,
                 training_method: str = "randompatches",
                 lam: float = 6.0,
                 drift_detection_method: BaseDriftDetector = ADWIN(delta=1e-5),
                 warning_detection_method: BaseDriftDetector = ADWIN(delta=1e-4),
                 disable_weighted_vote: bool = False,
                 disable_drift_detection: bool = False,
                 disable_background_learner: bool = False,
                 nominal_attributes=None,
                 random_state=None):

        self.base_estimator = base_estimator   # Not restricted to a specific base estimator.
        self.n_estimators = n_estimators
        if subspace_mode not in {self._FEATURES_SQRT, self._FEATURES_SQRT_INV,
                                 self._FEATURES_PERCENT, self._FEATURES_M}:
            raise ValueError("Invalid subspace_mode: {}.\n"
                             "Valid options are: {}".format(subspace_mode,
                                                            {self._FEATURES_M, self._FEATURES_SQRT,
                                                             self._FEATURES_SQRT_INV,
                                                             self._FEATURES_PERCENT}))
        self.subspace_mode = subspace_mode
        self.subspace_size = subspace_size
        if training_method not in {self._TRAIN_RESAMPLING, self._TRAIN_RANDOM_PATCHES,
                                   self._TRAIN_RANDOM_SUBSPACES}:
            raise ValueError("Invalid training_method: {}.\n"
                             "Valid options are: {}".format(training_method,
                                                            {self._TRAIN_RANDOM_PATCHES,
                                                             self._TRAIN_RANDOM_SUBSPACES,
                                                             self._TRAIN_RESAMPLING}))
        self.training_method = training_method
        self.lam = lam
        self.drift_detection_method = drift_detection_method
        self.warning_detection_method = warning_detection_method
        self.disable_weighted_vote = disable_weighted_vote
        self.disable_drift_detection = disable_drift_detection
        self.disable_background_learner = disable_background_learner
        # Single option (accuracy) for drift detection criteria. Could be extended in the future.
        self.drift_detection_criteria = 'accuracy'
        self.nominal_attributes = nominal_attributes if nominal_attributes else []
        self.random_state = random_state
        # self._random_state is the actual object used internally
        self._random_state = check_random_state(self.random_state)
        self.ensemble = None

        self._n_samples_seen = 0
        self._subspaces = None

        self._base_performance_evaluator = ClassificationPerformanceEvaluator()
        self._base_learner_class = StreamingRandomPatchesBaseLearner

    def partial_fit(self, X, y, classes=None, sample_weight=None):
        """ Partially (incrementally) fit the model.

        Parameters
        ----------
        X : numpy.ndarray of shape (n_samples, n_features)
            The features to train the model.

        y: numpy.ndarray of shape (n_samples)
            An array-like with the class labels of all samples in X.

        classes: numpy.ndarray, optional (default=None)
            Array with all possible/known class labels. Forwarded to the
            base estimators.

        sample_weight: numpy.ndarray of shape (n_samples), optional \
            (default=None)
            Sample weights. If not provided, uniform weights are assumed.
            Usage varies depending on the learning method.

        Returns
        -------
        self

        """
        n_rows, n_cols = get_dimensions(X)

        if sample_weight is None:
            sample_weight = np.ones(n_rows)

        for i in range(n_rows):
            self._partial_fit(np.asarray([X[i]]), np.asarray([y[i]]),
                              classes=classes, sample_weight=np.asarray([sample_weight[i]]))

        return self

    def _partial_fit(self, X, y, classes=None, sample_weight=None):
        self._n_samples_seen += 1
        _, n_features = get_dimensions(X)

        if not self.ensemble:
            self._init_ensemble(n_features)

        for i in range(len(self.ensemble)):
            # Get prediction for instance
            y_pred = np.asarray([np.argmax(self.ensemble[i].predict_proba(X))])

            # Update performance evaluator
            self.ensemble[i].performance_evaluator.add_result(y[0], y_pred[0], sample_weight[0])

            # Train using random subspaces without resampling,
            # i.e. all instances are used for training.
            if self.training_method == self._TRAIN_RANDOM_SUBSPACES:
                self.ensemble[i].partial_fit(X=X, y=y, classes=classes,
                                             sample_weight=np.asarray([1.]),
                                             n_samples_seen=self._n_samples_seen,
                                             random_state=self._random_state)
            # Train using random patches or resampling,
            # thus we simulate online bagging with Poisson(lambda=...)
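            # With the default lam=6.0, Poisson(6) equals zero with probability
            # exp(-6) (about 0.25%), so nearly every member trains on nearly
            # every instance, typically with a weight around lam.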
            else:
                k = self._random_state.poisson(lam=self.lam)
                if k > 0:
                    self.ensemble[i].partial_fit(X=X, y=y, classes=classes,
                                                 sample_weight=np.asarray([k]),
                                                 n_samples_seen=self._n_samples_seen,
                                                 random_state=self._random_state)

    def predict(self, X):
        """ Predict classes for the passed data.

        Parameters
        ----------
        X : numpy.ndarray of shape (n_samples, n_features)
            The set of data samples to predict the class labels for.

        Returns
        -------
        A numpy.ndarray with all the predictions for the samples in X.

        """
        n_samples, n_features = get_dimensions(X)

        if self.ensemble is None:
            self._init_ensemble(n_features=n_features)
            return np.zeros(n_samples)

        y_proba = self.predict_proba(X)
        y_pred = np.argmax(y_proba, axis=1)
        return y_pred

    def predict_proba(self, X):
        """ Estimate the probability of X belonging to each class-labels.

        Parameters
        ----------
        X : numpy.ndarray of shape (n_samples, n_features)
            Samples one wants to predict the class probabilities for.

        Returns
        -------
        A numpy.ndarray of shape (n_samples, n_classes), where entry [i, j]
        is the estimated probability that the i-th sample of X belongs to
        the j-th class.

        """
        n_samples, n_features = get_dimensions(X)
        y_proba = []

        if self.ensemble is None:
            self._init_ensemble(n_features=n_features)
            return np.zeros(n_samples)

        for i in range(n_samples):
            y_proba.append(self._predict_proba(np.asarray([X[i]])))
        return np.asarray(y_proba)

    def _predict_proba(self, X):
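        # Weighted soft voting: each member's probability vector is
        # L1-normalized, scaled by the member's current accuracy (unless
        # weighted voting is disabled), and summed across the ensemble.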
        y_proba = np.asarray([0.])

        for i in range(len(self.ensemble)):
            y_proba_temp = self.ensemble[i].predict_proba(X)
            if np.sum(y_proba_temp) > 0.0:
                y_proba_temp = normalize(y_proba_temp, norm='l1')[0].copy()
                acc = self.ensemble[i].performance_evaluator.accuracy_score()
                if not self.disable_weighted_vote and acc > 0.0:
                    y_proba_temp *= acc
                # Check array length consistency
                if len(y_proba_temp) != len(y_proba):
                    if len(y_proba_temp) > len(y_proba):
                        y_proba.resize((len(y_proba_temp), ), refcheck=False)
                    else:
                        y_proba_temp.resize((len(y_proba), ), refcheck=False)
                # Add values
                y_proba += y_proba_temp
        return y_proba

    def _init_ensemble(self, n_features: int):
        # Select the size of k, which depends on 2 parameters:
        # subspace_size and subspace_mode
        k = self.subspace_size

        if self.training_method != self._TRAIN_RESAMPLING:
            # This only applies to subspaces and random patches options
            if self.subspace_mode == self._FEATURES_SQRT:
                k = int(np.round(np.sqrt(n_features)) + 1)
            elif self.subspace_mode == self._FEATURES_SQRT_INV:
                k = n_features - int(np.round(np.sqrt(n_features)) + 1)
            elif self.subspace_mode == self._FEATURES_PERCENT:
                percent = (100. + k) / 100. if k < 0 else k / 100.
                k = int(np.round(n_features * percent))
                if k < 2:
                    k += 1
            # else: do nothing (k = m)
            if k < 0:
                # k is negative: use n_features + k features (i.e., all but |k|)
                k = n_features + k
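            # Worked example (illustration only): with M=10 features and the
            # defaults subspace_mode='percentage', subspace_size=60,
            # k = round(10 * 0.60) = 6; with subspace_mode='m' and
            # subspace_size=-3, k = 10 + (-3) = 7.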

        # Generate subspaces. The subspaces is a 2D matrix of shape
        # (n_estimators, k) where each row contains the k feature indices
        # to be used by each estimator.
        if self.training_method == self._TRAIN_RANDOM_SUBSPACES or \
                self.training_method == self._TRAIN_RANDOM_PATCHES:
            if k != 0 and k < n_features:
                # For low dimensionality it is better to avoid more than
                # 1 classifier with the same subspace, thus we generate all
                # possible combinations of subsets of features and select
                # without replacement.
                # n_features is the total number of features and k is the
                # actual size of the subspaces.
                if n_features <= 20 or k < 2:
                    if k == 1 and n_features > 2:
                        k = 2
                    # Generate all possible combinations of size k
                    self._subspaces = get_all_k_combinations(k, n_features)
                    # Increase the subspaces to match the ensemble size
                    # (if required)
                    i = 0
                    while len(self._subspaces) < self.n_estimators:
                        i = 0 if i == len(self._subspaces) else i
                        self._subspaces = np.vstack((self._subspaces, self._subspaces[i]))
                        i += 1
                # For high dimensionality we can't generate all combinations
                # as it is too expensive (memory). On top of that, the chance
                # of repeating a subspace is lower, so we can just randomly
                # generate subspaces without worrying about repetitions.
                else:
                    self._subspaces = get_random_k_combinations(k, n_features,
                                                                self.n_estimators,
                                                                self._random_state)

            # k == 0 or k > n_features (subspace size is larger than the
            # number of features), then default to re-sampling
            else:
                self.training_method = self._TRAIN_RESAMPLING

        # Reset the base estimator for safety.
        self.base_estimator.reset()

        # Initialize ensemble members
        self._init_ensemble_members()

    def _init_ensemble_members(self):
        # Create empty ensemble:
        base_learner_class = self._base_learner_class
        self.ensemble = []   # type: List[base_learner_class]

        performance_evaluator = self._base_performance_evaluator

        subspace_indexes = np.arange(self.n_estimators)
        if self.training_method == self._TRAIN_RANDOM_PATCHES or \
                self.training_method == self._TRAIN_RANDOM_SUBSPACES:
            # Shuffle indexes that match subspaces with members of the ensemble
            self._random_state.shuffle(subspace_indexes)
        for i in range(self.n_estimators):
            # When self.training_method == self._TRAIN_RESAMPLING
            features_indexes = None
            # Otherwise set feature indexes
            if self.training_method == self._TRAIN_RANDOM_PATCHES or \
                    self.training_method == self._TRAIN_RANDOM_SUBSPACES:
                features_indexes = self._subspaces[subspace_indexes[i]]
            self.ensemble.append(base_learner_class(
                idx_original=i,
                base_estimator=clone(self.base_estimator),
                performance_evaluator=deepcopy(performance_evaluator),
                created_on=self._n_samples_seen,
                disable_background_learner=self.disable_background_learner,
                disable_drift_detector=self.disable_drift_detection,
                drift_detection_method=self.drift_detection_method,
                warning_detection_method=self.warning_detection_method,
                drift_detection_criteria=self.drift_detection_criteria,
                is_background_learner=False,
                feature_indexes=features_indexes,
                nominal_attributes=self.nominal_attributes,
                random_state=self._random_state))

    def reset(self):
        self.ensemble = None
        self._n_samples_seen = 0
        self._random_state = check_random_state(self.random_state)


class StreamingRandomPatchesBaseLearner:
    """
    Class representing the base learner of StreamingRandomPatchesClassifier.
    """
    def __init__(self,
                 idx_original,
                 base_estimator,
                 performance_evaluator,
                 created_on,
                 disable_background_learner,
                 disable_drift_detector,
                 drift_detection_method,
                 warning_detection_method,
                 drift_detection_criteria,
                 is_background_learner,
                 feature_indexes=None,
                 nominal_attributes=None,
                 random_state=None):
        self.idx_original = idx_original
        self.created_on = created_on
        self.base_estimator = base_estimator
        self.performance_evaluator = performance_evaluator

        # Subspace (feature indexes) of the original instances used by this model
        self.feature_indexes = feature_indexes

        # Drift detection
        self.disable_background_learner = disable_background_learner
        self.disable_drift_detector = disable_drift_detector
        self.drift_detection_method = clone(drift_detection_method)   # type: BaseDriftDetector
        self.warning_detection_method = clone(warning_detection_method)   # type: BaseDriftDetector
        self.drift_detection_criteria = drift_detection_criteria

        # Background learner
        self.is_background_learner = is_background_learner

        # Statistics
        self.n_drifts_detected = 0
        self.n_drifts_induced = 0
        self.n_warnings_detected = 0
        self.n_warnings_induced = 0

        # Background learner
        self._background_learner = None   # type: Optional[StreamingRandomPatchesBaseLearner]
        self._background_learner_class = StreamingRandomPatchesBaseLearner

        # Nominal attributes
        self.nominal_attributes = nominal_attributes
        self._set_nominal_attributes = self._can_set_nominal_attributes()

        # Random_state
        self.random_state = random_state
        self._random_state = check_random_state(self.random_state)

    def partial_fit(self, X: np.ndarray, y: np.ndarray, classes: list, sample_weight: np.ndarray,
                    n_samples_seen: int, random_state: np.random):
        n_features_total = get_dimensions(X)[1]
        if self.feature_indexes is not None:
            # Select the subset of features to use
            X_subset = np.asarray([X[0][self.feature_indexes]])
            if self._set_nominal_attributes and hasattr(self.base_estimator, 'nominal_attributes'):
                self.base_estimator.nominal_attributes = \
                    self._remap_nominal_attributes(self.feature_indexes, self.nominal_attributes)
                self._set_nominal_attributes = False
        else:
            # Use all features
            X_subset = X

        self.base_estimator.partial_fit(X=X_subset, y=y,
                                        classes=classes,
                                        sample_weight=sample_weight)
        correctly_classifies = self.base_estimator.predict(X_subset)[0] == y[0]
        if self._background_learner:
            # Note: Pass the original instance X so features are correctly
            # selected at the beginning of partial_fit
            self._background_learner.partial_fit(X=X, y=y,
                                                 classes=classes,
                                                 sample_weight=sample_weight,
                                                 n_samples_seen=n_samples_seen,
                                                 random_state=random_state)

        if not self.disable_drift_detector and not self.is_background_learner:
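            # Warning signals start a background learner trained in parallel
            # on a (possibly new) subspace; a later drift signal promotes it
            # via reset(). If background learners are disabled, drift resets
            # this model in place.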
            # Check for warnings only if the background learner is active
            if not self.disable_background_learner:
                # Update the warning detection method
                self.warning_detection_method.add_element(0 if correctly_classifies else 1)
                # Check if there was a change
                if self.warning_detection_method.detected_change():
                    self.n_warnings_detected += 1
                    self._trigger_warning(n_features=n_features_total,
                                          n_samples_seen=n_samples_seen,
                                          random_state=random_state)

            # ===== Drift detection =====
            # Update the drift detection method
            self.drift_detection_method.add_element(0 if correctly_classifies else 1)
            # Check if there was a change
            if self.drift_detection_method.detected_change():
                self.n_drifts_detected += 1
                # There was a change, reset the model
                self.reset(n_features=n_features_total, n_samples_seen=n_samples_seen,
                           random_state=random_state)

    def predict_proba(self, X):
        if self.feature_indexes is not None:
            # Select the subset of features to use
            X_subset = np.asarray([X[0][self.feature_indexes]])
        else:
            # Use all features
            X_subset = X

        return self.base_estimator.predict_proba(X_subset)

    def _trigger_warning(self, n_features, n_samples_seen: int, random_state: np.random):
        background_base_estimator = clone(self.base_estimator)
        background_base_estimator.reset()

        background_performance_evaluator = deepcopy(self.performance_evaluator)
        background_performance_evaluator.reset()

        feature_indexes = self._reset_subset(n_features=n_features, random_state=random_state)

        self._background_learner = self._background_learner_class(
            idx_original=self.idx_original,
            base_estimator=background_base_estimator,
            performance_evaluator=background_performance_evaluator,
            created_on=n_samples_seen,
            disable_background_learner=self.disable_background_learner,
            disable_drift_detector=self.disable_drift_detector,
            drift_detection_method=self.drift_detection_method,
            warning_detection_method=self.warning_detection_method,
            drift_detection_criteria=self.drift_detection_criteria,
            is_background_learner=True,
            feature_indexes=feature_indexes,
            nominal_attributes=self.nominal_attributes,
            random_state=self._random_state
        )

        # Hard-reset the warning method
        self.warning_detection_method = clone(self.warning_detection_method)

    def _reset_subset(self, n_features: int, random_state: np.random):
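        # Draw a new random feature subset of the same size as the current
        # one; members trained on all features (resampling) keep using all.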
        feature_indexes = None
        if self.feature_indexes is not None:
            k = len(self.feature_indexes)
            feature_indexes = random_state.choice(range(n_features), k, replace=False)
        return feature_indexes

    def reset(self, n_features: int, n_samples_seen: int, random_state: np.random):
        if not self.disable_background_learner and self._background_learner is not None:
            self.base_estimator = self._background_learner.base_estimator
            self.drift_detection_method = self._background_learner.drift_detection_method
            self.warning_detection_method = self._background_learner.warning_detection_method
            self.performance_evaluator = self._background_learner.performance_evaluator
            self.performance_evaluator.reset()
            self.created_on = self._background_learner.created_on
            self.feature_indexes = self._background_learner.feature_indexes
            self._background_learner = None
        else:
            self.base_estimator.reset()
            self.performance_evaluator.reset()
            self.created_on = n_samples_seen
            self.drift_detection_method = clone(self.drift_detection_method)
            self.feature_indexes = self._reset_subset(n_features, random_state)
            self._set_nominal_attributes = self._can_set_nominal_attributes()

    @staticmethod
    def _remap_nominal_attributes(sel_features: np.ndarray,
                                  nominal_attributes: list) -> Optional[list]:
        remapped_idx = []
        for i, idx in enumerate(sel_features):
            if idx in nominal_attributes:
                remapped_idx.append(i)
        return remapped_idx if len(remapped_idx) > 0 else None

    def _can_set_nominal_attributes(self):
        return self.nominal_attributes is not None and len(self.nominal_attributes) > 0


def _get_all_k_combinations_rec(offset: int, k: int, combination: deque, original_size: int,
                                combinations: deque):
    """ Recursive function to generate all k-combinations. """
    if k == 0:
        combinations.append(deepcopy(combination))
        return

    for i in range(offset, original_size - k + 1, 1):
        combination.append(i)
        _get_all_k_combinations_rec(i + 1, k - 1, combination, original_size, combinations)
        combination.pop()


def get_all_k_combinations(k: int, n_items: int) -> np.ndarray:
    """ Generates all k-combinations from n_features

    Parameters
    ----------
    k: int
        Number of items per combination
    n_items: int
        Total number of items

    Returns
    -------
    np.ndarray
        2D array containing all k-combinations
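
    Examples
    --------
    A small illustration (all 2-combinations of 4 items, in the order
    produced by the recursion):

    >>> get_all_k_combinations(2, 4)
    array([[0, 1],
           [0, 2],
           [0, 3],
           [1, 2],
           [1, 3],
           [2, 3]])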

    """
    combinations = deque()
    combination = deque()
    _get_all_k_combinations_rec(0, k, combination, n_items, combinations)
    return np.array(combinations)


def get_random_k_combinations(k: int, n_items: int, n_combinations: int,
                              random_state: np.random) -> np.ndarray:
    """ Gets random k-combinations from n_features

    Parameters
    ----------
    k: int
        Number of items per combination
    n_items: int
        Total number of items
    n_combinations: int
        Number of combinations
    random_state: numpy.random.RandomState
        Random number generator instance used to sample the combinations.

    Returns
    -------
    np.ndarray
        2D array of shape (n_combinations, k) containing the sampled combinations
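
    Examples
    --------
    A small illustration; the exact rows depend on the random state:

    >>> rng = np.random.RandomState(12)
    >>> get_random_k_combinations(3, 10, 2, rng).shape
    (2, 3)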

    """
    return np.array([random_state.choice(range(n_items), k, replace=False)
                     for _ in range(n_combinations)])