Java source code of RPartConverter

jpmml-r-master
- NOTICE.txt
- src
  - main
    - javacc
      - expression.jj
    - java
      - org
        jpmml
        rexp
        LMConverter.java
        EmptyFormulaContext.java
        RVector.java
        RStringVector.java
        OLSConverter.java
        RandomForestConverter.java
        MVRConverter.java
        ModelFrameFormulaContext.java
        XLevelsFormulaContext.java
        SerializationTypes.java
        RangerConverter.java
        ScorecardConverter.java
        NNetConverter.java
        AdaConverter.java
        RPartConverter.java
        GLMConverter.java
        visitors
        RandomForestCompactor.java
        RExpUtil.java
        RClosure.java
        RBooleanVector.java
        EarthConverter.java
        LogNetConverter.java
        SerializationUtil.java
        ModelConverter.java
        Converter.java
        RecipeEncoder.java
        SVMConverter.java
        FormulaUtil.java
        GLMNetConverter.java
        FormulaContext.java
        RPair.java
        LRMConverter.java
        CrossValGLMNetConverter.java
        RDoubleVector.java
        RNumberVector.java
        ConverterFactory.java
        RExp.java
        NNConverter.java
        Main.java
        RFunctionCall.java
        PartyConverter.java
        SExpTypes.java
        WrappedModelConverter.java
        RMSConverter.java
        ElNetConverter.java
        BaggingConverter.java
        TrainConverter.java
        NaiveBayesConverter.java
        RExpParser.java
        PreProcessEncoder.java
        RRaw.java
        FilterModelConverter.java
        XGBoostConverter.java
        AdaBagConverter.java
        RGenericVector.java
        RString.java
        TransformerEncoder.java
        KMeansConverter.java
        RIntegerVector.java
        MultNetConverter.java
        TreeModelConverter.java
        GBMConverter.java
        CaretEnsembleConverter.java
        IForestConverter.java
        BoostingConverter.java
        BinaryTreeConverter.java
        MultinomConverter.java
        RDataInput.java
        RExpEncoder.java
        Formula.java
        DecorationUtil.java
        XDRInput.java
        ElmNNConverter.java
        FunctionExpression.java
        S4Object.java
        RPartEnsembleConverter.java
        FishNetConverter.java
  - test
    - resources
      - csv
        RangerProbIris.csv
        MultNetIris.csv
        AdaAudit.csv
        RandomForestFormulaWineQuality.csv
        LMFormulaWineQuality.csv
        RandomForestWineColor.csv
        AdaFormulaVersicolor.csv
        Iris.csv
        LibSVMIris.csv
        NNetFormulaIris.csv
        PLSRegressionFormulaWineQuality.csv
        XGBoostAuto.csv
        BinaryTreeAudit.csv
        RandomForestFormulaAuto.csv
        BaggingAudit.csv
        IrisNA.csv
        Versicolor.csv
        ElNetWineQuality.csv
        XGBoostIris.csv
        GBMAdaBoostAuditNA.csv
        XGBoostAuditNA.csv
        EvTreeAudit.csv
        BoostingAudit.csv
        GBMBernoulliAuditNA.csv
        RangerAutoNA.csv
        CaretEnsembleVersicolor.csv
        RandomForestCustFormulaAudit.csv
        RandomForestIris.csv
        LibSVMAnomalyFormulaAudit.csv
        NNetFormulaAudit.csv
        RangerProbAudit.csv
        PLSRegressionFormulaAuto.csv
        ElmNNFormulaAuto.csv
        TrainRandomForestAuto.csv
        GBMFormulaIris.csv
        RPartWineQuality.csv
        LMFormulaAuto.csv
        NaiveBayesAudit.csv
        EvTreeWineQuality.csv
        ElmNNFormulaWineQuality.csv
        RangerAudit.csv
        Visit.csv
        RPartIrisNA.csv
        NaiveBayesFormulaAudit.csv
        LibSVMAuto.csv
        IForestIris.csv
        RandomForestCustFormulaIris.csv
        CaretEnsembleAuto.csv
        IForestAuto.csv
        GLMCustFormulaAudit.csv
        GBMIris.csv
        TrainRandomForestFormulaAuto.csv
        ChaidIris.csv
        RandomForestWineQuality.csv
        CrossValLogNetVersicolor.csv
        NNWineQuality.csv
        KMeansIris.csv
        RPartIris.csv
        GBMAutoNA.csv
        LibSVMFormulaIris.csv
        GLMCustFormulaWineQuality.csv
        Audit.csv
        LibSVMAnomalyFormulaIris.csv
        WrappedGLMFormulaAudit.csv
        EvTreeAuto.csv
        ChaidAudit.csv
        TrainRandomForestIris.csv
        NaiveBayesIris.csv
        WrappedGBMAdaBoostAuditNA.csv
        RPartAuditNA.csv
        BinaryTreeAuto.csv
        GLMCustFormulaAuto.csv
        EarthCustFormulaAuto.csv
        LRMFormulaAudit.csv
        FishNetVisit.csv
        LibSVMFormulaAuto.csv
        AdaFormulaAudit.csv
        GLMFormulaWineQuality.csv
        RandomForestAuto.csv
        MultinomIris.csv
        BinaryTreeIris.csv
        TrainGBMFormulaIris.csv
        RandomForestCustFormulaAuto.csv
        CrossValElNetWineQuality.csv
        LibSVMFormulaAudit.csv
        TrainGLMFormulaAudit.csv
        ElNetAuto.csv
        RandomForestAudit.csv
        AuditNA.csv
        TrainRandomForestFormulaAudit.csv
        TrainRandomForestAudit.csv
        OLSRegressionFormulaAuto.csv
        RPartAuto.csv
        TrainGLMFormulaAuto.csv
        GBMFormulaAutoNA.csv
        LMCustFormulaAuto.csv
        EarthFormulaAuto.csv
        MultinomAudit.csv
        RangerIris.csv
        BaggingIris.csv
        Auto.csv
        GLMFormulaAudit.csv
        TrainRPartIris.csv
        TrainRandomForestFormulaIris.csv
        EvTreeIris.csv
        RPartAutoNA.csv
        RPartAudit.csv
        RandomForestFormulaAudit.csv
        AutoNA.csv
        NaiveBayesFormulaIris.csv
        NNetFormulaAuto.csv
        GLMFormulaAuto.csv
        RandomForestFormulaWineColor.csv
        PLSRegressionCustFormulaAuto.csv
        RandomForestFormulaIris.csv
        TrainGBMFormulaAutoNA.csv
        WrappedLMFormulaAuto.csv
        BoostingIris.csv
        RPartWineQualityNA.csv
        GLMFormulaVisit.csv
      - rds
        GBMFormulaAutoNA.rds
        MultNetWineColor.rds
        TrainRandomForestIris.rds
        NaiveBayesFormulaAudit.rds
        LibSVMAnomalyFormulaIris.rds
        LibSVMAuto.rds
        IForestAuto.rds
        RPartAutoNA.rds
        ElNetWineQuality.rds
        RandomForestAudit.rds
        GBMBernoulliAuditNA.rds
        MultinomAudit.rds
        RPartAuditNA.rds
        EvTreeIris.rds
        GLMCustFormulaAuto.rds
        LibSVMFormulaAudit.rds
        TrainRandomForestAuto.rds
        RandomForestFormulaAuto.rds
        RPartIrisNA.rds
        RandomForestFormulaIris.rds
        LogNetWineColor.rds
        BoostingIris.rds
        BinaryTreeIris.rds
        RandomForestAuto.rds
        LMCustFormulaAuto.rds
        GBMIris.rds
        XGBoostAuto.rds
        GBMAutoNA.rds
        LibSVMAnomalyFormulaAudit.rds
        PLSRegressionCustFormulaAuto.rds
        OLSRegressionFormulaAuto.rds
        BaggingIris.rds
        EarthCustFormulaAuto.rds
        LibSVMIris.rds
        RPartWineColor.rds
        LMFormulaAuto.rds
        NNetFormulaIris.rds
        NNetFormulaAudit.rds
        RangerIris.rds
        CrossValLogNetWineColor.rds
        XGBoostIris.rds
        NaiveBayesIris.rds
        RPartAudit.rds
        TrainRandomForestFormulaAuto.rds
        KMeansIris.rds
        EarthFormulaAuto.rds
        ElmNNFormulaAuto.rds
        RPartAuto.rds
        ChaidAudit.rds
        TrainGBMFormulaAutoNA.rds
        ElNetAuto.rds
        EvTreeAuto.rds
        TrainRPartIris.rds
        RandomForestWineColor.rds
        RPartWineColorNA.rds
        RandomForestCustFormulaAuto.rds
        FishNetVisit.rds
        RandomForestFormulaWineColor.rds
        WrappedLMFormulaAuto.rds
        TrainGBMFormulaIris.rds
        RPartIris.rds
        XGBoostAuditNA.rds
        AdaFormulaVersicolor.rds
        IForestIris.rds
        EvTreeAudit.rds
        LibSVMFormulaAuto.rds
        MultinomIris.rds
        GBMFormulaIris.rds
        BinaryTreeAuto.rds
        PLSRegressionFormulaAuto.rds
        GLMFormulaAuto.rds
        RangerProbAudit.rds
        NaiveBayesAudit.rds
        MultNetIris.rds
        RangerAutoNA.rds
        CrossValLogNetVersicolor.rds
        LibSVMFormulaIris.rds
        TrainRandomForestFormulaIris.rds
        RandomForestIris.rds
        NNetFormulaAuto.rds
        ChaidIris.rds
        LRMFormulaAudit.rds
        CrossValElNetWineQuality.rds
        WrappedGBMAdaBoostAuditNA.rds
        RandomForestCustFormulaIris.rds
        NaiveBayesFormulaIris.rds
        RangerProbIris.rds
        GBMAdaBoostAuditNA.rds
        RangerAudit.rds
    - java
      - org
        jpmml
        rexp
        RPartConverterTest.java
        ExpressionTranslatorTest.java
        ConverterTestBatch.java
        CaretEnsembleConverterTest.java
        BoostingConverterTest.java
        KMeansConverterTest.java
        RandomForestConverterTest.java
        FunctionExpressionTest.java
        LMConverterTest.java
        NNetConverterTest.java
        IForestConverterTest.java
        SVMConverterTest.java
        PartyConverterTest.java
        GBMConverterTest.java
        ElmNNConverterTest.java
        CrossValGLMNetConverterTest.java
        NNConverterTest.java
        ConverterTest.java
        XGBoostConverterTest.java
        BaggingConverterTest.java
        ChaidConverterTest.java
        EarthConverterTest.java
        FormulaTest.java
        AdaConverterTest.java
        NaiveBayesConverterTest.java
        GLMConverterTest.java
        RExpUtilTest.java
        MVRConverterTest.java
        GLMNetConverterTest.java
        LRMConverterTest.java
        RangerConverterTest.java
        MultinomConverterTest.java
        BinaryTreeConverterTest.java
        OLSConverterTest.java
        EvTreeConverterTest.java
    - R
      - lm.R
      - caretEnsemble.R
      - naiveBayes.R
      - ranger.R
      - bagging.R
      - mvr.R
      - ols.R
      - data.R
      - lrm.R
      - rpart.R
      - glmnet.R
      - IsolationForest.R
      - nn.R
      - kmeans.R
      - multinom.R
      - glm.R
      - randomForest.R
      - gbm.R
      - xgboost.R
      - chaid.R
      - cv.glmnet.R
      - elmNN.R
      - version.R
      - evtree.R
      - ada.R
      - svm.R
      - util.R
      - nnet.R
      - ctree.R
      - earth.R
      - boosting.R
- pom.xml
- README.md
- LICENSE.txt

/*
 * Copyright (c) 2018 Villu Ruusmann
 *
 * This file is part of JPMML-R
 *
 * JPMML-R is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * JPMML-R is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with JPMML-R.  If not, see <http://www.gnu.org/licenses/>.
 */
package org.jpmml.rexp;

import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;

import org.dmg.pmml.CompoundPredicate;
import org.dmg.pmml.DataType;
import org.dmg.pmml.FieldName;
import org.dmg.pmml.MiningFunction;
import org.dmg.pmml.Predicate;
import org.dmg.pmml.ScoreDistribution;
import org.dmg.pmml.SimplePredicate;
import org.dmg.pmml.True;
import org.dmg.pmml.tree.ClassifierNode;
import org.dmg.pmml.tree.CountingBranchNode;
import org.dmg.pmml.tree.CountingLeafNode;
import org.dmg.pmml.tree.Node;
import org.dmg.pmml.tree.TreeModel;
import org.jpmml.converter.CategoricalFeature;
import org.jpmml.converter.CategoricalLabel;
import org.jpmml.converter.Feature;
import org.jpmml.converter.FortranMatrixUtil;
import org.jpmml.converter.ModelUtil;
import org.jpmml.converter.Schema;
import org.jpmml.converter.ValueUtil;

public class RPartConverter extends TreeModelConverter<RGenericVector> {

	/**
	 * The value of the <code>usesurrogate</code> control parameter of the rpart object.
	 * The constructor only accepts the values 0, 1 and 2.
	 */
	private int useSurrogate = 0;

	/**
	 * The formula created by {@link #encodeSchema(RExpEncoder)}.
	 * It is used for resolving the features of surrogate splits by name; stays <code>null</code> until the schema has been encoded.
	 */
	private Formula formula = null;


	/**
	 * Creates a converter for the specified rpart object.
	 *
	 * @param rpart The rpart object. Its <code>control</code> element must hold a numeric <code>usesurrogate</code> element.
	 *
	 * @throws IllegalArgumentException If the <code>usesurrogate</code> value is not 0, 1 or 2.
	 */
	public RPartConverter(RGenericVector rpart){
		super(rpart);

		RGenericVector control = rpart.getGenericElement("control");

		RNumberVector<?> useSurrogate = control.getNumericElement("usesurrogate");

		this.useSurrogate = ValueUtil.asInt(useSurrogate.asScalar());

		// Fail fast, so that the encoding methods can rely on a supported value
		switch(this.useSurrogate){
			case 0:
			case 1:
			case 2:
				break;
			default:
				throw new IllegalArgumentException("Expected the 'usesurrogate' control parameter to be 0, 1 or 2, got " + this.useSurrogate);
		}
	}

	/**
	 * Tells whether classification trees should carry per-category record counts.
	 *
	 * <p>
	 * When this method returns <code>true</code>, the classification encoder wraps every node into a {@link ClassifierNode}
	 * that holds one {@link ScoreDistribution} per target category, and attaches a probability output to the tree model.
	 * </p>
	 *
	 * @return Always <code>true</code> in this class.
	 */
	public boolean hasScoreDistribution(){
		return true;
	}

	/**
	 * Declares the label and the features of the rpart object with the encoder.
	 *
	 * <p>
	 * The formula is built from the <code>terms</code> element, using the optional <code>xlevels</code> and <code>ylevels</code> attributes.
	 * The created formula is retained in the {@link #formula} field for later by-name feature lookups.
	 * </p>
	 *
	 * @param encoder The encoder that collects the label and feature declarations.
	 */
	@Override
	public void encodeSchema(RExpEncoder encoder){
		RGenericVector model = getObject();

		RGenericVector nodeFrame = model.getGenericElement("frame");
		RExp termsExp = model.getElement("terms");

		// Both attributes are requested as optional
		RGenericVector featureLevels = model.getGenericAttribute("xlevels", false);
		RStringVector targetLevels = model.getStringAttribute("ylevels", false);

		RIntegerVector splitVars = nodeFrame.getFactorElement("var");

		FormulaContext formulaContext = new XLevelsFormulaContext(featureLevels);

		Formula schemaFormula = FormulaUtil.createFormula(termsExp, formulaContext, encoder);

		FormulaUtil.setLabel(schemaFormula, termsExp, targetLevels, encoder);

		// The levels of the "var" factor name the split variables.
		// NOTE(review): presumably the "<leaf>" pseudo-level is expected at position 0 and dropped here - confirm against FormulaUtil
		List<String> featureNames = FormulaUtil.removeSpecialSymbol(RExpUtil.getFactorLevels(splitVars), "<leaf>", 0);

		FormulaUtil.addFeatures(schemaFormula, featureNames, false, encoder);

		this.formula = schemaFormula;
	}

	/**
	 * Encodes the rpart object as a PMML tree model.
	 *
	 * <p>
	 * Builds a per-node lookup table into the rows of the <code>splits</code> matrix,
	 * and then delegates to the regression or classification encoder depending on the <code>method</code> element.
	 * </p>
	 *
	 * @param schema The schema holding the label and the features.
	 *
	 * @return The tree model.
	 *
	 * @throws IllegalArgumentException If the row names of the <code>frame</code> element contain a missing value,
	 * or if the <code>method</code> element is neither <code>anova</code> nor <code>class</code>.
	 */
	@Override
	public TreeModel encodeModel(Schema schema){
		RGenericVector rpart = getObject();

		RGenericVector frame = rpart.getGenericElement("frame");
		RStringVector method = rpart.getStringElement("method");
		RNumberVector<?> splits = rpart.getNumericElement("splits");
		RIntegerVector csplit = rpart.getIntegerElement("csplit", false);

		RIntegerVector var = frame.getIntegerElement("var");
		RIntegerVector n = frame.getIntegerElement("n");
		RIntegerVector ncompete = frame.getIntegerElement("ncompete");
		RIntegerVector nsurrogate = frame.getIntegerElement("nsurrogate");

		RIntegerVector rowNames = frame.getIntegerAttribute("row.names");

		// Integer.MIN_VALUE is the bit pattern of R's NA_integer_.
		// NOTE(review): presumably the RDS parser passes it through unchanged - confirm
		if((rowNames.getValues()).indexOf(Integer.MIN_VALUE) > -1){
			throw new IllegalArgumentException("The row names of the 'frame' element must not contain missing (NA) values");
		}

		// splitInfo[i] = {offset of the first "splits" row of frame row i, number of competitor splits, number of surrogate splits}.
		// The extra trailing row only receives the final running offset
		int[][] splitInfo = new int[1 + rowNames.size()][3];

		for(int offset = 0; offset < rowNames.size(); offset++){
			splitInfo[offset][1] = ncompete.getValue(offset);
			splitInfo[offset][2] = nsurrogate.getValue(offset);

			// A "var" code other than 1 contributes one extra row (the primary split); code 1 is treated as a leaf by encodeNode
			splitInfo[offset + 1][0] = splitInfo[offset][0] + splitInfo[offset][1] + splitInfo[offset][2] + (var.getValue(offset) != 1 ? 1 : 0);
		}

		String methodName = method.asScalar();

		switch(methodName){
			case "anova":
				return encodeRegression(frame, rowNames, var, n, splitInfo, splits, csplit, schema);
			case "class":
				return encodeClassification(frame, rowNames, var, n, splitInfo, splits, csplit, schema);
			default:
				throw new IllegalArgumentException("Unsupported rpart method '" + methodName + "' (expected 'anova' or 'class')");
		}
	}

	/**
	 * Encodes an <code>anova</code> tree as a regression tree model.
	 *
	 * <p>
	 * Every node is scored with the corresponding value of the <code>yval</code> column of the frame,
	 * and its record count is taken from the <code>n</code> column.
	 * </p>
	 *
	 * @param frame The <code>frame</code> element of the rpart object.
	 * @param rowNames The row names of the frame.
	 * @param var The <code>var</code> column of the frame.
	 * @param n The <code>n</code> column of the frame.
	 * @param splitInfo The per-node lookup table into the <code>splits</code> matrix.
	 * @param splits The <code>splits</code> matrix.
	 * @param csplit The <code>csplit</code> matrix; may be <code>null</code>.
	 * @param schema The schema holding the label and the features.
	 *
	 * @return The configured regression tree model.
	 */
	private TreeModel encodeRegression(RGenericVector frame, RIntegerVector rowNames, RIntegerVector var, RIntegerVector n, int[][] splitInfo, RNumberVector<?> splits, RIntegerVector csplit, Schema schema){
		RNumberVector<?> yval = frame.getNumericElement("yval");

		ScoreEncoder scoreEncoder = (Node node, int offset) -> {
			Number prediction = yval.getValue(offset);
			Number count = n.getValue(offset);

			node
				.setScore(prediction)
				.setRecordCount(count);

			return node;
		};

		// The recursion starts from row name 1, using an always-true predicate
		Node root = encodeNode(True.INSTANCE, 1, rowNames, var, n, splitInfo, splits, csplit, scoreEncoder, schema);

		return configureTreeModel(new TreeModel(MiningFunction.REGRESSION, ModelUtil.createMiningSchema(schema.getLabel()), root));
	}

	/**
	 * Encodes a <code>class</code> tree as a classification tree model.
	 *
	 * <p>
	 * The <code>yval2</code> element of the frame is read as a column-major matrix with
	 * <code>1 + 2 * (number of categories) + 1</code> columns: column 0 holds the 1-based index of the predicted category,
	 * and columns <code>1 .. (number of categories)</code> hold the per-category record counts.
	 * </p>
	 *
	 * @param frame The <code>frame</code> element of the rpart object.
	 * @param rowNames The row names of the frame.
	 * @param var The <code>var</code> column of the frame.
	 * @param n The <code>n</code> column of the frame.
	 * @param splitInfo The per-node lookup table into the <code>splits</code> matrix.
	 * @param splits The <code>splits</code> matrix.
	 * @param csplit The <code>csplit</code> matrix; may be <code>null</code>.
	 * @param schema The schema; its label must be a {@link CategoricalLabel}.
	 *
	 * @return The configured classification tree model.
	 */
	private TreeModel encodeClassification(RGenericVector frame, RIntegerVector rowNames, RIntegerVector var, RIntegerVector n, int[][] splitInfo, RNumberVector<?> splits, RIntegerVector csplit, Schema schema){
		RDoubleVector yval2 = frame.getDoubleElement("yval2");

		CategoricalLabel categoricalLabel = (CategoricalLabel)schema.getLabel();

		List<?> categories = categoricalLabel.getValues();

		boolean hasScoreDistribution = hasScoreDistribution();

		int rows = rowNames.size();
		int columns = 1 + (2 * categories.size()) + 1;

		// Snapshot of the predicted category indices (one per frame row)
		List<Integer> predictedClasses = new ArrayList<>(ValueUtil.asIntegers(FortranMatrixUtil.getColumn(yval2.getValues(), rows, columns, 0)));

		// Snapshots of the per-category record count columns; stays empty if score distributions are not requested
		List<List<? extends Number>> categoryRecordCounts = new ArrayList<>();

		if(hasScoreDistribution){

			for(int i = 0; i < categories.size(); i++){
				List<? extends Number> column = FortranMatrixUtil.getColumn(yval2.getValues(), rows, columns, 1 + i);

				categoryRecordCounts.add(new ArrayList<>(column));
			}
		}

		ScoreEncoder scoreEncoder = (Node node, int offset) -> {
			Object score = categories.get(predictedClasses.get(offset) - 1);
			Integer recordCount = n.getValue(offset);

			node
				.setScore(score)
				.setRecordCount(recordCount);

			if(!hasScoreDistribution){
				return node;
			}

			// Switch to a node type that is queried for its score distributions below
			Node classifierNode = new ClassifierNode(node);

			List<ScoreDistribution> scoreDistributions = classifierNode.getScoreDistributions();

			for(int i = 0; i < categories.size(); i++){
				List<? extends Number> recordCounts = categoryRecordCounts.get(i);

				ScoreDistribution scoreDistribution = new ScoreDistribution()
					.setValue(categories.get(i))
					.setRecordCount(recordCounts.get(offset));

				scoreDistributions.add(scoreDistribution);
			}

			return classifierNode;
		};

		Node root = encodeNode(True.INSTANCE, 1, rowNames, var, n, splitInfo, splits, csplit, scoreEncoder, schema);

		TreeModel treeModel = new TreeModel(MiningFunction.CLASSIFICATION, ModelUtil.createMiningSchema(schema.getLabel()), root);

		if(hasScoreDistribution){
			treeModel.setOutput(ModelUtil.createProbabilityOutput(DataType.DOUBLE, categoricalLabel));
		}

		return configureTreeModel(treeModel);
	}

	/**
	 * Sets the no-true-child strategy and the missing value strategy of the tree model.
	 *
	 * <p>
	 * The missing value strategy is derived from the {@link #useSurrogate} field:
	 * 0 maps to <code>NULL_PREDICTION</code>, 1 maps to <code>LAST_PREDICTION</code>, and 2 maps to no explicit strategy (<code>null</code>).
	 * </p>
	 *
	 * @param treeModel The tree model to configure.
	 *
	 * @return The same tree model instance.
	 *
	 * @throws IllegalArgumentException If the {@link #useSurrogate} field holds any other value.
	 */
	private TreeModel configureTreeModel(TreeModel treeModel){
		TreeModel.MissingValueStrategy missingValueStrategy;

		if(this.useSurrogate == 0){
			// NOTE(review): the original author flagged this mapping as questionable ("XXX")
			missingValueStrategy = TreeModel.MissingValueStrategy.NULL_PREDICTION; // XXX
		} else

		if(this.useSurrogate == 1){
			missingValueStrategy = TreeModel.MissingValueStrategy.LAST_PREDICTION;
		} else

		if(this.useSurrogate == 2){
			missingValueStrategy = null;
		} else

		{
			throw new IllegalArgumentException();
		}

		treeModel
			.setNoTrueChildStrategy(TreeModel.NoTrueChildStrategy.RETURN_LAST_PREDICTION)
			.setMissingValueStrategy(missingValueStrategy);

		return treeModel;
	}

	/**
	 * Recursively encodes the node identified by the row name, together with all of its descendants.
	 *
	 * <p>
	 * The children of the node with row name <code>k</code> are looked up under row names <code>2 * k</code> (left) and <code>2 * k + 1</code> (right).
	 * If surrogates are enabled and the node has surrogate splits, the child predicates become <code>SURROGATE</code> compound predicates
	 * consisting of the primary split followed by the surrogate splits.
	 * If <code>useSurrogate</code> is 2, the child with the larger <code>n</code> value additionally gets an always-true fallback,
	 * and is positioned as the last child.
	 * </p>
	 *
	 * @param predicate The predicate of the node.
	 * @param rowName The row name of the node.
	 * @param rowNames The row names of the frame.
	 * @param var The <code>var</code> column of the frame; the value 1 denotes a leaf.
	 * @param n The <code>n</code> column of the frame.
	 * @param splitInfo The per-node lookup table into the <code>splits</code> matrix.
	 * @param splits The <code>splits</code> matrix.
	 * @param csplit The <code>csplit</code> matrix; may be <code>null</code>.
	 * @param scoreEncoder The callback for decorating nodes with score information.
	 * @param schema The schema holding the label and the features.
	 *
	 * @return The encoded node, as returned by the score encoder.
	 */
	private Node encodeNode(Predicate predicate, int rowName, RIntegerVector rowNames, RIntegerVector var, RIntegerVector n, int[][] splitInfo, RNumberVector<?> splits, RIntegerVector csplit, ScoreEncoder scoreEncoder, Schema schema){
		int offset = getIndex(rowNames, rowName);

		Integer id = Integer.valueOf(rowName);

		int splitVar = var.getValue(offset) - 1;

		boolean leaf = (splitVar == 0);
		if(leaf){
			Node leafNode = new CountingLeafNode(null, predicate)
				.setId(id);

			return scoreEncoder.encode(leafNode, offset);
		}

		int leftRowName = 2 * rowName;
		int rightRowName = leftRowName + 1;

		boolean useMajority = (this.useSurrogate == 2);

		// Negative if the right child is the majority direction, positive if the left child is
		int majorityDir = 0;

		if(useMajority){
			int leftOffset = getIndex(rowNames, leftRowName);
			int rightOffset = getIndex(rowNames, rightRowName);

			majorityDir = Integer.compare(n.getValue(leftOffset), n.getValue(rightOffset));
		}

		Feature primaryFeature = schema.getFeature(splitVar - 1);

		int[] nodeSplitInfo = splitInfo[offset];

		int splitOffset = nodeSplitInfo[0];
		int splitNumCompete = nodeSplitInfo[1];
		int splitNumSurrogate = nodeSplitInfo[2];

		List<Predicate> primaryPredicates = encodePredicates(primaryFeature, splitOffset, splits, csplit);

		Predicate leftPredicate = primaryPredicates.get(0);
		Predicate rightPredicate = primaryPredicates.get(1);

		if(this.useSurrogate > 0 && splitNumSurrogate > 0){
			CompoundPredicate leftCompoundPredicate = new CompoundPredicate(CompoundPredicate.BooleanOperator.SURROGATE, null)
				.addPredicates(leftPredicate);

			CompoundPredicate rightCompoundPredicate = new CompoundPredicate(CompoundPredicate.BooleanOperator.SURROGATE, null)
				.addPredicates(rightPredicate);

			RStringVector splitRowNames = splits.dimnames(0);

			// The surrogate split rows follow the primary split row and the competitor split rows
			int firstSurrogateOffset = (splitOffset + 1) + splitNumCompete;

			for(int surrogateSplitOffset = firstSurrogateOffset; surrogateSplitOffset < (firstSurrogateOffset + splitNumSurrogate); surrogateSplitOffset++){
				Feature surrogateFeature = getFeature(FieldName.create(splitRowNames.getValue(surrogateSplitOffset)));

				List<Predicate> surrogatePredicates = encodePredicates(surrogateFeature, surrogateSplitOffset, splits, csplit);

				leftCompoundPredicate.addPredicates(surrogatePredicates.get(0));
				rightCompoundPredicate.addPredicates(surrogatePredicates.get(1));
			}

			leftPredicate = leftCompoundPredicate;
			rightPredicate = rightCompoundPredicate;
		}

		Node leftChild = encodeNode(leftPredicate, leftRowName, rowNames, var, n, splitInfo, splits, csplit, scoreEncoder, schema);
		Node rightChild = encodeNode(rightPredicate, rightRowName, rowNames, var, n, splitInfo, splits, csplit, scoreEncoder, schema);

		if(useMajority){

			if(majorityDir < 0){
				makeDefault(rightChild);
			} else

			if(majorityDir > 0){
				makeDefault(leftChild);

				// The always-matching child must come last
				Node swap = leftChild;

				leftChild = rightChild;
				rightChild = swap;
			}
		}

		Node branchNode = new CountingBranchNode(null, predicate)
			.setId(id)
			.addNodes(leftChild, rightChild);

		return scoreEncoder.encode(branchNode, offset);
	}

	/**
	 * Encodes one row of the <code>splits</code> matrix as a pair of predicates.
	 *
	 * <p>
	 * Column 1 of the matrix (local name <code>ncat</code>) determines the split type, and column 3 (local name <code>index</code>) holds the split value.
	 * A split type of <code>-1</code> or <code>1</code> yields a pair of threshold comparisons against the split value.
	 * Any other split type is treated as a categorical split: the split value is the 1-based row index into the <code>csplit</code> matrix,
	 * where flag 1 sends a category to the left and flag 3 sends it to the right.
	 * </p>
	 *
	 * @param feature The split feature; must be a {@link CategoricalFeature} for categorical splits.
	 * @param splitOffset The row offset into the <code>splits</code> matrix.
	 * @param splits The <code>splits</code> matrix.
	 * @param csplit The <code>csplit</code> matrix; only dereferenced for categorical splits.
	 *
	 * @return A two-element list consisting of the left predicate and the right predicate.
	 */
	private List<Predicate> encodePredicates(Feature feature, int splitOffset, RNumberVector<?> splits, RIntegerVector csplit){
		RIntegerVector splitsDim = splits.dim();

		int splitRows = splitsDim.getValue(0);
		int splitColumns = splitsDim.getValue(1);

		List<? extends Number> typeColumn = FortranMatrixUtil.getColumn(splits.getValues(), splitRows, splitColumns, 1);
		List<? extends Number> valueColumn = FortranMatrixUtil.getColumn(splits.getValues(), splitRows, splitColumns, 3);

		int splitType = ValueUtil.asInt(typeColumn.get(splitOffset));

		Number splitValue = valueColumn.get(splitOffset);

		if(Math.abs(splitType) == 1){
			// The sign of the split type decides which side of the threshold goes to the left
			boolean lessThanGoesLeft = (splitType == -1);

			SimplePredicate.Operator leftOperator = (lessThanGoesLeft ? SimplePredicate.Operator.LESS_THAN : SimplePredicate.Operator.GREATER_OR_EQUAL);
			SimplePredicate.Operator rightOperator = (lessThanGoesLeft ? SimplePredicate.Operator.GREATER_OR_EQUAL : SimplePredicate.Operator.LESS_THAN);

			Predicate leftThresholdPredicate = createSimplePredicate(feature, leftOperator, splitValue);
			Predicate rightThresholdPredicate = createSimplePredicate(feature, rightOperator, splitValue);

			return Arrays.asList(leftThresholdPredicate, rightThresholdPredicate);
		}

		CategoricalFeature categoricalFeature = (CategoricalFeature)feature;

		RIntegerVector csplitDim = csplit.dim();

		int csplitRows = csplitDim.getValue(0);
		int csplitColumns = csplitDim.getValue(1);

		List<Integer> directionFlags = FortranMatrixUtil.getRow(csplit.getValues(), csplitRows, csplitColumns, ValueUtil.asInt(splitValue) - 1);

		List<?> categoryValues = categoricalFeature.getValues();

		Predicate leftSetPredicate = createSimpleSetPredicate(categoricalFeature, selectValues(categoryValues, directionFlags, 1));
		Predicate rightSetPredicate = createSimpleSetPredicate(categoricalFeature, selectValues(categoryValues, directionFlags, 3));

		return Arrays.asList(leftSetPredicate, rightSetPredicate);
	}

	/**
	 * Turns the node into a fallback child by appending an always-true predicate to its predicate.
	 *
	 * <p>
	 * If the current predicate is not a {@link CompoundPredicate}, it is first wrapped into a new <code>SURROGATE</code> compound predicate,
	 * which is then set on the node. An existing compound predicate is extended in place.
	 * </p>
	 *
	 * @param node The node to modify.
	 */
	private void makeDefault(Node node){
		Predicate currentPredicate = node.getPredicate();

		CompoundPredicate surrogatePredicate;

		if(!(currentPredicate instanceof CompoundPredicate)){
			surrogatePredicate = new CompoundPredicate(CompoundPredicate.BooleanOperator.SURROGATE, null)
				.addPredicates(currentPredicate);

			node.setPredicate(surrogatePredicate);
		} else

		{
			surrogatePredicate = (CompoundPredicate)currentPredicate;
		}

		surrogatePredicate.addPredicates(True.INSTANCE);
	}

	/**
	 * Resolves a feature by name, using the formula stored in the {@link #formula} field.
	 *
	 * <p>
	 * The field is only assigned by {@link #encodeSchema(RExpEncoder)};
	 * calling this method before that fails with a {@link NullPointerException}.
	 * </p>
	 *
	 * @param name The name of the field.
	 *
	 * @return The feature, as resolved by the formula.
	 */
	private Feature getFeature(FieldName name){
		return this.formula.resolveFeature(name);
	}

	/**
	 * Finds the position of a row name among the row names of the frame.
	 *
	 * @param rowNames The row names of the frame.
	 * @param rowName The row name to look up.
	 *
	 * @return The zero-based position of the row name.
	 *
	 * @throws IllegalArgumentException If the row name is not found.
	 */
	static
	private int getIndex(RIntegerVector rowNames, int rowName){
		int index = rowNames.indexOf(rowName);
		if(index < 0){
			// Report the offending value, so that an inconsistent tree structure can be diagnosed
			throw new IllegalArgumentException("Row name " + rowName + " not found among the row names of the 'frame' element");
		}

		return index;
	}

	/**
	 * Selects the values whose same-position flag equals the specified flag.
	 *
	 * <p>
	 * The flags list must be at least as long as the values list; surplus flags are ignored.
	 * </p>
	 *
	 * @param values The candidate values.
	 * @param valueFlags The flags; the flag at position <code>i</code> belongs to the value at position <code>i</code>.
	 * @param flag The flag to match.
	 *
	 * @return A new list of matching values, in their original order.
	 */
	static
	private <E> List<E> selectValues(List<E> values, List<Integer> valueFlags, int flag){
		List<E> selected = new ArrayList<>(values.size());

		int position = 0;

		for(E candidate : values){
			int candidateFlag = valueFlags.get(position);

			if(candidateFlag == flag){
				selected.add(candidate);
			}

			position++;
		}

		return selected;
	}

	/**
	 * A callback for decorating a freshly created tree node with score information.
	 */
	static
	private interface ScoreEncoder {

		/**
		 * Decorates the node with the score information of one frame row.
		 *
		 * @param node The node to decorate.
		 * @param offset The zero-based position of the frame row that corresponds to the node.
		 *
		 * @return The decorated node. Callers must use the returned reference, because an implementation may return a different node instance than the one passed in.
		 */
		Node encode(Node node, int offset);
	}
}