13#ifndef MLPACK_METHODS_HOEFFDING_TREES_HOEFFDING_CATEGORICAL_SPLIT_HPP
14#define MLPACK_METHODS_HOEFFDING_TREES_HOEFFDING_CATEGORICAL_SPLIT_HPP
43template<
typename FitnessFunction>
58 const size_t numClasses = 0);
67 const size_t numClasses,
77 void Train(eT value,
const size_t label);
//! Return the number of children the node would have if it were to split.
//! The value reported is the column count of sufficientStatistics.
93 size_t NumChildren()
const {
return sufficientStatistics.n_cols; }
110 template<
typename Archive>
113 ar & BOOST_SERIALIZATION_NVP(sufficientStatistics);
120 arma::Mat<size_t> sufficientStatistics;
127#include "hoeffding_categorical_split_impl.hpp"
This is the standard Hoeffding-bound categorical feature proposed in the paper below:
void Train(eT value, const size_t label)
Train on the given value with the given label.
void Split(arma::Col< size_t > &childMajorities, SplitInfo &splitInfo)
Gather the information for a split: get the labels of the child majorities, and initialize the SplitInfo object.
size_t NumChildren() const
Return the number of children, if the node were to split.
size_t MajorityClass() const
Get the majority class seen so far.
double MajorityProbability() const
Get the probability of the majority class given the points seen so far.
HoeffdingCategoricalSplit(const size_t numCategories, const size_t numClasses, const HoeffdingCategoricalSplit &other)
Create the HoeffdingCategoricalSplit given a number of categories for this dimension and a number of classes; an existing HoeffdingCategoricalSplit (other) is also passed in.
void EvaluateFitnessFunction(double &bestFitness, double &secondBestFitness) const
Given the points seen so far, evaluate the fitness function, returning the gain for the best possible split and for the second best possible split (in bestFitness and secondBestFitness).
HoeffdingCategoricalSplit(const size_t numCategories=0, const size_t numClasses=0)
Create the HoeffdingCategoricalSplit given a number of categories for this dimension and a number of classes.
CategoricalSplitInfo SplitInfo
The type of split information required by the HoeffdingCategoricalSplit.
void serialize(Archive &ar, const unsigned int)
Serialize the categorical split.
Linear algebra utility functions, generally performed on matrices or vectors.
The core includes that mlpack expects; standard C++ includes and Armadillo.