15 #ifndef __MLPACK_CORE_TREE_COSINE_TREE_COSINE_TREE_HPP
16 #define __MLPACK_CORE_TREE_COSINE_TREE_COSINE_TREE_HPP
19 #include <boost/heap/priority_queue.hpp>
25 class CompareCosineNode;
29 typedef boost::heap::priority_queue<
CosineTree*,
55 CosineTree(CosineTree& parentNode,
const std::vector<size_t>& subIndices);
92 arma::vec& newBasisVector,
93 arma::vec* addBasisVector = NULL);
108 CosineNodeQueue& treeQueue,
109 arma::vec* addBasisVector1 = NULL,
110 arma::vec* addBasisVector2 = NULL);
133 arma::vec& probabilities,
size_t numSamples);
155 size_t BinarySearch(arma::vec& cDistribution,
double value,
size_t start,
250 bool operator() (
const CosineTree* a,
const CosineTree* b)
const
void CalculateCosines(arma::vec &cosines)
Calculate cosines of the columns present in the node, with respect to the sampled splitting point...
CosineTree * left
Left child of the node.
std::vector< size_t > indices
Indices of columns of input matrix in the node.
Linear algebra utility functions, generally performed on matrices or vectors.
size_t numColumns
Number of columns of input matrix in the node.
arma::vec l2NormsSquared
L2-norm squared of columns in the node.
size_t SplitPointIndex() const
Get the column index of split point of the node.
double FrobNormSquared() const
Get the Frobenius norm squared of columns in the node.
void CosineNodeSplit()
This function splits the cosine node into two children based on the cosines of the columns contained ...
double MonteCarloError(CosineTree *node, CosineNodeQueue &treeQueue, arma::vec *addBasisVector1=NULL, arma::vec *addBasisVector2=NULL)
Estimates the squared error of the projection of the input node's matrix onto the current vector subs...
size_t splitPointIndex
Index of split point of cosine node.
void GetFinalBasis(arma::mat &finalBasis)
Returns the basis of the constructed subspace.
size_t ColumnSampleLS()
Sample a point from the Length-Squared distribution of the cosine node.
arma::vec centroid
Centroid of columns of input matrix in the node.
const arma::mat & dataset
Matrix for which cosine tree is constructed.
arma::vec & Centroid()
Get a reference to the centroid vector.
void ConstructBasis(CosineNodeQueue &treeQueue)
Constructs the final basis matrix, after the cosine tree construction.
~CosineTree()
Destroy the cosine tree and all of its children (take care of the memory allocations too)...
double epsilon
Error tolerance fraction for calculated subspace.
bool operator()(const CosineTree *a, const CosineTree *b) const
CosineTree * Left()
Get pointer to the left child of the node.
CosineTree(const arma::mat &dataset)
CosineTree constructor for the root node of the tree.
void BasisVector(arma::vec &bVector)
Set the basis vector of the node.
size_t BinarySearch(arma::vec &cDistribution, double value, size_t start, size_t end)
Sample a column based on the cumulative Length-Squared distribution of the cosine node...
arma::vec & BasisVector()
Get the basis vector of the node.
void CalculateCentroid()
Calculate centroid of the columns present in the node.
CosineTree * parent
Parent of the node.
arma::vec basisVector
Orthonormalized basis vector of the node.
CosineTree * right
Right child of the node.
double L2Error() const
Get the Monte Carlo error.
size_t NumColumns() const
Get number of columns of input matrix in the node.
CosineTree * Right()
Get pointer to the right child of the node.
void ModifiedGramSchmidt(CosineNodeQueue &treeQueue, arma::vec &centroid, arma::vec &newBasisVector, arma::vec *addBasisVector=NULL)
Calculates the orthonormalization of the passed centroid, with respect to the current vector subspace...
boost::heap::priority_queue< CosineTree *, boost::heap::compare< CompareCosineNode > > CosineNodeQueue
double l2Error
Monte Carlo error for this node.
arma::mat basis
Subspace basis of the input dataset.
double frobNormSquared
Frobenius norm squared of columns in the node.
void ColumnSamplesLS(std::vector< size_t > &sampledIndices, arma::vec &probabilities, size_t numSamples)
Sample 'numSamples' points from the Length-Squared distribution of the cosine node.
void L2Error(const double error)
Set the Monte Carlo error.
const arma::mat & GetDataset() const
Get a reference to the dataset matrix.
std::vector< size_t > & VectorIndices()
Get the indices of columns in the node.
double delta
Cumulative probability for Monte Carlo error lower bound.