16 #ifndef __MLPACK_METHODS_KMEANS_REFINED_START_HPP 17 #define __MLPACK_METHODS_KMEANS_REFINED_START_HPP 61 template<
typename MatType>
62 void Cluster(
const MatType& data,
63 const size_t clusters,
64 arma::Row<size_t>& assignments)
const;
77 template<
typename Archive>
95 #include "refined_start_impl.hpp" size_t Samplings() const
Get the number of samplings that will be performed.
void Serialize(Archive &ar, const unsigned int)
Serialize the object.
Linear algebra utility functions, generally performed on matrices or vectors.
FirstShim< T > CreateNVP(T &t, const std::string &name, typename boost::enable_if< HasSerialize< T >>::type *=0)
Call this function to produce a name-value pair; this is similar to BOOST_SERIALIZATION_NVP(), but should be used for types that have a Serialize() function (or contain a type that has a Serialize() function) instead of a serialize() function.
RefinedStart(const size_t samplings=100, const double percentage=0.02)
Create the RefinedStart object, optionally specifying parameters for the number of samplings to perform and the percentage of the dataset to use in each sampling.
void Cluster(const MatType &data, const size_t clusters, arma::Row< size_t > &assignments) const
Partition the given dataset into the given number of clusters according to the random sampling scheme, storing the resulting cluster assignments in the assignments parameter.
double & Percentage()
Modify the percentage of the data used by each subsampling.
double percentage
The percentage of the data to use for each subsampling.
double Percentage() const
Get the percentage of the data used by each subsampling.
size_t samplings
The number of samplings to perform.
Include all of the base components required to write MLPACK methods, and the main MLPACK Doxygen documentation.
A refined approach for choosing initial points for k-means clustering.
size_t & Samplings()
Modify the number of samplings that will be performed.