1#ifndef UMAPPP_INITIALIZE_HPP
2#define UMAPPP_INITIALIZE_HPP
5#include "combine_neighbor_sets.hpp"
7#include "neighbor_similarities.hpp"
8#include "spectral_init.hpp"
// Selects the number of optimization epochs from an optional user-supplied
// value and the dataset size.
//
// Template parameter:
//   Index_  - integer type of `size`; also the type of the `limit` constant.
// Parameters:
//   num_epochs - optional explicit epoch count.
//   size       - size of the dataset (presumably the number of observations
//                -- confirm against the caller).
// Returns: an `int` epoch count.
//
// NOTE(review): this listing is elided. The leading numbers are line-number
// residue from the extracted source view, and the statements between the
// numbered lines (as well as the closing braces) are not visible here.
29template<
typename Index_>
30int choose_num_epochs(
const std::optional<int> num_epochs,
const Index_ size) {
// Branch taken when the caller supplied an explicit value. The branch body is
// not shown in this listing; presumably it returns that value -- confirm.
31 if (num_epochs.has_value()) {
// Constants for the automatic choice: `minimal` is the base epoch count,
// `maximal` is the extra amount added on top of it, and `limit` is the
// dataset size used as the numerator of the scaling ratio below.
42 constexpr Index_ limit = 10000;
43 const int minimal = 200, maximal = 300;
// Fixed result of minimal + maximal = 500 epochs. The guarding condition is
// not visible; presumably it applies when `size <= limit` -- confirm.
45 return minimal + maximal;
// Otherwise the extra epochs are scaled by limit / size, so the added amount
// shrinks as `size` grows. Both operands are cast to double so the division
// is done in floating point; the product is rounded up with std::ceil before
// being converted back to int.
47 return minimal +
static_cast<int>(std::ceil(maximal *
static_cast<double>(limit) /
static_cast<double>(size)));
// Fragment of a function template over `Index_` and `Float_`.
// NOTE(review): the signature line (listing line 75) is missing from this
// extract. The cross-reference entry for initialize.hpp:75 gives it as
//   Status<Index_, Float_> initialize(NeighborList<Index_, Float_> x,
//       const std::size_t num_dim, Float_* const embedding, Options options)
// so `x` and `options` below are presumably those parameters -- confirm
// against the full file. Many intermediate lines are also not shown.
74template<
typename Index_,
typename Float_>
// Options object handed to neighbor_similarities(); any fields set on it are
// assigned on lines that are not visible in this listing.
76 internal::NeighborSimilaritiesOptions<Float_> nsopt;
// Pass the neighbor list and the options to the similarity step.
80 internal::neighbor_similarities(x, nsopt);
// Combine the neighbor sets of `x`, passing `options.mix_ratio` converted to
// the working floating-point type `Float_`.
82 internal::combine_neighbor_sets(x,
static_cast<Float_
>(options.
mix_ratio));
// Records the boolean result of spectral_init(); its argument list is cut off
// in this listing.
86 const bool spectral_okay = internal::spectral_init(
// Call to random_init(); its arguments and the condition under which it runs
// are not visible. Presumably a fallback when the spectral initialization is
// not usable -- confirm.
100 internal::random_init<Index_>(
// If either curve parameter `a` or `b` is non-positive, both are replaced
// with the pair returned by find_ab() for the configured `spread` and
// `min_dist`: `.first` goes to `a`, `.second` goes to `b`.
110 if (options.
a <= 0 || options.
b <= 0) {
111 const auto found = internal::find_ab(options.
spread, options.
min_dist);
112 options.
a = found.first;
113 options.
b = found.second;
// Fragment of a function template over `Index_`, `Input_` and `Float_`.
// NOTE(review): the signature and the statement that produces `output` are
// missing from this extract. `output` is presumably the result of a
// nearest-neighbor search on a prebuilt index -- confirm against the full
// file.
143template<
typename Index_,
typename Input_,
typename Float_>
// Delegates to another initialize() overload. `output` and `options` are
// moved rather than copied; `num_dim` and `embedding` are passed through
// unchanged.
146 return initialize(std::move(output), num_dim, embedding, std::move(options));
// Fragment of a function template over `Index_` and `Float_`, with a
// `Matrix_` parameter that defaults to knncolle::Matrix<Index_, Float_>.
// NOTE(review): the line holding the return type and function name (listing
// line 172), some parameters, and the statements that create `prebuilt` are
// missing from this extract.
//
// Visible parameters:
//   data_dim  - std::size_t; presumably the dimensionality of the input data
//               -- confirm.
//   num_obs   - Index_; presumably the number of observations -- confirm.
//   data      - const pointer to const Float_ input values (layout not shown
//               here).
//   num_dim   - std::size_t, forwarded unchanged to the delegated call.
//   embedding - const pointer to mutable Float_, forwarded unchanged to the
//               delegated call.
171template<
typename Index_,
typename Float_,
class Matrix_ = knncolle::Matrix<Index_, Float_> >
173 const std::size_t data_dim,
174 const Index_ num_obs,
175 const Float_*
const data,
177 const std::size_t num_dim,
178 Float_*
const embedding,
// Delegates to another initialize() overload, dereferencing `prebuilt` (a
// pointer-like object defined on lines not shown; presumably the search index
// built from `data` -- confirm) and moving `options` into the call.
182 return initialize(*prebuilt, num_dim, embedding, std::move(options));
Defines the NeighborList alias.
Status of the UMAP algorithm.
std::unique_ptr< Prebuilt< Index_, Data_, Distance_ > > build_unique(const Matrix_ &data) const
Status of the UMAP optimization iterations.
Definition Status.hpp:26
NeighborList< Index_, Distance_ > find_nearest_neighbors(const Prebuilt< Index_, Data_, Distance_ > &index, int k, int num_threads=1)
Methods for UMAP.
Definition initialize.hpp:22
knncolle::NeighborList< Index_, Float_ > NeighborList
Lists of neighbors for each observation.
Definition NeighborList.hpp:29
Status< Index_, Float_ > initialize(NeighborList< Index_, Float_ > x, const std::size_t num_dim, Float_ *const embedding, Options options)
Definition initialize.hpp:75
Options for initialize().
Definition Options.hpp:33
double initialize_random_scale
Definition Options.hpp:126
double mix_ratio
Definition Options.hpp:53
double negative_sample_rate
Definition Options.hpp:157
bool initialize_spectral_jitter
Definition Options.hpp:114
InitializeMethod initialize_method
Definition Options.hpp:92
double bandwidth
Definition Options.hpp:45
double min_dist
Definition Options.hpp:65
std::optional< int > num_epochs
Definition Options.hpp:144
double initialize_spectral_jitter_sd
Definition Options.hpp:120
double b
Definition Options.hpp:81
int num_neighbors
Definition Options.hpp:164
double a
Definition Options.hpp:73
double spread
Definition Options.hpp:58
int num_threads
Definition Options.hpp:178
RngEngine::result_type initialize_seed
Definition Options.hpp:133
bool initialize_random_on_spectral_fail
Definition Options.hpp:99
double local_connectivity
Definition Options.hpp:39
double initialize_spectral_scale
Definition Options.hpp:107