1#ifndef UMAPPP_INITIALIZE_HPP
2#define UMAPPP_INITIALIZE_HPP
5#include "combine_neighbor_sets.hpp"
7#include "neighbor_similarities.hpp"
8#include "spectral_init.hpp"
/**
 * Pick the number of optimization epochs.
 *
 * If the caller supplied `num_epochs`, that value is used.
 * Otherwise the count is derived from the number of observations: datasets up to
 * `limit` (10000) observations get `minimal + maximal` (500) epochs, and larger
 * datasets get `minimal` (200) epochs plus an extra amount that shrinks in
 * inverse proportion to `size`, so that `extra * size` stays at roughly
 * `maximal * limit`.
 *
 * NOTE(review): the listing this was reviewed from had dropped the statement
 * inside the `has_value()` branch and the condition selecting between the two
 * returns. Both are reconstructed here (`*num_epochs` and `size <= limit`);
 * confirm against the upstream header.
 *
 * @tparam Index_ Integer type of the observation count.
 * @param num_epochs Optional user-specified number of epochs.
 * @param size Number of observations.
 * @return Number of epochs to run.
 */
template<typename Index_>
int choose_num_epochs(const std::optional<int> num_epochs, const Index_ size) {
    if (num_epochs.has_value()) {
        return *num_epochs;
    }

    constexpr Index_ limit = 10000;
    constexpr int minimal = 200;
    constexpr int maximal = 300;

    // Small inputs take the constant branch. The formula below yields exactly
    // `maximal` at `size == limit`, so the two branches agree at the threshold,
    // and a zero `size` never reaches the division.
    if (size <= limit) {
        return minimal + maximal;
    }

    const double extra = std::ceil(maximal * static_cast<double>(limit) / static_cast<double>(size));
    return minimal + static_cast<int>(extra);
}
73template<
typename Index_,
typename Float_>
75 internal::NeighborSimilaritiesOptions<Float_> nsopt;
79 internal::neighbor_similarities(x, nsopt);
81 internal::combine_neighbor_sets(x,
static_cast<Float_
>(options.
mix_ratio));
85 const bool spectral_okay = internal::spectral_init(
100 internal::random_init<Index_>(
110 if (!options.
a.has_value() || !options.
b.has_value()) {
111 const auto found = internal::find_ab(options.
spread, options.
min_dist);
112 options.
a = found.first;
113 options.
b = found.second;
142template<
typename Index_,
typename Input_,
typename Float_>
145 return initialize(std::move(output), num_dim, embedding, std::move(options));
169template<
typename Index_,
typename Float_,
class Matrix_ = knncolle::Matrix<Index_, Float_> >
171 const std::size_t data_dim,
172 const Index_ num_obs,
173 const Float_*
const data,
175 const std::size_t num_dim,
176 Float_*
const embedding,
180 return initialize(*prebuilt, num_dim, embedding, std::move(options));
Defines the NeighborList alias.
Status of the UMAP algorithm.
std::unique_ptr< Prebuilt< Index_, Data_, Distance_ > > build_unique(const Matrix_ &data) const
Status of the UMAP optimization iterations.
Definition Status.hpp:26
NeighborList< Index_, Distance_ > find_nearest_neighbors(const Prebuilt< Index_, Data_, Distance_ > &index, int k, int num_threads=1)
Functions for creating UMAP embeddings.
Definition initialize.hpp:22
knncolle::NeighborList< Index_, Float_ > NeighborList
Lists of neighbors for each observation.
Definition NeighborList.hpp:29
Status< Index_, Float_ > initialize(NeighborList< Index_, Float_ > x, const std::size_t num_dim, Float_ *const embedding, Options options)
Definition initialize.hpp:74
Options for initialize().
Definition Options.hpp:36
double initialize_random_scale
Definition Options.hpp:138
double mix_ratio
Definition Options.hpp:56
double negative_sample_rate
Definition Options.hpp:170
std::optional< double > a
Definition Options.hpp:78
bool initialize_spectral_jitter
Definition Options.hpp:124
std::optional< double > b
Definition Options.hpp:86
InitializeMethod initialize_method
Definition Options.hpp:97
double bandwidth
Definition Options.hpp:48
double min_dist
Definition Options.hpp:70
std::optional< int > num_epochs
Definition Options.hpp:158
double initialize_spectral_jitter_sd
Definition Options.hpp:130
int num_neighbors
Definition Options.hpp:177
irlba::Options initialize_spectral_irlba_options
Definition Options.hpp:109
double spread
Definition Options.hpp:62
int num_threads
Definition Options.hpp:191
RngEngine::result_type initialize_seed
Definition Options.hpp:146
bool initialize_random_on_spectral_fail
Definition Options.hpp:104
double local_connectivity
Definition Options.hpp:42
double initialize_spectral_scale
Definition Options.hpp:117