#include <mlpack/prereqs.hpp>
#include <mlpack/core/util/io.hpp>
#include <mlpack/core/data/normalize_labels.hpp>
#include <mlpack/core/util/mlpack_main.hpp>
#include <mlpack/core/math/random.hpp>
#include <mlpack/core/metrics/lmetric.hpp>
#include "nca.hpp"
#include <ensmallen.hpp>

Include dependency graph for nca_main.cpp:

This graph shows which files directly or indirectly include this file:

Functions
	BINDING_NAME ("Neighborhood Components Analysis (NCA)")

	BINDING_SHORT_DESC ("An implementation of neighborhood components analysis, a distance learning" " technique that can be used for preprocessing. Given a labeled dataset, " "this uses NCA, which seeks to improve the k-nearest-neighbor " "classification, and returns the learned distance metric.")

	BINDING_LONG_DESC ("This program implements Neighborhood Components Analysis, both a linear " "dimensionality reduction technique and a distance learning technique. The" " method seeks to improve k-nearest-neighbor classification on a dataset " "by scaling the dimensions. The method is nonparametric, and does not " "require a value of k. It works by using stochastic (\"soft\") neighbor " "assignments and using optimization techniques over the gradient of the " "accuracy of the neighbor assignments." "\n\n" "To work, this algorithm needs labeled data. It can be given as the last " "row of the input dataset (specified with "+PRINT_PARAM_STRING("input")+"), or alternatively as a separate matrix (specified with "+PRINT_PARAM_STRING("labels")+")." "\n\n" "This implementation of NCA uses stochastic gradient descent, mini-batch " "stochastic gradient descent, or the L_BFGS optimizer. These optimizers do" " not guarantee global convergence for a nonconvex objective function " "(NCA's objective function is nonconvex), so the final results could depend" " on the random seed or other optimizer parameters." "\n\n" "Stochastic gradient descent, specified by the value 'sgd' for the " "parameter "+PRINT_PARAM_STRING("optimizer")+", depends " "primarily on three parameters: the step size (specified with "+PRINT_PARAM_STRING("step_size")+"), the batch size (specified with "+PRINT_PARAM_STRING("batch_size")+"), and the maximum number of iterations" " (specified with "+PRINT_PARAM_STRING("max_iterations")+"). In " "addition, a normalized starting point can be used by specifying the "+PRINT_PARAM_STRING("normalize")+" parameter, which is necessary if many " "warnings of the form 'Denominator of p_i is 0!' are given. Tuning the " "step size can be a tedious affair. In general, the step size is too large" " if the objective is not mostly uniformly decreasing, or if zero-valued " "denominator warnings are being issued. The step size is too small if the " "objective is changing very slowly." "\n\n" "Setting the termination condition can " "be done easily once a good step size parameter is found; either increase " "the maximum iterations to a large number and allow SGD to find a minimum, " "or set the maximum iterations to 0 (allowing infinite iterations) and set " "the tolerance (specified by "+PRINT_PARAM_STRING("tolerance")+") to " "define the maximum allowed difference between objectives for SGD to " "terminate. Be careful---setting the tolerance instead of the maximum " "iterations can take a very long time and may actually never converge due " "to the properties of the SGD optimizer. Note that a single iteration of " "SGD refers to a single point, so to take a single pass over the dataset, " "set the value of the "+PRINT_PARAM_STRING("max_iterations")+" parameter equal to the number of points in the dataset." "\n\n" "The L-BFGS optimizer, specified by the value 'lbfgs' for the parameter "+PRINT_PARAM_STRING("optimizer")+", uses a back-tracking line search " "algorithm to minimize a function. The following parameters are used by " "L-BFGS: "+PRINT_PARAM_STRING("num_basis")+" (specifies the number" " of memory points used by L-BFGS), "+PRINT_PARAM_STRING("max_iterations")+", "+PRINT_PARAM_STRING("armijo_constant")+", "+PRINT_PARAM_STRING("wolfe")+", "+PRINT_PARAM_STRING("tolerance")+" (the optimization is terminated when the gradient norm is below this " "value), "+PRINT_PARAM_STRING("max_line_search_trials")+", "+PRINT_PARAM_STRING("min_step")+", and "+PRINT_PARAM_STRING("max_step")+" (which both refer to the line search " "routine). For more details on the L-BFGS optimizer, consult either the " "mlpack L-BFGS documentation (in lbfgs.hpp) or the vast set of published " "literature on L-BFGS." "\n\n" "By default, the SGD optimizer is used.")

	BINDING_SEE_ALSO ("@lmnn", "#lmnn")

	BINDING_SEE_ALSO ("Neighbourhood components analysis on Wikipedia", "https://en.wikipedia.org/wiki/Neighbourhood_components_analysis")

	BINDING_SEE_ALSO ("Neighbourhood components analysis (pdf)", "http://papers.nips.cc/paper/2566-neighbourhood-components-" "analysis.pdf")

	BINDING_SEE_ALSO ("mlpack::nca::NCA C++ class documentation", "@doxygen/classmlpack_1_1nca_1_1NCA.html")

	PARAM_MATRIX_IN_REQ ("input", "Input dataset to run NCA on.", "i")

	PARAM_MATRIX_OUT ("output", "Output matrix for learned distance matrix.", "o")

	PARAM_UROW_IN ("labels", "Labels for input dataset.", "l")

	PARAM_STRING_IN ("optimizer", "Optimizer to use; 'sgd' or 'lbfgs'.", "O", "sgd")

	PARAM_FLAG ("normalize", "Use a normalized starting point for optimization. This" " is useful for when points are far apart, or when SGD is returning NaN.", "N")

	PARAM_INT_IN ("max_iterations", "Maximum number of iterations for SGD or L-BFGS " "(0 indicates no limit).", "n", 500000)

	PARAM_DOUBLE_IN ("tolerance", "Maximum tolerance for termination of SGD or " "L-BFGS.", "t", 1e-7)

	PARAM_DOUBLE_IN ("step_size", "Step size for stochastic gradient descent " "(alpha).", "a", 0.01)

	PARAM_FLAG ("linear_scan", "Don't shuffle the order in which data points are " "visited for SGD or mini-batch SGD.", "L")

	PARAM_INT_IN ("batch_size", "Batch size for mini-batch SGD.", "b", 50)

	PARAM_INT_IN ("num_basis", "Number of memory points to be stored for L-BFGS.", "B", 5)

	PARAM_DOUBLE_IN ("armijo_constant", "Armijo constant for L-BFGS.", "A", 1e-4)

	PARAM_DOUBLE_IN ("wolfe", "Wolfe condition parameter for L-BFGS.", "w", 0.9)

	PARAM_INT_IN ("max_line_search_trials", "Maximum number of line search trials " "for L-BFGS.", "T", 50)

	PARAM_DOUBLE_IN ("min_step", "Minimum step of line search for L-BFGS.", "m", 1e-20)

	PARAM_DOUBLE_IN ("max_step", "Maximum step of line search for L-BFGS.", "M", 1e20)

	PARAM_INT_IN ("seed", "Random seed. If 0, 'std::time(NULL)' is used.", "s", 0)

Detailed Description

Author: Ryan Curtin

Executable for Neighborhood Components Analysis.

mlpack is free software; you may redistribute it and/or modify it under the terms of the 3-clause BSD license. You should have received a copy of the 3-clause BSD license along with mlpack. If not, see http://www.opensource.org/licenses/BSD-3-Clause for more information.

Functions

Detailed Description