CVE/CVE_R/R/cve_simple.R

#' Simple implementation of the CVE method. 'Simple' means that this method is
#' a classic GD method unsing no further tricks.
#'
#' @keywords internal
#' @export
cve_simple <- function(X, Y, k,
                       nObs = sqrt(nrow(X)),
                       h = NULL,
                       tau = 1.0,
                       tol = 1e-3,
                       slack = 0,
                       epochs = 50L,
                       attempts = 10L,
                       logger = NULL
) {
    # Set `grad` functions environment to enable if to find this environments
    # local variabels, needed to enable the manipulation of this local variables
    # from within `grad`.
    environment(grad) <- environment()

    # Get dimensions.
    n <- nrow(X) # Number of samples.
    p <- ncol(X) # Data dimensions
    q <- p - k   # Complement dimension of the SDR space.

    # Save initial learning rate `tau`.
    tau.init <- tau
    # Addapt tolearance for break condition.
    tol <- sqrt(2 * q) * tol

    # Estaimate bandwidth if not given.
    if (missing(h) || !is.numeric(h)) {
        h <- estimate.bandwidth(X, k, nObs)
    }

    # Compute persistent data.
    # Compute lookup indexes for symmetrie, lower/upper
    # triangular parts and vectorization.
    pair.index <- elem.pairs(seq(n))
    i <- pair.index[1, ] # `i` indices of `(i, j)` pairs
    j <- pair.index[2, ] # `j` indices of `(i, j)` pairs
    # Index of vectorized matrix, for lower and upper triangular part.
    lower <- ((i - 1) * n) + j
    upper <- ((j - 1) * n) + i

    # Create all pairewise differences of rows of `X`.
    X_diff <- X[i, , drop = F] - X[j, , drop = F]
    # Identity matrix.
    I_p <- diag(1, p)

    # Init tracking of current best (according multiple attempts).
    V.best <- NULL
    loss.best <- Inf

    # Start loop for multiple attempts.
    for (attempt in 1:attempts) {
        # Reset learning rate `tau`.
        tau <- tau.init

        # Sample a `(p, q)` dimensional matrix from the stiefel manifold as
        # optimization start value.
        V <- rStiefl(p, q)

        # Initial loss and gradient.
        loss <- Inf
        G <- grad(X, Y, V, h, loss.out = TRUE, persistent = TRUE)
        # Set last loss (aka, loss after applying the step).
        loss.last <- loss

        # Cayley transform matrix `A`
        A <- (G %*% t(V)) - (V %*% t(G))

        # Call logger with initial values before starting optimization.
        if (is.function(logger)) {
            epoch <- 0 # Set epoch count to 0 (only relevant for logging).
            error <- NA
            logger(environment())
        }

        ## Start optimization loop.
        for (epoch in 1:epochs) {
            # Apply learning rate `tau`.
            A.tau <- tau * A
            # Parallet transport (on Stiefl manifold) into direction of `G`.
            V.tau <- solve(I_p + A.tau) %*% ((I_p - A.tau) %*% V)

            # Loss at position after a step.
            loss <- grad(X, Y, V.tau, h, loss.only = TRUE, persistent = TRUE)

            # Check if step is appropriate, iff not reduce learning rate.
            if ((loss - loss.last) > slack * loss.last) {
                tau <- tau / 2
                next() # Keep position and try with smaller `tau`.
            }

            # Compute error.
            error <- norm(V %*% t(V) - V.tau %*% t(V.tau), type = "F")

            # Check break condition (epoch check to skip ignored gradient calc).
            # Note: the devision by `sqrt(2 * k)` is included in `tol`.
            if (error < tol || epoch >= epochs) {
                # take last step and stop optimization.
                V <- V.tau
                # Call logger last time befor stoping.
                if (is.function(logger)) {
                    logger(environment())
                }
                break()
            }

            # Perform the step and remember previous loss.
            V <- V.tau
            loss.last <- loss

            # Call logger after taking a step.
            if (is.function(logger)) {
                logger(environment())
            }

            # Compute gradient at new position.
            G <- grad(X, Y, V, h, persistent = TRUE)

            # Cayley transform matrix `A`
            A <- (G %*% t(V)) - (V %*% t(G))
        }

        # Check if current attempt improved previous ones
        if (loss < loss.best) {
            loss.best <- loss
            V.best <- V
        }

    }

    return(list(
        loss = loss.best,
        V = V.best,
        B = null(V.best),
        h = h
    ))
}
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`#' Simple implementation of the CVE method. 'Simple' means that this method is`
			`#' a classic GD method unsing no further tricks.`
			`#'`
			`#' @keywords internal`
			`#' @export`
			`cve_simple <- function(X, Y, k,`
			`nObs = sqrt(nrow(X)),`
			`h = NULL,`
			`tau = 1.0,`
			`tol = 1e-3,`
			`slack = 0,`
			`epochs = 50L,`
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`attempts = 10L,`
			`logger = NULL`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`) {`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			# Set `grad` functions environment to enable if to find this environments
			`# local variabels, needed to enable the manipulation of this local variables`
			# from within `grad`.
			`environment(grad) <- environment()`

add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`# Get dimensions.`
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`n <- nrow(X) # Number of samples.`
			`p <- ncol(X) # Data dimensions`
			`q <- p - k # Complement dimension of the SDR space.`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			# Save initial learning rate `tau`.
			`tau.init <- tau`
			`# Addapt tolearance for break condition.`
			`tol <- sqrt(2 * q) * tol`

add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`# Estaimate bandwidth if not given.`
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`if (missing(h) \|\| !is.numeric(h)) {`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`h <- estimate.bandwidth(X, k, nObs)`
			`}`

add: cve_linesearch, fix: cleaned and optimized gradient, add. notes 2019-09-02 19:07:56 +00:00			`# Compute persistent data.`
			`# Compute lookup indexes for symmetrie, lower/upper`
			`# triangular parts and vectorization.`
			`pair.index <- elem.pairs(seq(n))`
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			i <- pair.index[1, ] # `i` indices of `(i, j)` pairs
			j <- pair.index[2, ] # `j` indices of `(i, j)` pairs
			`# Index of vectorized matrix, for lower and upper triangular part.`
			`lower <- ((i - 1) * n) + j`
			`upper <- ((j - 1) * n) + i`
add: cve_linesearch, fix: cleaned and optimized gradient, add. notes 2019-09-02 19:07:56 +00:00
			# Create all pairewise differences of rows of `X`.
			`X_diff <- X[i, , drop = F] - X[j, , drop = F]`
			`# Identity matrix.`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`I_p <- diag(1, p)`

fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# Init tracking of current best (according multiple attempts).`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`V.best <- NULL`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`loss.best <- Inf`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# Start loop for multiple attempts.`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`for (attempt in 1:attempts) {`
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			# Reset learning rate `tau`.
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`tau <- tau.init`

			# Sample a `(p, q)` dimensional matrix from the stiefel manifold as
			`# optimization start value.`
			`V <- rStiefl(p, q)`

fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# Initial loss and gradient.`
			`loss <- Inf`
add: cve_linesearch, fix: cleaned and optimized gradient, add. notes 2019-09-02 19:07:56 +00:00			`G <- grad(X, Y, V, h, loss.out = TRUE, persistent = TRUE)`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# Set last loss (aka, loss after applying the step).`
			`loss.last <- loss`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			# Cayley transform matrix `A`
			`A <- (G %% t(V)) - (V %% t(G))`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`# Call logger with initial values before starting optimization.`
			`if (is.function(logger)) {`
			`epoch <- 0 # Set epoch count to 0 (only relevant for logging).`
			`error <- NA`
			`logger(environment())`
			`}`

add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`## Start optimization loop.`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`for (epoch in 1:epochs) {`
			# Apply learning rate `tau`.
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`A.tau <- tau * A`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			# Parallet transport (on Stiefl manifold) into direction of `G`.
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`V.tau <- solve(I_p + A.tau) %% ((I_p - A.tau) %% V)`

fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# Loss at position after a step.`
add: cve_linesearch, fix: cleaned and optimized gradient, add. notes 2019-09-02 19:07:56 +00:00			`loss <- grad(X, Y, V.tau, h, loss.only = TRUE, persistent = TRUE)`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`# Check if step is appropriate, iff not reduce learning rate.`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`if ((loss - loss.last) > slack * loss.last) {`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`tau <- tau / 2`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			next() # Keep position and try with smaller `tau`.
			`}`

			`# Compute error.`
			`error <- norm(V %% t(V) - V.tau %% t(V.tau), type = "F")`
add: cve_linesearch, fix: cleaned and optimized gradient, add. notes 2019-09-02 19:07:56 +00:00
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# Check break condition (epoch check to skip ignored gradient calc).`
			# Note: the devision by `sqrt(2 * k)` is included in `tol`.
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`if (error < tol \|\| epoch >= epochs) {`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# take last step and stop optimization.`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`V <- V.tau`
wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`# Call logger last time befor stoping.`
			`if (is.function(logger)) {`
			`logger(environment())`
			`}`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`break()`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`}`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00
			`# Perform the step and remember previous loss.`
			`V <- V.tau`
			`loss.last <- loss`

wip: writing C gradient version 2019-09-12 16:42:28 +00:00			`# Call logger after taking a step.`
			`if (is.function(logger)) {`
			`logger(environment())`
			`}`

fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`# Compute gradient at new position.`
add: cve_linesearch, fix: cleaned and optimized gradient, add. notes 2019-09-02 19:07:56 +00:00			`G <- grad(X, Y, V, h, persistent = TRUE)`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00
			# Cayley transform matrix `A`
			`A <- (G %% t(V)) - (V %% t(G))`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`}`

			`# Check if current attempt improved previous ones`
fix: cve_simple runs correct, add: notes 2019-09-02 13:22:35 +00:00			`if (loss < loss.best) {`
			`loss.best <- loss`
			`V.best <- V`
add: runtime test, add: new CVE pure R implementation, fix: small adaptation of legacy code to make it run, wip: ... 2019-08-30 19:16:52 +00:00			`}`

			`}`

			`return(list(`
			`loss = loss.best,`
			`V = V.best,`
			`B = null(V.best),`
			`h = h`
			`))`
			`}`