ppclp: Probabilistic Principal Curve with Length Penalty

Documented in ppclp2D ppclp3D

#' 2D prbabilistic principal curve with length penalty
#'
#' This function applies the probabilistic principal curve algorithm with length penalty
#'
#' @param x The coordinate of the x axis
#' @param y The coordinate of the y axis
#' @param x_fix The cordinate of the starting point of the curve
#' @param y_fix The coordinate of the ending point of the curve
#' @param K the number of knots of the curve
#' @param degree_free the degree of freedom of the B spline
#' @param lambda The magnitude value added to the length penalty
#' @param T The total number of iterations to do the EM algorithm
#' @import tidyverse splines splines2
#' @export ppclp2D
#' @examples
#' data("threeExample")
#' tmpCurve = ppclp2D(threeExample$x, threeExample$y, threeExample$xFix, threeExample$yFix)
#' plot(threeExample$x, threeExample$y, xlim = c(0,1), ylim = c(0,1), pch = 16, cex = 0.8)
#' lines(tmpCurve$xFit, tmpCurve$yFit, type = "l", col = "red", lwd = 5)



ppclp2D <- function(x, y, x_fix, y_fix, K = 50, degree_free = 10, lambda = 0.5, T = 100){
  ## Total number of points in the curve
  N = length(x)

  ## Basis for the spline
  w <- seq(0, 2 * pi, by = 2 * pi / K)[1 : K]
  B = cbind(1, bs(w, df = degree_free))
  B_der = cbind(0, dbs(w, df = degree_free))
  B_der_der = cbind(0, dbs(w, df = degree_free, derivs = 2))
  B_tilde = B[c(1, nrow(B)), ]


  ## PI is the matrix of p_ik
  PI = matrix(1 / K, nrow = N, ncol = K)
  PI_sum_old = rep(1 / K, K)

  ## sigma is the variance of the noise in the gaussian distribution
  sigma_old = 1

  ## beta_x and beta_y are the coefficients for the splines to the x-axis and y-axis
  beta_x_old = runif(degree_free + 1, -5, 5)
  beta_y_old = runif(degree_free + 1, -5, 5)

  likelihood_store = c()

  length_penalty = t(B_der) %*% B_der / K * 2 * pi
  smooth_penalty = t(B_der_der) %*% B_der_der / K * 2 * pi

  ## The procedure of the EM-Algorithm
  for(t in 1 : T){

    ## items used during the EM procedure
    x.i.matrix = matrix(x,nrow=length(x),ncol=K,byrow=FALSE)
    x.k.matrix = matrix(B %*% beta_x_old, nrow = N, ncol = length(B %*% beta_x_old), byrow = TRUE)
    y.i.matrix = matrix(y,nrow = length(y), ncol = K, byrow = FALSE)
    y.k.matrix = matrix(B %*% beta_y_old, nrow = N, ncol = length(B %*% beta_y_old), byrow = TRUE)

    ## E-step
    PI = exp(-1 / as.numeric((2 * sigma_old)) * ((x.i.matrix - x.k.matrix) ^ 2 + (y.i.matrix - y.k.matrix)^ 2)) %*% diag(PI_sum_old)
    PI = PI / apply(PI, 1, sum)

    ## M-step
    ## Update PI_sum
    PI_sum_new = 1 / N * apply(PI, 2, sum)

    ## Update sigma
    sigma_temp = 0
    sigma_temp = sum(((x.i.matrix - x.k.matrix)^2 + (y.i.matrix - y.k.matrix)^2 ) * PI)
    sigma_new =  sigma_temp / (2 * N)

    ## Update beta_x and beta_y
    B_XX = 0
    B_YY = 0
    B_ZZ = 0
    B_XY = 0

    for(i in 1 : N){
      B_XX = B_XX + t(B) %*% as.matrix(PI[i, ]) * x[i]
      B_YY = B_YY + t(B) %*% as.matrix(PI[i, ]) * y[i]
    }

    diag_B = apply(PI, 2, sum) %>% diag
    B_XY = t(B) %*% diag_B %*% B

    ## Inverse matrix for the estimation
    Inverse_M = solve(B_XY + lambda * length_penalty )

    beta_x_new  = Inverse_M %*% B_XX
    beta_y_new  = Inverse_M %*% B_YY

    ## Psu-inverse matrix for the estimation of coefficient

    Inverse_P = Inverse_M %*% t(B_tilde) %*%
      solve(B_tilde %*% Inverse_M %*% t(B_tilde))

    beta_x_new = beta_x_new -
      Inverse_P %*%
      (B_tilde %*% beta_x_new - x_fix)

    beta_y_new = beta_y_new -
      Inverse_P %*%
      (B_tilde %*% beta_y_new - y_fix)

    ## Computation of the log likelihood
    likelihood = 0
    for(i in 1 : N){
      likelihood_temp = 0
      for(k in 1 : K){
        likelihood_temp = likelihood_temp + PI_sum_new[k] * 1 / sigma_new * exp(-1/(2 * sigma_new) * ((x[i] - B[k, ] %*% beta_x_new )^2 + (y[i] - B[k, ] %*% beta_y_new)^2))
      }
      likelihood = likelihood +  log(likelihood_temp)
    }

    PI_sum_old = PI_sum_new
    sigma_old = sigma_new
    beta_x_old = beta_x_new
    beta_y_old = beta_y_new

    #print(likelihood)
    likelihood_store = c(likelihood_store, likelihood)

  }

  plot(x,y, xlim = c(0,1), ylim = c(0,1), pch = 16, cex = 0.8)
  lines(B %*% beta_x_new, B %*% beta_y_new, type = "l", col = "red", lwd = 5)
  dev.off()

  return(list(xFit = B %*% beta_x_new, yFit = B %*% beta_y_new))
}



#' 3D prbabilistic principal curve with length penalty
#'
#' This function applies the probabilistic principal curve algorithm with length penalty to 3D data
#'
#' @param x The coordinate of the x axis
#' @param y The coordinate of the y axis
#' @param z The coordinate of the z axis
#' @param x_fix The x coordinate of the starting and endingpoint of the curve
#' @param y_fix The y coordinate of the starting and endingpoint of the curve
#' @param z_fix The z coordinate of the starting and endingpoint of the curve
#' @param K the number of knots of the curve
#' @param degree_free the degree of freedom of the B spline
#' @param lambda The magnitude value added to the length penalty
#' @param T The total number of iterations to do the EM algorithm
#' @import tidyverse splines splines2
#' @export ppclp3D
#' @examples
#' data("spectExample")
#' tmpCurve = ppclp3D(spectExample$x, spectExample$y, spectExample$z, spectExample$xFix, spectExample$yFix, spectExample$zFix)
#' plot_ly() %>% add_trace(x = spectExample$x, y = spectExample$y, z = spectExample$z, type = "scatter3d", mode = "markers", name = 'points', marker = list(size = 1, color = 'rgba(0, 0, 0, .9)', opacity = 0.4)) %>%
#'  add_trace(x = spectExample$xFix[1], y = spectExample$yFix[1], z = spectExample$zFix[1], type = "scatter3d", mode = "markers", name = 'A', marker = list(size = 10, color = 'rgba(0, 255, 0, .9)', opacity = 1)) %>%
#'  add_trace(x = spectExample$xFix[2], y = spectExample$yFix[2], z = spectExample$zFix[2], type = "scatter3d", mode = "markers", name = 'M', marker = list(size = 10, color = 'rgba(0, 0, 255, .9)', opacity = 1)) %>%
#'  add_trace(x = as.vector(tmpCurve$xFit), y = as.vector(tmpCurve$yFit), z = as.vector(tmpCurve$zFit), type = "scatter3d", mode = "lines", name = "theoretical line", line = list(width = 5, color = 'rgba(255, 0, 0, .9)'))



ppclp3D <- function(x, y, z, x_fix, y_fix, z_fix, K = 200, degree_free = 50, lambda = 100, T = 20){
  N = length(x)

  ## Basis for the spline
  w <- seq(0, 2 * pi, by = 2 * pi / K)[1 : K]
  B = cbind(1, bs(w, df = degree_free))
  B_der = cbind(0, dbs(w, df = degree_free))
  B_der_der = cbind(0, dbs(w, df = degree_free, derivs = 2))
  B_tilde = B[c(1,nrow(B)), ]


  ## PI is the matrix of p_ik
  PI = matrix(1 / K, nrow = N, ncol = K)
  PI_sum_old = rep(1 / K, K)

  ## sigma is the variance of the noise in the gaussian distribution
  sigma_old = 1

  ## beta_x and beta_y are the coefficients for the splines to the x-axis and y-axis
  beta_x_old = runif(degree_free + 1, -5, 5) * 0
  beta_y_old = runif(degree_free + 1, -5, 5) * 0
  beta_z_old = runif(degree_free + 1, -5, 5) * 0

  likelihood_store = c()

  length_penalty = t(B_der) %*% B_der / K * 2 * pi
  smooth_penalty = t(B_der_der) %*% B_der_der / K * 2 * pi


  ## The procedure of the EM-Algorithm
  for(t in 1 : T){
    ## items used during the EM procedure
    x.i.matrix = matrix(x,nrow=length(x),ncol=K,byrow=FALSE)
    x.k.matrix = matrix(B %*% beta_x_old, nrow = N, ncol = length(B %*% beta_x_old), byrow = TRUE)
    y.i.matrix = matrix(y,nrow = length(y), ncol = K, byrow = FALSE)
    y.k.matrix = matrix(B %*% beta_y_old, nrow = N, ncol = length(B %*% beta_y_old), byrow = TRUE)
    z.i.matrix = matrix(z, nrow = length(z), ncol = K, byrow = FALSE)
    z.k.matrix = matrix(B %*% beta_z_old, nrow = N, ncol = length(B %*% beta_z_old), byrow = TRUE)

    sigma_old = matrix(sigma_old, nrow = N, ncol = K)

    ## E-step
    PI = exp(-1 / as.numeric((2 * sigma_old)) * ((x.i.matrix - x.k.matrix) ^ 2 + (y.i.matrix - y.k.matrix)^ 2 + (z.i.matrix - z.k.matrix)^ 2)) %*% diag(PI_sum_old)
    PI = PI / apply(PI, 1, sum)


    ## M-step
    ## Update PI_sum
    PI_sum_new = 1 / N * apply(PI, 2, sum)

    ## Update sigma
    sigma_temp = 0
    sigma_temp = sum(((x.i.matrix - x.k.matrix)^2 + (y.i.matrix - y.k.matrix)^2 + (z.i.matrix - z.k.matrix)^2) * PI)
    sigma_new = 1 * sigma_temp / (3 * N)

    ## Update beta_x and beta_y
    B_XX = 0
    B_YY = 0
    B_ZZ = 0
    B_XY = 0

    for(i in 1 : N){
      #B_XY = B_XY + t(B) %*% diag(PI[i, ]) %*% B
      B_XX = B_XX + t(B) %*% as.matrix(PI[i, ]) * x[i]
      B_YY = B_YY + t(B) %*% as.matrix(PI[i, ]) * y[i]
      B_ZZ = B_ZZ + t(B) %*% as.matrix(PI[i, ]) * z[i]
    }

    diag_B = apply(PI, 2, sum) %>% diag
    B_XY = t(B) %*% diag_B %*% B
    #B_XX = apply(t(B) %*% (t(PI) %*% diag(x)), 1, sum)


    ## Inverse matrix for the estimation
    Inverse_M = solve(B_XY + lambda * length_penalty)

    beta_x_new  = Inverse_M %*% B_XX
    beta_y_new  = Inverse_M %*% B_YY
    beta_z_new  = Inverse_M %*% B_ZZ

    ## Psu-inverse matrix for the estimation of coefficient

    Inverse_P = Inverse_M %*% t(B_tilde) %*%
      solve(B_tilde %*% Inverse_M %*% t(B_tilde))

    beta_x_new = beta_x_new -
      Inverse_P %*%
      (B_tilde %*% beta_x_new - x_fix)

    beta_y_new = beta_y_new -
      Inverse_P %*%
      (B_tilde %*% beta_y_new - y_fix)

    beta_z_new = beta_z_new -
      Inverse_P %*%
      (B_tilde %*% beta_z_new - z_fix)


    PI_sum_old = PI_sum_new
    sigma_old = sigma_new
    beta_x_old = beta_x_new
    beta_y_old = beta_y_new
    beta_z_old = beta_z_new

    print(t)

  }

  ## Plot the Principal for the Colon Image
  x.fit = B %*% beta_x_new
  y.fit = B %*% beta_y_new
  z.fit = B %*% beta_z_new

  return(list(xFit = x.fit, yFit = y.fit, zFit = z.fit))

}





# library(oro.nifti)
# library(brainR)
# library(rgl)
#
# Img = readANALYZE("/Users/huanchen/Downloads/DREAM-Amer_Sabrine/J001_Product\ A/J001_111516_2hr/1.2.840.113704.3.1.32161115.10110.83/J001_111516_2\ hr_ECTHd1_IRAC001_DS.img")
# ctImg = readNIfTI("/Users/huanchen/Downloads/DREAM-Amer_Sabrine/J001_Product\ A/J001_111516_2hr/1.2.840.113704.3.1.32161115.10110.83/J001_111516_2\ hr_ECTHd1_IRAC001_DS.nii.gz")
#
#
# nColLevels = 11
# col = c(gray(0), heat.colors(nColLevels - 1))
# colCT = gray(seq(0, 1, length = nColLevels))
#
# withinThresh = Img[Img >= 10]
# withinThreshCT = ctImg[ctImg >= 10]
# breaks = quantile(withinThresh, (0 : nColLevels) / nColLevels)
# breaksCT = c(0, quantile(withinThreshCT, (0 : (nColLevels - 1)) / (nColLevels - 1)))
#
# XYZ = c(70, 70, 32)
#
# image(z = ctImg[,,XYZ[3]],
#       1 : dim(Img)[1],
#       1 : dim(Img)[2],
#       col = colCT,
#       asp = 1,
#       axes = FALSE,
#       #breaks = breaksCT,
#       xlab= "",
#       ylab = ""
# )
#
#
# image(z = Img[, ,XYZ[3]],
#       1 : dim(Img)[1],
#       1 : dim(Img)[2],
#       col = col,
#       breaks = breaks,
#       asp = 1,
#       axes = FALSE,
#       add = TRUE
# )
#
# title("Z slice")
# abline(v = XYZ[1], col = "white", lwd = 3)
# abline(h = XYZ[2], col = "white", lwd = 3)
#
#
# spectExample = list(x = spectExample$x, y = spectExample$y, z = spectExample$z, xFix = spectExample$xFix, yFix = spectExample$yFix, zFix = spectExample$zFix, Img = Img, ctImg = ctImg)
#
# save(spectExample, file = "data/spectExample.RData")
#
#
#