X-Git-Url: https://git.auder.net/?p=valse.git;a=blobdiff_plain;f=R%2Fmain.R;h=42852d368f19592ab4a0ca7565dfc99a63b6f36b;hp=00b1be9b60aac9b41fa7709d51245b79a11d2ae3;hb=31463ab809c0195273ff2760606ea65361d721ab;hpb=39046da6016f15d625bd99cf0303ea8beb838c79

diff --git a/R/main.R b/R/main.R
index 00b1be9..42852d3 100644
--- a/R/main.R
+++ b/R/main.R
@@ -1,58 +1,61 @@
-SelMix = setRefClass(
-	Class = "selmix",
+#' @useDynLib valse
+
+Valse = setRefClass(
+	Class = "Valse",
 
 	fields = c(
 		# User defined
 
 		# regression data (size n*p, where n is the number of observations,
 		# and p is the number of regressors)
-		X = "numeric",
-		# response data (size n*m, where n is the number of observations, 
+		X = "matrix",
+		# response data (size n*m, where n is the number of observations,
 		# and m is the number of responses)
-		Y = "numeric",
+		Y = "matrix",
 
 		# Optionally user defined (some default values)
 
 		# power in the penalty
-		gamma = "double",
+		gamma = "numeric",
 		# minimum number of iterations for EM algorithm
 		mini = "integer",
 		# maximum number of iterations for EM algorithm
 		maxi = "integer",
 		# threshold for stopping EM algorithm
-		eps = "double",
+		eps = "numeric",
 		# minimum number of components in the mixture
 		kmin = "integer",
 		# maximum number of components in the mixture
 		kmax = "integer",
-		rangmin = "integer",
-		rangmax = "integer",
-		
+		# ranks for the Lasso-Rank procedure
+		rank.min = "integer",
+		rank.max = "integer",
+
 		# Computed through the workflow
 
 		# initialisation for the reparametrized conditional mean parameter
-		phiInit,
+		phiInit = "numeric",
 		# initialisation for the reparametrized variance parameter
-		rhoInit,
+		rhoInit = "numeric",
 		# initialisation for the proportions
-		piInit,
+		piInit = "numeric",
 		# initialisation for the allocations probabilities in each component
-		tauInit,
+		tauInit = "numeric",
 		# values for the regularization parameter grid
-		gridLambda = [];
+		gridLambda = "numeric",
 		# je ne crois pas vraiment qu'il faille les mettre en sortie, d'autant plus qu'on construit
 		# une matrice A1 et A2 pour chaque k, et elles sont grandes, donc ca coute un peu cher ...
-		A1,
-		A2,
+		A1 = "integer",
+		A2 = "integer",
 		# collection of estimations for the reparametrized conditional mean parameters
-		Phi,
+		Phi = "numeric",
 		# collection of estimations for the reparametrized variance parameters
-		Rho,
+		Rho = "numeric",
 		# collection of estimations for the proportions parameters
-		Pi,
+		Pi = "numeric",
 
-		#immutable
-		seuil = 1e-15;
+		#immutable (TODO:?)
+		thresh = "numeric"
 	),
 
 	methods = list(
@@ -61,20 +64,21 @@ SelMix = setRefClass(
 		#######################
 		initialize = function(X,Y,...)
 		{
-			"Initialize SelMix object"
+			"Initialize Valse object"
 
 			callSuper(...)
 
-			X <<- X;
-			Y <<- Y;
+			X <<- X
+			Y <<- Y
 			gamma <<- ifelse (hasArg("gamma"), gamma, 1.)
 			mini <<- ifelse (hasArg("mini"), mini, as.integer(5))
 			maxi <<- ifelse (hasArg("maxi"), maxi, as.integer(10))
 			eps <<- ifelse (hasArg("eps"), eps, 1e-6)
 			kmin <<- ifelse (hasArg("kmin"), kmin, as.integer(2))
 			kmax <<- ifelse (hasArg("kmax"), kmax, as.integer(3))
-			rangmin <<- ifelse (hasArg("rangmin"), rangmin, as.integer(2))
-			rangmax <<- ifelse (hasArg("rangmax"), rangmax, as.integer(3))
+			rank.min <<- ifelse (hasArg("rank.min"), rank.min, as.integer(2))
+			rank.max <<- ifelse (hasArg("rank.max"), rank.max, as.integer(3))
+			thresh <<- 1e-15 #immutable (TODO:?)
 		},
 
 		##################################
@@ -88,11 +92,11 @@ SelMix = setRefClass(
 			#smallEM initializes parameters by k-means and regression model in each component,
 			#doing this 20 times, and keeping the values maximizing the likelihood after 10
 			#iterations of the EM algorithm.
-			init = initSmallEM(k,sx.X,sx.Y,sx.eps);
-			phiInit <<- init$phi0;
-			rhoInit <<- init$rho0;
-			piInit	<<- init$pi0;
-			tauInit <<- init$tau0;
+			init = initSmallEM(k,X,Y,eps)
+			phiInit <<- init$phi0
+			rhoInit <<- init$rho0
+			piInit	<<- init$pi0
+			tauInit <<- init$tau0
 		},
 
 		computeGridLambda = function()
@@ -100,8 +104,7 @@ SelMix = setRefClass(
 			"computation of the regularization grid"
 			#(according to explicit formula given by EM algorithm)
 
-			gridLambda <<- grillelambda(sx.phiInit,sx.rhoInit,sx.piInit,sx.tauInit,sx.X,sx.Y,
-				sx.gamma,sx.mini,sx.maxi,sx.eps);
+			gridLambda <<- gridLambda(phiInit,rhoInit,piInit,tauInit,X,Y,gamma,mini,maxi,eps)
 		},
 
 		computeRelevantParameters = function()
@@ -109,10 +112,10 @@ SelMix = setRefClass(
 			"Compute relevant parameters"
 
 			#select variables according to each regularization parameter
-			#from the grid: sx.A1 corresponding to selected variables, and
-			#sx.A2 corresponding to unselected variables.
-			params = selectiontotale(sx.phiInit,sx.rhoInit,sx.piInit,sx.tauInit,sx.mini,sx.maxi,
-				sx.gamma,sx.gridLambda,sx.X,sx.Y,sx.seuil,sx.eps);
+			#from the grid: A1 corresponding to selected variables, and
+			#A2 corresponding to unselected variables.
+			params = selectiontotale(
+				phiInit,rhoInit,piInit,tauInit,mini,maxi,gamma,gridLambda,X,Y,thresh,eps)
 			A1 <<- params$A1
 			A2 <<- params$A2
 			Rho <<- params$Rho
@@ -125,9 +128,8 @@ SelMix = setRefClass(
 
 			#compute parameter estimations, with the Maximum Likelihood
 			#Estimator, restricted on selected variables.
-			res = constructionModelesLassoMLE(sx.phiInit,sx.rhoInit,sx.piInit,sx.tauInit,
-				sx.mini,sx.maxi,sx.gamma,sx.gridLambda,sx.X,sx.Y,sx.seuil,sx.eps,sx.A1,sx.A2);
-			return (list( phi=res$phi, rho=res$rho, pi=res$pi))
+			return ( constructionModelesLassoMLE(
+				phiInit,rhoInit,piInit,tauInit,mini,maxi,gamma,gridLambda,X,Y,thresh,eps,A1,A2) )
 		},
 
 		runProcedure2 = function()
@@ -136,75 +138,75 @@ SelMix = setRefClass(
 
 			#compute parameter estimations, with the Low Rank
 			#Estimator, restricted on selected variables.
-			return (constructionModelesLassoRank(sx.Pi,sx.Rho,sx.mini,sx.maxi,sx.X,sx.Y,sx.eps,
-				sx.A1,sx.rangmin,sx.rangmax)$phi)
+			return ( constructionModelesLassoRank(Pi,Rho,mini,maxi,X,Y,eps,
+				A1,rank.min,rank.max) )
 		},
 
-		run = function(procedure)
+		run = function()
 		{
 			"main loop: over all k and all lambda"
 
-			# Run the all procedure, 1 with the
+			# Run the whole procedure, 1 with the
 			#maximum likelihood refitting, and 2 with the Low Rank refitting.
-				p = dim(phiInit)[1]
-				m = dim(phiInit)[2]
-				for (k in kmin:kmax)
+			p = dim(phiInit)[1]
+			m = dim(phiInit)[2]
+			for (k in kmin:kmax)
+			{
+				print(k)
+				initParameters(k)
+				computeGridLambda()
+				computeRelevantParameters()
+				if (procedure == 1)
+				{
+					r1 = runProcedure1()
+					Phi2 = Phi
+					Rho2 = Rho
+					Pi2 = Pi
+					p = ncol(X)
+					m = ncol(Y)
+					if (is.null(dim(Phi2))) #test was: size(Phi2) == 0
+					{
+						Phi[,,1:k] <<- r1$phi
+						Rho[,,1:k] <<- r1$rho
+						Pi[1:k,] <<- r1$pi
+					} else
+					{
+						Phi <<- array(0., dim=c(p,m,kmax,dim(Phi2)[4]+dim(r1$phi)[4]))
+						Phi[,,1:(dim(Phi2)[3]),1:(dim(Phi2)[4])] <<- Phi2
+						Phi[,,1:k,dim(Phi2)[4]+1] <<- r1$phi
+						Rho <<- array(0., dim=c(m,m,kmax,dim(Rho2)[4]+dim(r1$rho)[4]))
+						Rho[,,1:(dim(Rho2)[3]),1:(dim(Rho2)[4])] <<- Rho2
+						Rho[,,1:k,dim(Rho2)[4]+1] <<- r1$rho
+						Pi <<- array(0., dim=c(kmax,dim(Pi2)[2]+dim(r1$pi)[2]))
+						Pi[1:nrow(Pi2),1:ncol(Pi2)] <<- Pi2
+						Pi[1:k,ncol(Pi2)+1] <<- r1$pi
+					}
+				} else
 				{
-					print(k)
-					initParameters(k)
-					computeGridLambda()
-					computeRelevantParameters()
-					if (procedure == 1)
+					phi = runProcedure2()$phi
+					Phi2 = Phi
+					if (dim(Phi2)[1] == 0)
+					{
+						Phi[,,1:k,] <<- phi
+					} else
 					{
-						r1 = runProcedure1(sx)
-						Phi2 = Phi
-						Rho2 = Rho
-						Pi2 = Pi
-						p = ncol(X)
-						m = ncol(Y)
-						if size(Phi2) == 0 #TODO: continue translation MATLAB --> R
-						sx.Phi(:,:,1:k,:) = r1$phi;
-						sx.Rho(:,:,1:k,:) = r1$rho;
-						sx.Pi(1:k,:) = r1$pi;
-						else
-						sx.Phi = zeros(p,m,sx.kmax,size(Phi2,4)+size(r1$phi,4));
-						sx.Phi(:,:,1:size(Phi2,3),1:size(Phi2,4)) = Phi2;
-						sx.Phi(:,:,1:k,size(Phi2,4)+1:end) = r1$phi;
-						sx.Rho = zeros(m,m,sx.kmax,size(Rho2,4)+size(r1$rho,4));
-						sx.Rho(:,:,1:size(Rho2,3),1:size(Rho2,4)) = Rho2;
-						sx.Rho(:,:,1:k,size(Rho2,4)+1:end) = r1$rho;
-						sx.Pi = zeros(sx.kmax,size(Pi2,2)+size(r1$pi,2));
-						sx.Pi(1:size(Pi2,1),1:size(Pi2,2)) = Pi2;
-						sx.Pi(1:k,size(Pi2,2)+1:end) = r1$pi;
-						end
-				else
-						[phi] = runProcedure2(sx);
-						phi
-						Phi2 = sx.Phi;
-						if size(Phi2,1) == 0
-						sx.Phi(:,:,1:k,:) = phi;
-						else
-						size(Phi2)
-						sx.Phi = zeros(p,m,sx.kmax,size(Phi2,4)+size(phi,4));
-						size(sx.Phi)
-						sx.Phi(:,:,1:size(Phi2,3),1:size(Phi2,4)) = Phi2;
-						sx.Phi(:,:,1:k,size(Phi2,4)+1:end) = phi;
-						end
-						
-				end
-				
-				
-				end
-		end
-		
+						Phi <<- array(0., dim=c(p,m,kmax,dim(Phi2)[4]+dim(phi)[4]))
+						Phi[,,1:(dim(Phi2)[3]),1:(dim(Phi2)[4])] <<- Phi2
+						Phi[,,1:k,-(1:(dim(Phi2)[4]))] <<- phi
+					}
+				}
+			}
+		}
+
 		##################################################
-		#pruning: select only one (or a few best ?!) model
+		#TODO: pruning: select only one (or a few best ?!) model
 		##################################################
 		#
-		# 		function[model] selectModel(sx)
+		# 		function[model] selectModel(
 		# 			#TODO
-		# 			#model = sxModel(...);
+		# 			#model = odel(...)
 		# 		end
-		
+		# Give at least the slope heuristic and BIC, and AIC ?
+
 		)
 )