[morpheus.git] / pkg / R / multiRun.R

#' multiRun
#'
#' Estimate N times some parameters, outputs of some list of functions. This method is
#' thus very generic, allowing typically bootstrap or Monte-Carlo estimations of matrices
#' μ or β. Passing a list of functions opens the possibility to compare them on a fair
#' basis (exact same inputs). It's even possible to compare methods on some deterministic
#' design of experiments.
#'
#' @param fargs List of arguments for the estimation functions
#' @param estimParams List of nf function(s) to apply on fargs - shared signature
#' @param prepareArgs Prepare arguments for the functions inside estimParams
#' @param N Number of runs
#' @param ncores Number of cores for parallel runs (<=1: sequential)
#' @param verbose TRUE to indicate runs + methods numbers
#'
#' @return A list of nf aggregates of N results (matrices).
#'
#' @examples
#' \dontrun{
#' β <- matrix(c(1,-2,3,1),ncol=2)
#'
#' # Bootstrap + computeMu, morpheus VS flexmix ; assumes fargs first 3 elts X,Y,K
#' io <- generateSampleIO(n=1000, p=1/2, β=β, b=c(0,0), "logit")
#' μ <- normalize(β)
#' res <- multiRun(list(X=io$X,Y=io$Y,optargs=list(K=2,jd_nvects=0)), list(
#'   # morpheus
#'   function(fargs) {
#'     library(morpheus)
#'     ind <- fargs$ind
#'     computeMu(fargs$X[ind,],fargs$Y[ind],fargs$optargs)
#'   },
#'   # flexmix
#'   function(fargs) {
#'     library(flexmix)
#'     ind <- fargs$ind
#'     K <- fargs$optargs$K
#'     dat = as.data.frame( cbind(fargs$Y[ind],fargs$X[ind,]) )
#'     out = refit( flexmix( cbind(V1, 1 - V1) ~ 0+., data=dat, k=K,
#'       model=FLXMRglm(family="binomial") ) )
#'     normalize( matrix(out@@coef[1:(ncol(fargs$X)*K)], ncol=K) )
#'   } ),
#'   prepareArgs = function(fargs) {
#'     fargs$ind <- sample(1:nrow(fargs$X),replace=TRUE)
#'     fargs
#'   }, N=10, ncores=3)
#' for (i in 1:2)
#'   res[[i]] <- alignMatrices(res[[i]], ref=μ, ls_mode="exact")
#'
#' # Monte-Carlo + optimParams from X,Y, morpheus VS flexmix ; first args n,p,β,b
#' res <- multiRun(list(n=1000,p=1/2,β=β,b=c(0,0),optargs=list(link="logit")),list(
#'   # morpheus
#'   function(fargs) {
#'     library(morpheus)
#'     K <- fargs$optargs$K
#'     μ <- computeMu(fargs$X, fargs$Y, fargs$optargs)
#'     V <- list( p=rep(1/K,K-1), β=μ, b=c(0,0) )
#'     optimParams(V,fargs$optargs)$β
#'   },
#'   # flexmix
#'   function(fargs) {
#'     library(flexmix)
#'     K <- fargs$optargs$K
#'     dat <- as.data.frame( cbind(fargs$Y,fargs$X) )
#'     out <- refit( flexmix( cbind(V1, 1 - V1) ~ 0+., data=dat, k=K,
#'       model=FLXMRglm(family="binomial") ) )
#'     sapply( seq_len(K), function(i) as.double( out@@components[[1]][[i]][,1] ) )
#'   } ),
#'   prepareArgs = function(fargs) {
#'     library(morpheus)
#'     io = generateSampleIO(fargs$n, fargs$p, fargs$β, fargs$b, fargs$optargs$link)
#'     fargs$X = io$X
#'     fargs$Y = io$Y
#'     fargs$optargs$K = ncol(fargs$β)
#'     fargs$optargs$M = computeMoments(io$X,io$Y)
#'     fargs
#'   }, N=10, ncores=3)
#' for (i in 1:2)
#'   res[[i]] <- alignMatrices(res[[i]], ref=β, ls_mode="exact")}
#' @export
multiRun <- function(fargs, estimParams,
	prepareArgs = function(x) x, N=10, ncores=3, agg=lapply, verbose=FALSE)
{
	if (!is.list(fargs))
		stop("fargs: list")
	# No checks on fargs: supposedly done in estimParams[[i]]()
	if (!is.list(estimParams))
		estimParams = list(estimParams)
	# Verify that the provided parameters estimations are indeed functions
	lapply(seq_along(estimParams), function(i) {
		if (!is.function(estimParams[[i]]))
			stop("estimParams: list of function(fargs)")
	})
	if (!is.numeric(N) || N < 1)
		stop("N: positive integer")

	estimParamAtIndex <- function(index)
	{
		fargs <- prepareArgs(fargs)
		if (verbose)
			cat("Run ",index,"\n")
		lapply(seq_along(estimParams), function(i) {
			if (verbose)
				cat("   Method ",i,"\n")
			out <- estimParams[[i]](fargs)
			if (is.list(out))
				do.call(rbind, out)
			else
				out
		})
	}

	if (ncores > 1)
	{
		cl = parallel::makeCluster(ncores, outfile="")
		parallel::clusterExport(cl, c("fargs","verbose"), environment())
		list_res = parallel::clusterApplyLB(cl, 1:N, estimParamAtIndex)
		parallel::stopCluster(cl)
	}
	else
		list_res = lapply(1:N, estimParamAtIndex)

	# De-interlace results: output one list per function
	nf <- length(estimParams)
	lapply( seq_len(nf), function(i) lapply(seq_len(N), function(j) list_res[[j]][[i]]) )
}
Commit	Line	Data
cbd88fe5 BA	1	#' multiRun
	2	#'
	3	#' Estimate N times some parameters, outputs of some list of functions. This method is
	4	#' thus very generic, allowing typically bootstrap or Monte-Carlo estimations of matrices
	5	#' μ or β. Passing a list of functions opens the possibility to compare them on a fair
	6	#' basis (exact same inputs). It's even possible to compare methods on some deterministic
	7	#' design of experiments.
	8	#'
	9	#' @param fargs List of arguments for the estimation functions
	10	#' @param estimParams List of nf function(s) to apply on fargs - shared signature
	11	#' @param prepareArgs Prepare arguments for the functions inside estimParams
	12	#' @param N Number of runs
	13	#' @param ncores Number of cores for parallel runs (<=1: sequential)
	14	#' @param verbose TRUE to indicate runs + methods numbers
	15	#'
	16	#' @return A list of nf aggregates of N results (matrices).
	17	#'
	18	#' @examples
	19	#' \dontrun{
	20	#' β <- matrix(c(1,-2,3,1),ncol=2)
	21	#'
	22	#' # Bootstrap + computeMu, morpheus VS flexmix ; assumes fargs first 3 elts X,Y,K
	23	#' io <- generateSampleIO(n=1000, p=1/2, β=β, b=c(0,0), "logit")
	24	#' μ <- normalize(β)
	25	#' res <- multiRun(list(X=io$X,Y=io$Y,optargs=list(K=2,jd_nvects=0)), list(
	26	#' # morpheus
	27	#' function(fargs) {
	28	#' library(morpheus)
	29	#' ind <- fargs$ind
	30	#' computeMu(fargs$X[ind,],fargs$Y[ind],fargs$optargs)
	31	#' },
	32	#' # flexmix
	33	#' function(fargs) {
	34	#' library(flexmix)
	35	#' ind <- fargs$ind
	36	#' K <- fargs$optargs$K
	37	#' dat = as.data.frame( cbind(fargs$Y[ind],fargs$X[ind,]) )
	38	#' out = refit( flexmix( cbind(V1, 1 - V1) ~ 0+., data=dat, k=K,
	39	#' model=FLXMRglm(family="binomial") ) )
	40	#' normalize( matrix(out@@coef[1:(ncol(fargs$X)*K)], ncol=K) )
	41	#' } ),
	42	#' prepareArgs = function(fargs) {
	43	#' fargs$ind <- sample(1:nrow(fargs$X),replace=TRUE)
	44	#' fargs
	45	#' }, N=10, ncores=3)
	46	#' for (i in 1:2)
	47	#' res[[i]] <- alignMatrices(res[[i]], ref=μ, ls_mode="exact")
	48	#'
	49	#' # Monte-Carlo + optimParams from X,Y, morpheus VS flexmix ; first args n,p,β,b
	50	#' res <- multiRun(list(n=1000,p=1/2,β=β,b=c(0,0),optargs=list(link="logit")),list(
	51	#' # morpheus
	52	#' function(fargs) {
	53	#' library(morpheus)
	54	#' K <- fargs$optargs$K
	55	#' μ <- computeMu(fargs$X, fargs$Y, fargs$optargs)
	56	#' V <- list( p=rep(1/K,K-1), β=μ, b=c(0,0) )
	57	#' optimParams(V,fargs$optargs)$β
	58	#' },
	59	#' # flexmix
	60	#' function(fargs) {
	61	#' library(flexmix)
	62	#' K <- fargs$optargs$K
	63	#' dat <- as.data.frame( cbind(fargs$Y,fargs$X) )
	64	#' out <- refit( flexmix( cbind(V1, 1 - V1) ~ 0+., data=dat, k=K,
65	#' model=FLXMRglm(family="binomial") ) )
66	#' sapply( seq_len(K), function(i) as.double( out@@components[[1]][[i]][,1] ) )
67	#' } ),
68	#' prepareArgs = function(fargs) {
69	#' library(morpheus)
70	#' io = generateSampleIO(fargs$n, fargs$p, fargs$β, fargs$b, fargs$optargs$link)
71	#' fargs$X = io$X
72	#' fargs$Y = io$Y
73	#' fargs$optargs$K = ncol(fargs$β)
74	#' fargs$optargs$M = computeMoments(io$X,io$Y)
75	#' fargs
76	#' }, N=10, ncores=3)
77	#' for (i in 1:2)
78	#' res[[i]] <- alignMatrices(res[[i]], ref=β, ls_mode="exact")}
79	#' @export
80	multiRun <- function(fargs, estimParams,
81	prepareArgs = function(x) x, N=10, ncores=3, agg=lapply, verbose=FALSE)
82	{
83	if (!is.list(fargs))
84	stop("fargs: list")
85	# No checks on fargs: supposedly done in estimParams[[i]]()
86	if (!is.list(estimParams))
87	estimParams = list(estimParams)
88	# Verify that the provided parameters estimations are indeed functions
89	lapply(seq_along(estimParams), function(i) {
90	if (!is.function(estimParams[[i]]))
91	stop("estimParams: list of function(fargs)")
92	})
93	if (!is.numeric(N) \|\| N < 1)
94	stop("N: positive integer")
95
96	estimParamAtIndex <- function(index)
97	{
98	fargs <- prepareArgs(fargs)
99	if (verbose)
100	cat("Run ",index,"\n")
101	lapply(seq_along(estimParams), function(i) {
102	if (verbose)
103	cat(" Method ",i,"\n")
104	out <- estimParams[[i]](fargs)
105	if (is.list(out))
106	do.call(rbind, out)
107	else
108	out
109	})
110	}
111
112	if (ncores > 1)
113	{
114	cl = parallel::makeCluster(ncores, outfile="")
115	parallel::clusterExport(cl, c("fargs","verbose"), environment())
116	list_res = parallel::clusterApplyLB(cl, 1:N, estimParamAtIndex)
117	parallel::stopCluster(cl)
118	}
119	else
120	list_res = lapply(1:N, estimParamAtIndex)
121
122	# De-interlace results: output one list per function
123	nf <- length(estimParams)
124	lapply( seq_len(nf), function(i) lapply(seq_len(N), function(j) list_res[[j]][[i]]) )
125	}