X-Git-Url: https://git.auder.net/js/app_dev.php?a=blobdiff_plain;f=epclust%2FR%2Fstage2.R;h=3ccbbad10903b256c005b0476b418bf3bbfdd9a3;hb=db6fc17ddd53fb0c64cf957296dc615ba830db56;hp=ebb44d9ae0624a9d518df7d65ee0246f38f520a2;hpb=d03c0621a8f298b19659ebc20a86099ba56d8ff7;p=epclust.git

diff --git a/epclust/R/stage2.R b/epclust/R/stage2.R
index ebb44d9..3ccbbad 100644
--- a/epclust/R/stage2.R
+++ b/epclust/R/stage2.R
@@ -1,170 +1,51 @@
-#point avec Jairo:
-#rentrer dans code C cwt continue Rwave
-#passer partie sowas Ã  C
-#fct qui pour deux series (ID, medoides) renvoie distance WER (Rwave ou Ã  moi)
-#transformee croisee , smoothing lissage 3 composantes , + calcul pour WER
-#attention : code fait pour des series temps desynchronisees ! (deltat, dt == 1,2 ...)
-#determiner nvoice noctave (entre octave + petit et + grand)
-
 library("Rwave")
 
 #EntrÃ©e : courbes synchrones, soit aprÃ¨s Ã©tape 1 itÃ©rÃ©e, soit aprÃ¨s chaqure Ã©tape 1
-#TODO: bout de code qui calcule les courbes synchrones aprÃ¨s Ã©tapes 1+2 Ã  partir des ID mÃ©doÃ¯des
-
-#toCWT: (aux)
-##NOTE: renvoie une matrice 3D
-toCWT  <- function(X, sw=  0,  tw=  0, swabs= 0, nvoice= 12, noctave= 5, s0= 2, w0= 2*pi,
-	lt= 24, dt= 0.5, spectra = FALSE, smooth = TRUE, scaled  = FALSE, scalevector)
-{
-	noctave  <- adjust.noctave(lt, dt, s0, tw, noctave)
-	if(missing(scalevector))
-		scalevector  <- 2^(0:(noctave * nvoice) / nvoice) * s0
-	res <- lapply(1:nrow(X), function(n) {
-		tsX <- ts( X[n,] )
-		tsCent <- tsX - mean(tsX)
-		if(scaled)
-			tsCent <- ts(scale(tsCent))
-		tsCent.cwt <- cwt.ts(tsCent, s0, noctave, nvoice, w0)
-		tsCent.cwt
-	})
-	if( spectra )
-		res <- lapply(res, function(l) Mod(l)^2 )
-	if( smooth  )
-		res <- lapply(res, smCWT, swabs = swabs, tw = tw, dt = dt, scalevector = scalevector)
-	resArray <- array(NA, c(nrow(res[[1]]), ncol(res[[1]]), length(res)))
-	for( l in 1:length(res) )
-		resArray[ , , l] <- res[[l]]
-	resArray
-}
-
-#from sowas
-cwt.ts <- function(ts,s0,noctave=5,nvoice=10,w0=2*pi)
-{
-	if (class(ts)!="ts")
-		stop("# This function needs a time series object as input. You may construct this by using the function ts(data,start,deltat). Try '?ts' for help.\n")
-
-	t=time(ts)
-	dt=t[2]-t[1]
-	s0unit=s0/dt*w0/(2*pi)
-	s0log=as.integer((log2(s0unit)-1)*nvoice+1.5)
-	if (s0log<1)
-	{
-		cat(paste("# s0unit = ",s0unit,"\n",sep=""))
-		cat(paste("# s0log  = ",s0log,"\n",sep=""))
-		cat("# s0 too small for w0! \n")
-	}
-	totnoct=noctave+as.integer(s0log/nvoice)+1
-
-	#cwt from package Rwave
-	totts.cwt=cwt(ts,totnoct,nvoice,w0,plot=0)
-	ts.cwt=totts.cwt[,s0log:(s0log+noctave*nvoice)]
-
-	#Normalization
-	sqs <- sqrt(2^(0:(noctave*nvoice)/nvoice)*s0)
-	smat <- matrix(rep(sqs,length(t)),nrow=length(t),byrow=TRUE)
-
-	ts.cwt*smat
-}
-
-#NOTE: vect2mat = as.matrix ?! (dans aux.R)
-vect2mat <- function(vect)
-{
-	vect <- as.vector(vect)
-	matrix(vect[-(1:2)], delta, lscvect)
-}
-
-#fonction smCWT (dans aux.R)
-smCWT <- function(CWT, sw=  0,  tw=  0, swabs= 0, nvoice= 12, noctave= 2, s0= 2, w0= 2*pi,
-	lt= 24, dt= 0.5, scalevector )
-{
-#noctave  <- adjust.noctave(lt, dt, s0, tw, noctave)
-#scalevector  <- 2^(0:(noctave * nvoice) / nvoice) * s0
-	wsp     <- Mod(CWT)
-	smwsp   <- smooth.matrix(wsp, swabs)
-	smsmwsp <- smooth.time(smwsp, tw, dt, scalevector)
-	smsmwsp
-}
-
-#dans sowas.R (...donc on ne lisse pas Ã  ce niveau ?)
-smooth.matrix <- function(wt,swabs)
-{
-	if (swabs != 0)
-	{
-		smwt <- t(filter(t(wt),rep(1,2*swabs+1)/(2*swabs+1)))
-	} else
-	{
-		smwt <- wt
-	}
-	smwt
-}
-
-smooth.time <- function(wt,tw,dt,scalevector)
-{
-	smwt <- wt
-	if (tw != 0)
-	{
-		for (i in 1:length(scalevector))
-		{
-			twi <- as.integer(scalevector[i]*tw/dt)
-			smwt[,i] <- filter(wt[,i],rep(1,2*twi+1)/(2*twi+1))
-		}
-	}
-	smwt
-}
-
 step2 = function(conso)
 {
-	#(Benjamin)
-	#Ã  partir de lÃ , "conso" == courbes synchrones
-	n     <- nrow(conso)
+	n <- nrow(conso)
 	delta <- ncol(conso)
-
-	#17000 colonnes coeff 1, puis 17000 coeff 2... [non : dans chaque tranche du cube]
-	# #NOTE: delta et lscvect pourraient etre gardÃ©s Ã  part (communs)
-
-	#TODO: automatic tune of these parameters ? (for other users)
+	#TODO: automatic tune of all these parameters ? (for other users)
 	nvoice   <- 4
-	# # noctave4 = 2^13 = 8192 half hours ~ 180 days
-	noctave4 <- adjust.noctave(N = delta, dt = 1, s0 = 2, tw = 0, noctave = 13)
-	# # 4 here represent 2^5 = 32 half-hours ~ 1 day
-	scalevector4  <- 2^(4:(noctave4 * nvoice) / nvoice) * 2
-	lscvect4      <- length(scalevector4)
-	lscvect <- lscvect4  # i should clean my code: werFam demands a lscvect
-
-	# observations node with CWT
-	Xcwt4   <- toCWT(conso, noctave = noctave4, dt = 1, scalevector = scalevector4, lt = delta,
-		smooth = FALSE, nvoice = nvoice)
-
-	#matrix:
-	############Xcwt2 <- matrix(0.0, nrow= n, ncol= 2 + delta * lscvect)
-	Xcwt2 <- matrix(NA_complex_, nrow= n, ncol= 2 + length((c(Xcwt4[,,1]))))
-
-	#NOTE: delta et lscvect pourraient etre gardÃ©s Ã  part (communs)
-	for(i in 1:n)
-		Xcwt2[i,] <- c(delta, lscvect, Xcwt4[,,i] / max(Mod(Xcwt4[,,i])) )
-	#rm(conso, Xcwt4); gc()
+	# noctave = 2^13 = 8192 half hours ~ 180 days ; ~log2(ncol(conso))
+	noctave = 13
+	# 4 here represent 2^5 = 32 half-hours ~ 1 day
+	#NOTE: default scalevector == 2^(0:(noctave * nvoice) / nvoice) * s0 (?)
+	scalevector  <- 2^(4:(noctave * nvoice) / nvoice) * 2
+	#condition: ( log2(s0*w0/(2*pi)) - 1 ) * nvoice + 1.5 >= 1
+	s0=2
+	w0=2*pi
+	scaled=FALSE
+	s0log = as.integer( (log2( s0*w0/(2*pi) ) - 1) * nvoice + 1.5 )
+	totnoct = noctave + as.integer(s0log/nvoice) + 1
+
+	# (normalized) observations node with CWT
+	Xcwt4 <- lapply(seq_len(n), function(i) {
+		ts <- scale(ts(conso[i,]), center=TRUE, scale=scaled)
+		totts.cwt = Rwave::cwt(ts,totnoct,nvoice,w0,plot=0)
+		ts.cwt = totts.cwt[,s0log:(s0log+noctave*nvoice)]
+		#Normalization
+		sqs <- sqrt(2^(0:(noctave*nvoice)/nvoice)*s0)
+		sqres <- sweep(ts.cwt,MARGIN=2,sqs,'*')
+		sqres / max(Mod(sqres))
+	})
 
-	## _.b WER^2 distances  ########
-	Xwer_dist    <- matrix(0.0, n, n)
-	for(i in 1:(n - 1))
+	Xwer_dist <- matrix(0., n, n)
+	fcoefs = rep(1/3, 3) #moving average on 3 values (TODO: very slow! correct?!)
+	for (i in 1:(n-1))
 	{
-		mat1   <- vect2mat(Xcwt2[i,])
-
-	for(j in (i + 1):n)
+		for (j in (i+1):n)
 		{
-			mat2 <- vect2mat(Xcwt2[j,])
-			num     <- Mod(mat1 * Conj(mat2))
-			WX      <- Mod(mat1 * Conj(mat1))
-			WY      <- Mod(mat2 * Conj(mat2))
-			smsmnum <- smCWT(num, scalevector = scalevector4)
-			smsmWX  <- smCWT(WX,  scalevector = scalevector4)
-			smsmWY  <- smCWT(WY,  scalevector = scalevector4)
-			wer2    <- sum(colSums(smsmnum)^2)  /
-			sum( sum(colSums(smsmWX) * colSums(smsmWY)) )
-			Xwer_dist[i, j] <- sqrt(delta * lscvect * (1 - wer2))
-			Xwer_dist[j, i] <- Xwer_dist[i, j]
+			#TODO: later, compute CWT here (because not enough storage space for 32M series)
+			#      'circular=TRUE' is wrong, should just take values on the sides; to rewrite in C
+			num <- filter(Mod(Xcwt4[[i]] * Conj(Xcwt4[[j]])), fcoefs, circular=TRUE)
+			WX <- filter(Mod(Xcwt4[[i]] * Conj(Xcwt4[[i]])), fcoefs, circular=TRUE)
+			WY <- filter(Mod(Xcwt4[[j]] * Conj(Xcwt4[[j]])), fcoefs, circular=TRUE)
+			wer2    <- sum(colSums(num)^2) / sum( sum(colSums(WX) * colSums(WY)) )
+			Xwer_dist[i,j] <- sqrt(delta * ncol(Xcwt4[[1]]) * (1 - wer2))
+			Xwer_dist[j,i] <- Xwer_dist[i,j]
 		}
 	}
 	diag(Xwer_dist) <- numeric(n)
-	Wwer_dist
+	Xwer_dist
 }