X-Git-Url: https://git.auder.net/?p=morpheus.git;a=blobdiff_plain;f=pkg%2Fsrc%2Ffunctions.c;h=6444b8649875ef2022fb5151aa77207743c48740;hp=1c7295a4fcd192e2fc3a2011bafdd2c0d9aa9290;hb=9fdd3e5f57aa1fd0f839214d9cbfac022a8739a8;hpb=19d893c4554f7f2cc9a75111cec40712c698e7e2 diff --git a/pkg/src/functions.c b/pkg/src/functions.c index 1c7295a..6444b86 100644 --- a/pkg/src/functions.c +++ b/pkg/src/functions.c @@ -1,16 +1,11 @@ #include +#include // Index matrix (by columns) -int inline mi(int i, int j, int d1, int d2) -{ - return j*d1 + i; -} +#define mi(i, j, d1, d2) (j*d1 + i) // Index 3-tensor (by columns, matrices ordered by last dim) -int inline ti(int i, int j, int k, int d1, int d2, int d3) -{ - return k*d1*d2 + j*d1 + i; -} +#define ti(i, j, k, d1, d2, d3) (k*d1*d2 + j*d1 + i) // Empirical cross-moment of order 2 between X size nxd and Y size n void Moments_M2(double* X, double* Y, int* pn, int* pd, double* M2) @@ -56,9 +51,9 @@ void Moments_M3(double* X, double* Y, int* pn, int* pd, double* M3) // W = 1/N sum( t(g(Zi,theta)) g(Zi,theta) ) // with g(Zi, theta) = i-th contribution to all moments (size dim) - real moments -void Compute_Omega(double* X, int* Y, double* M, int* pn, int* pd, double* W) +void Compute_Omega(double* X, int* Y, double* M, int* pnc, int* pn, int* pd, double* W) { - int n=*pn, d=*pd; + int nc=*pnc, n=*pn, d=*pd; int dim = d + d*d + d*d*d; //double* W = (double*)malloc(dim*dim*sizeof(double)); @@ -69,6 +64,8 @@ void Compute_Omega(double* X, int* Y, double* M, int* pn, int* pd, double* W) W[j*dim+k] = 0.0; } double* g = (double*)malloc(dim*sizeof(double)); + omp_set_num_threads(nc >= 1 ? nc : omp_get_num_procs()); + #pragma omp parallel for for (int i=0; i=0; k--) + W[baseIdx+k] += gj * g[k]; } } + // Normalize W: x 1/n + for (int j=0; j j + for (int j=0; j