JSOC_Documentation: proj/mag/pfss/apps/glbhs4gh.c Source File

00001 /*
00002  * Name:        glbhs4gh.c
00003  *
00004  * Description:     Special-case (simplified) versions of the core routines in jhelio2mlat.c and jqdotprod.c
00005  *
00006  * Function List:
00007  *          void helio2mlat(float *map, float *map_mlat, 
00008  *              int map_cols, int map_rows, int lmax, int map_lmax)
00009  *          void qdotprod(float *map_mlat, float *out_coeff, 
00010  *              int map_rows, int lmin, int lmax, float sinBdelta)
00011  *
00012  * Called by:       jsynop2gh.c
00013  *
00014  * Written by:      Xudong Sun (xudongs@stanford.edu)
00015  *
00016  * Version:
00017  *          v1.0        Jul 25 2009
00018  *          v1.0a       Aug 06 2009
00019  *
00020  * Issues:
00021  *          v1.0a
00022  *          Added prototypes for Fortran functions (scopy, setplm, sgemm)
00023  *          
00024  */
00025 
#include <math.h>
#include <stdio.h>
#include <stdlib.h>

#include <fftw3.h>
#include "astro.h"
00028 
00029 
/*
 * Small arithmetic helper macros.
 *
 * All of them may evaluate their arguments more than once, so do not pass
 * expressions with side effects (e.g. absval(i++)).
 *
 * is_even() / is_odd() always yield exactly 0 or 1, also for negative
 * arguments, so the result can safely be used in index arithmetic.
 */
#define absval(x)       (((x) < 0) ? (-(x)) : (x))
#define minval(x,y)     (((x) < (y)) ? (x) : (y))
#define maxval(x,y)     (((x) < (y)) ? (y) : (x))
#define very_small      (1.0e-30)
#define is_very_small(x)    (absval(x) < very_small)
#define is_even(x)      (((x) % 2) == 0)
#define is_odd(x)       (((x) % 2) != 0)
00037 
00038 
00039 /* Simplified version of jhelio2mlat.c
00040  * No apodizing, weighted to 1, no mean substraction,
00041  * no normalize, assuming no bad points.
00042  */
00043 
00044 void helio2mlat(float *map, float *map_mlat, int map_cols, int map_rows, int lmax, int map_lmax)
00045 {
00046     int i, row, col;
00047     int map_cols2 = map_cols / 2;
00048     int nout = (lmax + 1) * 2;
00049     int lfft, nfft, nok;
00050     double norm = 1.0, normx;
00051     float *buf, *wbuf, *bp;
00052     float *ip, *inp = map;
00053     float *op, *outp = map_mlat;
00054     fftwf_plan fftwp;
00055 
00056     lfft = 2 * map_lmax;
00057     nfft = lfft + 2;
00058 
00059     // Get working buffer
00060     buf = (float *)(malloc(nfft * sizeof(float)));
00061     wbuf = (float *)(malloc(nfft * sizeof(float)));
00062     fftwp = fftwf_plan_r2r_1d(lfft, buf, wbuf, FFTW_R2HC, FFTW_ESTIMATE);
00063 
00064     // Do it
00065     for (row = 0; row < map_rows; row++) {
00066         // 0 at central meridian
00067         // First copy right side of meridian
00068         bp = buf;
00069         ip = inp + map_cols * row + map_cols2;
00070         for (col = 0; col <= map_cols2; col++) {
00071             if (!isnan(*ip)) {
00072                 *bp++ = *ip;    // weight 1
00073             } else
00074                 *bp++ = 0.0;
00075             ip++;
00076         }
00077         // Then do left side of meridian
00078         bp = buf + lfft - map_cols2;
00079         ip = inp + map_cols * row;
00080         for (col = 0; col < map_cols2; col++) {
00081             if (!isnan(*ip)) {
00082                 *bp++ = *ip;
00083             } else
00084                 *bp++ = 0.0;
00085             ip++;
00086         }
00087 
00088         // For missing (no zero_miss or normalize)
00089         norm = 1. / lfft;
00090 
00091         // Fourier transform
00092         fftwf_execute(fftwp);
00093 
00094         // Transpose, normalize
00095         // Real part
00096         for (int i = 0; i < nout / 2; i++) {
00097             op = outp + 2 * i * map_rows + row;
00098             *op = wbuf[i] * norm;
00099         }
00100         // Imaginary part, m = 0 is 0
00101         *(outp + map_rows + row) = 0.0;
00102         // Use normx to get complex conjugate
00103         normx = -norm;
00104         for (int i = 0; i < nout / 2; i++) {
00105             op = outp + (2 * i + 1) * map_rows + row;
00106             *op = wbuf[lfft - i] * normx;
00107         }          
00108     } // End of row
00109 }
00110 
00111 
00112 
00113 
00114 
00115 
00116 
/*
 * Prototypes of the Fortran routines called from qdotprod().
 *
 * Fortran passes every argument by reference, hence the pointer
 * parameters.  The two trailing by-value ints of sgemm_ are the hidden
 * lengths of its two character-string arguments.
 */

/* Copy `count` floats from `src` (stride *src_stride) to `dst` (stride *dst_stride). */
extern void scopy_(int *count, float *src, const int *src_stride,
        float *dst, const int *dst_stride);

/* Set up the plm's used as masks in qdotprod() for order *order. */
extern int setplm_(int *l_first, int *l_last, int *order, int *n_x, int *index,
        double *x_grid, int *n_plm, double *plm_out);

/* Single-precision matrix multiply: C = alpha * op(A) * op(B) + beta * C. */
extern void sgemm_(const char *op_a, const char *op_b,
        int *rows_c, int *cols_c, int *inner, float *alpha_scale,
        const float *mat_a, int *ld_a, float *mat_b, int *ld_b,
        float *beta_scale, void *mat_c, int *ld_c, int op_a_len, int op_b_len);
00126 
00127 
00128 
/*
 * Allocate a zero-initialised work array of `count` elements for qdotprod().
 * A count of 0 still yields a valid pointer.  Prints a message to stderr
 * and aborts if the request is negative or cannot be satisfied.
 */
static void *qdotprod_alloc(long count, size_t elem_size)
{
    void *p = NULL;

    if (count >= 0)
        p = calloc(count > 0 ? (size_t)count : 1, elem_size);
    if (p == NULL) {
        fprintf(stderr, "qdotprod: cannot allocate work arrays\n");
        abort();
    }
    return p;
}

/*
 * qdotprod -- simplified version of the working part of jqdotprod.c.
 *
 * No bad images, a single point in the time series (timechunk is 1) and a
 * single chunk of l's covering 0..lmax.
 *
 * For every order m the Fourier-transformed map is folded about the middle
 * row into parts that are even and odd in latitude, and those are
 * multiplied (sgemm_) with the plm's returned by setplm_ to give one
 * complex coefficient per (l, m).
 *
 * Parameters:
 *   map_mlat   input, 2 * (lmax + 1) blocks of map_rows floats; block 2*m
 *              is the real and block 2*m + 1 the imaginary part for order m
 *              (the layout written by helio2mlat)
 *   out_coeff  output, (lmax + 1) * (lmax + 2) floats; the coefficient for
 *              (l, m) is stored as real, imaginary at index
 *              2 * (l * (l + 1) / 2 + m)
 *   map_rows   number of latitude rows; expected to be even, the rows
 *              are split into two halves of map_rows / 2 each
 *   lmin       accepted for interface compatibility only; not used, the
 *              l range always starts at 0
 *   lmax       highest degree l (and order m) computed
 *   sinBdelta  grid step: the grid handed to setplm_ is
 *              (i + 0.5) * sinBdelta, and it also scales the result
 *              (presumably the step in sine latitude -- confirm with caller)
 *
 * The function has no error channel: if a work array cannot be allocated
 * it prints a message to stderr and aborts.
 */
void qdotprod(float *map_mlat, float *out_coeff, int map_rows, int lmin, int lmax, float sinBdelta)
{
    (void)lmin;     /* see header comment: the l range always starts at 0 */

    if (lmax < 0)
        return;     /* no (l, m) pairs to compute */

    int nsn = 1;                    /* single point time series */
    int fournsn = 4 * nsn;
    int lmax1 = lmax + 1;
    int llast = lmax;
    int nlat = map_rows / 2;
    int two_nlat = 2 * nlat;        /* length of one folded (even + odd) block */

    /* SGI's like odd leading dimensions of the first array in sgemm */
    int nlatx = 2 * (nlat / 2) + 1;
    /* make nlatx divisible by 4 on linux systems */
#ifdef __linux__
    nlatx = (nlat % 4) ? 4 * (nlat / 4 + 1) : nlat;
#endif

    /* for scopy calls */
    const int increment1 = 1, increment2 = 2;

    /* arguments for sgemm calls */
    char transpose[] = "t";
    char normal[] = "n";
    float zero = 0.0f;
    /* Constant to get proper normalization (norm = 1) */
    float cnorm = sqrt(2.) * sinBdelta;

    int l, m, mx, latx;

    /* Folded input for one m: real/imag part, for even/odd l */
    float *real4evenl = qdotprod_alloc((long)nlatx * nsn, sizeof *real4evenl);
    float *real4oddl  = qdotprod_alloc((long)nlatx * nsn, sizeof *real4oddl);
    float *imag4evenl = qdotprod_alloc((long)nlatx * nsn, sizeof *imag4evenl);
    float *imag4oddl  = qdotprod_alloc((long)nlatx * nsn, sizeof *imag4oddl);
    /* sgemm output for one m: real, imag for each l */
    float *outx = qdotprod_alloc((long)nsn * 2 * lmax1, sizeof *outx);
    /* plm's in double precision and their single-precision copy */
    double *plm = qdotprod_alloc((long)lmax1 * nlat, sizeof *plm);
    float *masks = qdotprod_alloc((long)nlat * lmax1, sizeof *masks);
    double *latgrid = qdotprod_alloc(nlat, sizeof *latgrid);
    int *indx = qdotprod_alloc(lmax1, sizeof *indx);
    /* Folded map: for every input block, nlat even values then nlat odd values */
    float *folded = qdotprod_alloc((long)4 * nlat * lmax1 * nsn, sizeof *folded);
    float *oddpart = qdotprod_alloc(nlat, sizeof *oddpart);
    float *evenpart = qdotprod_alloc(nlat, sizeof *evenpart);

    for (latx = 0; latx < nlat; latx++)
        latgrid[latx] = (latx + 0.5) * sinBdelta;
    for (l = 0; l <= lmax; l++)
        indx[l] = l;

    /* Fold every input block (each m, re and im) about the middle row.
     * The folded blocks are packed with a stride of 2 * nlat, which is the
     * layout the scopy_ calls in the m loop read back. */
    for (mx = 0; mx < 2 * lmax1; mx++) {
        const float *mptr = map_mlat + mx * map_rows;
        float *workptr = folded + mx * two_nlat;

        for (latx = 0; latx < nlat; latx++) {
            const int poslatx = nlat + latx;
            const int neglatx = nlat - 1 - latx;
            evenpart[latx] = mptr[poslatx] + mptr[neglatx];
            oddpart[latx] = mptr[poslatx] - mptr[neglatx];
        }
        scopy_(&nlat, evenpart, &increment1, workptr, &increment1);
        scopy_(&nlat, oddpart, &increment1, workptr + nlat, &increment1);
    }

    /* loop on each m */
    for (m = 0; m <= llast; m++) {
        int modd = m % 2;
        int meven = !modd;
        /* No l can be smaller than m; the single l chunk starts at 0, so
         * the first l for this m is m itself. */
        int lstart = m;
        int lfirsteven, llasteven, nevenl;
        int lfirstodd, llastodd, noddl;
        int ilatx, nmask;
        const double *plmptr;

        /* Set up plm's for l = lstart..llast and this m.  Because
         * lstart == m there are never plm's from a previous chunk to
         * carry over, so they are always computed from scratch. */
        setplm_(&lstart, &llast, &m, &nlat, indx, latgrid, &nlat, plm);

        /* copy plm's into masks;
         * note that this converts from double to single precision */
        plmptr = plm + nlat * lstart;
        nmask = nlat * (llast - lstart + 1);
        for (ilatx = 0; ilatx < nmask; ilatx++)
            masks[ilatx] = plmptr[ilatx];

        /* Select folded data for real/imag l's and this m into temporary
         * arrays for the matrix multiply.  Even l's use the part whose
         * latitude parity matches m, odd l's the other part. */
        scopy_(&nlat, folded + nlat * (4 * m + modd), &increment1,
               real4evenl, &increment1);
        scopy_(&nlat, folded + nlat * (4 * m + meven), &increment1,
               real4oddl, &increment1);
        scopy_(&nlat, folded + nlat * (4 * m + 2 + modd), &increment1,
               imag4evenl, &increment1);
        scopy_(&nlat, folded + nlat * (4 * m + 2 + meven), &increment1,
               imag4oddl, &increment1);

        /*
         * In every sgemm_ call below:
         *   A   = folded data (nlat values, leading dimension nlatx),
         *         used transposed and scaled by cnorm
         *   B   = masks, leading dimension 2 * nlat so that only every
         *         other l (same parity) is used
         *   C   = outx, leading dimension 4 * nsn so that results land on
         *         every other (real, imag) pair
         * A count of 0 l's is possible for the last m and is a no-op.
         */

        /* do even l's */
        lfirsteven = (lstart % 2 == 0) ? lstart : lstart + 1;
        llasteven = (llast % 2 == 0) ? llast : llast - 1;
        nevenl = (llasteven - lfirsteven) / 2 + 1;  /* number of even l's */
        /* real part */
        sgemm_(transpose, normal, &nsn, &nevenl, &nlat, &cnorm,
               real4evenl, &nlatx,
               masks + nlat * (lfirsteven - lstart), &two_nlat,
               &zero,
               outx + nsn * 2 * (lfirsteven - lstart), &fournsn,
               1, 1);
        /* imag part */
        sgemm_(transpose, normal, &nsn, &nevenl, &nlat, &cnorm,
               imag4evenl, &nlatx,
               masks + nlat * (lfirsteven - lstart), &two_nlat,
               &zero,
               outx + nsn * (2 * (lfirsteven - lstart) + 1), &fournsn,
               1, 1);

        /* do odd l's */
        lfirstodd = (lstart % 2 != 0) ? lstart : lstart + 1;
        llastodd = (llast % 2 != 0) ? llast : llast - 1;
        noddl = (llastodd - lfirstodd) / 2 + 1;     /* number of odd l's */
        /* real part */
        sgemm_(transpose, normal, &nsn, &noddl, &nlat, &cnorm,
               real4oddl, &nlatx,
               masks + nlat * (lfirstodd - lstart), &two_nlat,
               &zero,
               outx + nsn * 2 * (lfirstodd - lstart), &fournsn,
               1, 1);
        /* imag part */
        sgemm_(transpose, normal, &nsn, &noddl, &nlat, &cnorm,
               imag4oddl, &nlatx,
               masks + nlat * (lfirstodd - lstart), &two_nlat,
               &zero,
               outx + nsn * (2 * (lfirstodd - lstart) + 1), &fournsn,
               1, 1);

        /* copy outx into the output,
         * alternating real and imaginary values - as in pipeLNU */
        for (l = lstart; l <= llast; l++) {
            const int fromoffset = 2 * nsn * (l - lstart);
            const int tooffset = 2 * nsn * (l * (l + 1) / 2 + m);

            scopy_(&nsn, outx + fromoffset, &increment1,
                   out_coeff + tooffset, &increment2);
            scopy_(&nsn, outx + fromoffset + nsn, &increment1,
                   out_coeff + tooffset + 1, &increment2);
        } /* end loop through l's for this m */
    } /* end loop on m */

    free(evenpart);
    free(oddpart);
    free(folded);
    free(indx);
    free(latgrid);
    free(masks);
    free(plm);
    free(outx);
    free(imag4oddl);
    free(imag4evenl);
    free(real4oddl);
    free(real4evenl);
}