EVSL/Doc_html/ratfilter_8c_source.html

 #include <stdio.h>

 #include <stdlib.h>

 #include <string.h>

 #include <complex.h>

 #include <math.h>

 #include "def.h"

 #include "blaslapack.h"

 #include "struct.h"

 #include "internal_proto.h"


 /**
  * @brief Compute the locations of the poles.
  *
  * Every pole is written as cexp(I*theta), i.e. a point on the unit circle.
  *
  * @param[in]  method  0: theta_i = pi/2*(1 - D[i]), where D holds the
  *                     eigenvalues returned by DSTEV for the symmetric
  *                     tridiagonal matrix with zero diagonal and off-diagonal
  *                     entries 0.5/sqrt(1 - (2(i+1))^-2)
  *                     (presumably the Gauss-Legendre nodes -- TODO confirm);
  *                     1: theta_i = pi*(2(i+1)-1)/(2n) (mid-point rule).
  *                     Any other value leaves zk untouched.
  * @param[in]  n       number of poles; nothing is done when n <= 0
  * @param[out] zk      array of length n receiving the poles
  */
 void contQuad(int method, int n, complex double* zk) {
   int i, m, INFO;
   double *beta, *D, *Z, *WORK;
   char JOBZ = 'V';
   complex double tmp2;

   /* No poles requested: avoid zero/negative sized allocations below. */
   if (n <= 0) {
     return;
   }

   if (method == 0) {
     int nbeta, lwork;
     m = n-1;
     /* Keep every buffer at least one element long: DSTEV documents WORK
        as having dimension max(1, 2*N-2), and a zero-sized request is not
        guaranteed to yield a usable pointer. */
     nbeta = (m > 0) ? m : 1;
     lwork = (2*n-2 > 1) ? 2*n-2 : 1;
     Malloc(D, n, double);
     Malloc(Z, n*n, double);
     Malloc(WORK, lwork, double);
     Malloc(beta, nbeta, double);
     /* zero diagonal */
     for (i=0; i<n; i++) {
       D[i] = 0.0;
     }
     /* off-diagonal entries */
     for (i=0; i<m; i++) {
       beta[i] = 0.5/(sqrt(1-pow(2*(i+1),-2)));
     }
     /* on exit D holds the eigenvalues */
     DSTEV(&JOBZ, &n, D, beta, Z, &n, WORK, &INFO);
     if (INFO != 0) {
       /* best effort: report the failure instead of silently using D */
       fprintf(stdout, " warning [%s (%d)]: DSTEV returned INFO = %d\n",
               __FILE__, __LINE__, INFO);
     }
     for (i=0; i<n; i++) {
       tmp2 = I*M_PI/2.0*(1.0-D[i]);
       zk[i] = cexp(tmp2);
     }
     free(beta);
     free(D);
     free(Z);
     free(WORK);
   } else if (method == 1) {
     for (i=0; i<n; i++) {
       tmp2 = M_PI*I*(2*(i+1)-1)/(2.0*n);
       zk[i] = cexp(tmp2);
     }
   }
 }


 /**
  * @brief Compute the function value of the multiple pole rational filter
  *        at real locations.
  *
  * For every point z[p] the value is
  *   xx[p] = 2 * Re( sum_j sum_{i=1..mulp[j]} c_{j,i} / (z[p]-zk[j])^i ),
  * where the coefficients c_{j,i} are stored contiguously in alp, pole
  * after pole.
  *
  * @param[in]  n     number of poles
  * @param[in]  mulp  multiplicity of each pole (length n)
  * @param[in]  zk    pole locations (length n)
  * @param[in]  alp   coefficients, sum(mulp) entries
  * @param[in]  m     number of evaluation points
  * @param[in]  z     evaluation points (length m)
  * @param[out] xx    filter values (length m)
  */
 void ratf2p2(int n, int *mulp, complex double *zk, complex double* alp, int m,
              double *z, double *xx) {
   int pt, pole, deg, base;
   complex double total, inv, horner;

   for (pt = 0; pt < m; pt++) {
     total = 0.0 + 0.0*I;
     base = 0;   /* offset of the current pole's coefficients in alp */
     for (pole = 0; pole < n; pole++) {
       inv = 1.0 / (z[pt]-zk[pole]);
       horner = 0.0+0.0*I;
       /* Horner scheme in inv, from the highest power down to the first */
       for (deg = mulp[pole]; deg-- > 0; ) {
         horner = inv*(alp[base+deg]+horner);
       }
       total = total+horner;
       base += mulp[pole];
     }
     xx[pt] = 2.0*creal(total);
   }
 }


 void pfe2(complex double s1, complex double s2, int k1, int k2,

           complex double* alp, complex double* bet) {

   int i;

   complex double d, xp;

   if (cabs(s1-s2) < 1.0e-12 * (cabs(s1)+cabs(s2))) {

     for (i=0; i<k1+k2; i++) {

       alp[i] = 0.0;

     }

     alp[k1+k2-1] = 1;

   } else if ((k1 == 1) && (k2 == 1)) {

     d = s1-s2;

     alp[k1-1] = 1.0 / d;

     bet[k1-1] = -alp[k1-1];

   } else {

     d = 1.0 + 0.0*I;

     xp = 1.0 / cpow((s1-s2),k2);

     for (i=0; i<k1; i++) {

       alp[k1-i-1] = d * xp;

       xp = xp / (s1-s2);

       d = -d * (k2+i) / (i+1.0);

     }

     d = 1.0 + 0.0*I;

     xp = 1.0 / cpow((s2-s1),k1);

     for (i=0; i<k2; i++) {

       bet[k2-i-1] = d * xp;

       xp = xp / (s2-s1);

       d = -d * (k1+i) / (i+1.0);

     }

   }

 }


 complex double integg2(complex double s1, complex double s2,

                        complex double* alp, int k1, complex double* bet,

                        int k2, double a, double b) {

   complex double t, t1, t0, scal;

   int k;

   t = 0.0 + 0.0*I;

   t1 = 0.0 + 0.0*I;

   t0 = 0.0 +0.0*I;

   for (k=0; k<k1; k++) {

     scal = alp[k];

     if (k==0) {

       t0 = scal*clog((b-s1)/(a-s1));

     } else {

       t = t - (scal*1.0/k) * (1.0/cpow((b-s1),k)-1.0/cpow((a-s1),k));

     }

   }

   for (k=0; k<k2; k++) {

     scal = bet[k];

     if (k==0) {

       t1 = scal*clog((b-s2)/(a-s2));

     } else {

       t = t - (scal*1.0/k)*(1.0/cpow((b-s2),k)-1.0/cpow((a-s2),k));

     }

   }

   t = t + (t0+t1);

   return t;

 }


 /* One matrix entry: the integral of 1/[(z-sa)^(i+1) (z-sb)^(j+1)] over
    [-mu, mu] plus (lambda-1) times the same integral over [-1, 1].
    alp and bet are caller-provided scratch buffers holding at least i+j+2
    and j+1 entries respectively. */
 static complex double weights_entry(complex double sa, complex double sb,
                                     int i, int j, double lambda, double mu,
                                     complex double *alp, complex double *bet) {
   int k1, k2;
   complex double t;
   if (cabs(sa-sb) < 1.0e-12*(cabs(sa)+cabs(sb))) {
     /* coincident poles merge into a single pole of order i+j+2 */
     k1 = i+1+j+1;
     k2 = 0;
   } else {
     k1 = i+1;
     k2 = j+1;
   }
   pfe2(sa, sb, k1, k2, alp, bet);
   t = integg2(sa, sb, alp, k1, bet, k2, -mu, mu);
   t += (lambda-1)*integg2(sa, sb, alp, k1, bet, k2, -1.0, 1.0);
   return t;
 }

 /**
  * @brief Compute the LS weight for each multiple pole.
  *
  * Assembles the blocks A (pole against conjugated pole) and B (pole against
  * pole), solves the 2*nf x 2*nf system [conj(A), conj(B); B, A] y = rhs with
  * ZGESV (nf = sum of mulp) and returns the first nf entries of y, rescaled so
  * that the filter evaluated by ratf2p2 at 1.0 equals 0.5.
  *
  * @param[in]  n       number of poles
  * @param[in]  zk      pole locations (length n)
  * @param[in]  mulp    multiplicity of each pole (length n)
  * @param[in]  lambda  weight of the [-1, 1] part; a value below 1e-12 in
  *                     magnitude is replaced by 1e-5
  * @param[out] omega   resulting weights (sum(mulp) entries)
  */
 void weights(int n, complex double* zk, int* mulp, double lambda,
              complex double* omega) {
   int INFO;
   int nrhs = 1;
   int *ipiv;
   int m;
   double mu = 10.0;
   int i, j, ii, jj, ki, kj, n1, n2, nf=0, maxmul=1;
   complex double s1, s2, s1c, s2c;
   complex double *rhs, *A, *B, *mat, *alp, *bet;
   double scaling;

   for (i=0; i<n; i++) {
     nf += mulp[i];
     if (mulp[i] > maxmul) {
       maxmul = mulp[i];
     }
   }
   m = 2*nf;
   Malloc(ipiv, m, int);
   Malloc(rhs, m, complex double);
   Malloc(A, nf*nf, complex double);
   Malloc(B, nf*nf, complex double);
   Malloc(mat, 4*nf*nf, complex double);
   /* Scratch for the partial fraction coefficients, sized once for the
      largest case (i+j+2 <= 2*maxmul, j+1 <= maxmul) rather than being
      reallocated for every matrix entry. */
   Malloc(alp, 2*maxmul, complex double);
   Malloc(bet, maxmul, complex double);

   for(i=0; i<nf; i++) {
     for(j=0; j<nf; j++) {
       A[i*nf+j] = 0.0 + 0.0*I;
       B[i*nf+j] = 0.0 + 0.0*I;
     }
   }
   if (fabs(lambda) < 1.0e-12) {
     lambda = 1.0e-5;
   }

   ki = 0;
   for (ii=0; ii<n; ii++) {
     s1 = zk[ii];
     n1 = mulp[ii];
     s1c = conj(s1);
     /* right-hand side: lambda times the integral over [-1, 1] of
        1/(z-conj(s1))^(i+1) */
     for (i=0; i<n1; i++) {
       if (i==0) {
         rhs[ki+i] = lambda*clog((s1c-1.0)/(s1c+1.0));
       } else {
         rhs[ki+i] = -lambda*(1.0/(i))*(1/cpow((1.0-s1c),i)-1.0/cpow((-1.0-s1c),i));
       }
     }
     kj = 0;
     for (jj=0; jj<n; jj++) {
       s2 = zk[jj];
       n2 = mulp[jj];
       s2c = conj(s2);
       for (i=0; i<n1; i++) {
         for (j=0; j<n2; j++) {
           A[(ki+i)*nf+kj+j] = weights_entry(s1, s2c, i, j, lambda, mu, alp, bet);
           B[(ki+i)*nf+kj+j] = weights_entry(s1, s2, i, j, lambda, mu, alp, bet);
         }
       }
       kj = kj+n2;
     }
     ki = ki+n1;
   }
   free(alp);
   free(bet);

   /* second half of the right-hand side is the conjugate of the first */
   for (i=nf; i<2*nf; i++) {
     rhs[i] = conj(rhs[i-nf]);
   }

   /*---form mat = [conj(A),conj(B);B,A]---*/
   /* Note that mat is stored column-wise for lapack routine */
   for (i=0; i<nf; i++) {
     for(j=0; j<nf; j++) {
       mat[i+j*m] = conj(A[i*nf+j]);
     }
   }
   for (i=0; i<nf; i++) {
     for (j=nf; j<m; j++) {
       mat[i+j*m] = conj(B[i*nf+j-nf]);
     }
   }
   for (i=nf; i<m; i++) {
     for (j=0; j<nf; j++) {
       mat[i+j*m] = B[(i-nf)*nf+j];
     }
   }
   for (i=nf; i<m; i++) {
     for (j=nf; j<m; j++) {
       mat[i+j*m] = A[(i-nf)*nf+j-nf];
     }
   }

   ZGESV(&m, &nrhs, mat, &m, ipiv, rhs, &m, &INFO);
   if (INFO != 0) {
     /* best effort: report the failed solve instead of silently returning
        whatever is left in rhs */
     fprintf(stdout, " warning [%s (%d)]: ZGESV returned INFO = %d\n",
             __FILE__, __LINE__, INFO);
   }
   for(i=0;i<nf;i++) {
     omega[i] = rhs[i];
   }

   /* Scale coefs so that the filter value at 1.0 becomes 0.5 */
   double aa = 1.0;
   ratf2p2(n, mulp, zk, omega, 1, &aa, &scaling);
   scaling = 0.5 / scaling;
   for (i=0; i<nf; i++) {
     omega[i] *= scaling;
   }

   free(A);
   free(B);
   free(rhs);
   free(mat);
   free(ipiv);
 }


 /**
  * @brief Compute the weights and pole locations on [a, b].
  *
  * With c = (a+b)/2 and h = (b-a)/2, every pole is mapped to h*zk+c and the
  * coefficient of the (j+1)-th power of a pole is multiplied by h^(j+1).
  * The coefficients are then rescaled so that the filter evaluated by
  * ratf2p2 at a equals 0.5.
  *
  * @param[in]     n       number of poles
  * @param[in]     a,b     endpoints of the target interval
  * @param[in,out] zk      pole locations (length n), overwritten
  * @param[in]     mulp    multiplicity of each pole (length n)
  * @param[in,out] omegaM  weights (sum(mulp) entries), overwritten
  * @return always 0
  */
 int scaleweigthts(int n, double a, double b, complex double *zk, int* mulp,
                   complex double* omegaM) {
   int i, j, k, nf=0;
   double c, h;
   double tmp;

   c = 0.5 * (a + b);
   h = 0.5 * (b - a);
   for (i=0; i<n; i++) {
     nf += mulp[i];
     zk[i] = h*zk[i]+c;
   }

   /* Transform the coefs for multiple poles.  h is real, so its powers are
      accumulated by real multiplication instead of going through the
      complex power function. */
   k = 0;
   for (i=0; i<n; i++) {
     double hpow = 1.0;
     for (j=0; j<mulp[i]; j++) {
       hpow *= h;                     /* hpow == h^(j+1) */
       omegaM[k] = omegaM[k]*hpow;
       k++;
     }
   }

   /* Scale rational function so that its value at a becomes 1/2 */
   ratf2p2(n, mulp, zk, omegaM, 1, &a, &tmp);
   tmp = 0.5 / tmp;
   for (i=0; i<nf; i++) {
     omegaM[i] = omegaM[i] * tmp;
   }
   return 0;
 }


 /**
  * @brief Sets default values for ratparams struct.
  *
  * Only the scalar parameters listed below are written; the center (cc) and
  * width (dd) of the interval are not set here.
  *
  * @param[out] rat  structure receiving the defaults
  */
 void set_ratf_def(ratparams *rat) {
   /* interval [aa, bb] */
   rat->aa = -1.0;          /* left endpoint of interval */
   rat->bb = 1.0;           /* right endpoint of interval */

   /* poles */
   rat->method = 1;         /* using poles from mid-point rule */
   rat->num = 1;            /* number of the poles */
   rat->pw = 2;             /* default multiplicity of each pole */

   /* filter */
   rat->bar = 0.5;          /* this is fixed for rational filter */
   rat->beta = 0.01;        /* beta in LS approximation */
 }


 /**
  * @brief Set up the rational filter described by rat.
  *
  * Allocates rat->mulp, rat->zk and rat->omega (released by free_rat), gives
  * every pole the multiplicity rat->pw, stores the total multiplicity in
  * rat->pow, then computes the poles (contQuad), the weights on [-1, 1]
  * (weights) and finally maps both to [aa, bb] (scaleweigthts).
  * rat->ASIGBsol is reset to NULL before anything can fail, so that free_rat
  * is safe to call even when this function returns -1.
  *
  * @param[in]     intv  intv[0], intv[1]: requested interval; intv[2],
  *                      intv[3]: bounds the interval is clipped to
  *                      (presumably lmin/lmax of the spectrum -- TODO confirm)
  * @param[in,out] rat   num, pw, method and beta are read; zk, mulp, pow,
  *                      omega, aa, bb and ASIGBsol are written
  * @return 0 on success, -1 when check_intv rejects intv
  */
 int find_ratf(double *intv, ratparams *rat) {
   complex double *omega; // weights of the poles
   complex double *zk;    // location of the poles
   int *mulp;             // multiplicity of the each pole
   /* npow (not "pow") so the math library function is not shadowed */
   int n = rat->num, i, npow = 0, pw = rat->pw, method = rat->method;
   double beta = rat->beta;
   double aa, bb;

   /* no solver attached yet; done first so the early return below never
      leaves this pointer uninitialized */
   rat->ASIGBsol = NULL;

   /*-------------------- A few parameters to be set or reset */
   Malloc(mulp, n, int);
   Malloc(zk, n, complex double);
   for (i=0; i<n; i++) { // set the multiplicity of each pole
     mulp[i] = pw;
     npow += mulp[i];
   }
   rat->zk = zk;
   rat->mulp = mulp;
   rat->pow = npow; // total multiplicity of the poles
   Malloc(omega, npow, complex double);
   rat->omega = omega;

   //-------------------- intervals related
   if (check_intv(intv, stdout) < 0) {
     return -1;
   }
   aa = max(intv[0], intv[2]);  bb = min(intv[1], intv[3]);
   if (intv[0] < intv[2] || intv[1] > intv[3]) {
     fprintf(stdout, " warning [%s (%d)]: interval (%e, %e) is adjusted to (%e, %e)\n",
         __FILE__, __LINE__, intv[0], intv[1], aa, bb);
   }
   rat->aa = aa;
   rat->bb = bb;

   /*------------ compute the location of the poles */
   contQuad(method, n, zk);
   /*------------ compute expansion coefficients of rational filter on [-1, 1] */
   weights(n, zk, mulp, beta, omega);
   /*-------------------- compute expansion coefficients on [aa, bb]*/
   scaleweigthts(n, aa, bb, zk, mulp, omega);

   return 0;
 }


 /**
  * @brief Release the arrays owned by a ratparams struct.
  *
  * Frees mulp, omega, zk and ASIGBsol and resets the four pointers to NULL,
  * so calling this function twice on the same struct is harmless.
  * A NULL rat is ignored.
  *
  * @param[in,out] rat  structure whose arrays are released
  */
 void free_rat(ratparams *rat) {
   if (rat == NULL) {
     return;
   }
   free(rat->mulp);
   rat->mulp = NULL;
   free(rat->omega);
   rat->omega = NULL;
   free(rat->zk);
   rat->zk = NULL;
   free(rat->ASIGBsol);
   rat->ASIGBsol = NULL;
 }


 /**
  * @brief Apply rational filter R to a vector b.
  *
  * For every pole the coefficients are processed from the highest power
  * down to the first: the right-hand side is omega[idx]*b (plus the previous
  * solution, except on the first step) and the shifted system is solved
  * with solve_ASigB. Twice the real part of the final solution of each pole
  * is accumulated into x. The call is counted and timed in evslstat.
  *
  * @param[in]  n    length of the vectors
  * @param[in]  rat  filter: num, mulp, omega and ASIGBsol are read
  * @param[in]  b    input vector (length n)
  * @param[out] x    filtered vector (length n)
  * @param[in]  w6   workspace: 4*n doubles are used, 6*n when
  *                  evsldata.ifGenEv is set
  */
 void RatFiltApply(int n, ratparams *rat, double *b, double *x, double *w6) {
   const double t_start = evsl_timer();
   const int ifGenEv = evsldata.ifGenEv;
   const int npoles = rat->num;
   int *mulp = rat->mulp;
   complex double *omega = rat->omega;
   double two = 2.0;
   double unit = 1.0;
   int inc = 1;
   int pole, idx, first = 0, last;

   /* carve the workspace: solution (re, im), right-hand side (im, re) and,
      for the generalized problem only, an intermediate vector (re, im) */
   double *xr = w6;
   double *xz = xr + n;
   double *bz = xz + n;
   double *br = bz + n;
   double *yr = ifGenEv ? br + n : NULL;
   double *yz = ifGenEv ? yr + n : NULL;

   /*------------------ loop through each pole */
   for (pole = 0; pole < npoles; pole++) {
     /*---------------- solver for A-s[pole]*B */
     EVSLASIGMABSol *sol = &rat->ASIGBsol[pole];
     last = first + mulp[pole];
     /*------------------ power loop */
     for (idx = last-1; idx >= first; idx--) {
       /*---------------- weight */
       double wr = creal(omega[idx]);
       double wi = cimag(omega[idx]);
       /*---------------- initialize the right hand side */
       memcpy(br, b, n*sizeof(double));
       memcpy(bz, b, n*sizeof(double));
       DSCAL(&n, &wr, br, &inc);
       DSCAL(&n, &wi, bz, &inc);
       if (idx != last-1) {
         /* add the solution of the previous power */
         DAXPY(&n, &unit, xr, &inc, br, &inc);
         DAXPY(&n, &unit, xz, &inc, bz, &inc);
       }
       /*---------------- solve shifted system */
       if (ifGenEv && idx > first) {
         /* generalized problem, not yet the last power: the solution is
            multiplied by B before being reused */
         solve_ASigB(sol, n, br, bz, yr, yz);
         matvec_B(yr, xr);
         matvec_B(yz, xz);
       } else {
         solve_ASigB(sol, n, br, bz, xr, xz);
       }
     }
     /*------------------ solution (real part) */
     if (pole == 0) {
       memcpy(x, xr, n*sizeof(double));
       DSCAL(&n, &two, x, &inc);
     } else {
       DAXPY(&n, &two, xr, &inc, x, &inc);
     }
     first = last;
   }

   evslstat.n_ratAv ++;
   evslstat.t_ratAv += evsl_timer() - t_start;
 }


_evslstat::t_ratAv
double t_ratAv
Definition: struct.h:212

_ratparams::zk
complex double * zk
Definition: struct.h:126

_ratparams::num
int num
Definition: struct.h:114

free_rat
void free_rat(ratparams *rat)
Definition: ratfilter.c:424

_ratparams::bar
double bar
Definition: struct.h:120

DSTEV
void DSTEV(char *jobz, int *n, double *diagonal, double *subdiagonal, double *V, int *ldz, double *work, int *info)

def.h
defs in EVSL

_evsldata::ifGenEv
int ifGenEv
Definition: struct.h:166

_ratparams::pow
int pow
Definition: struct.h:123

DSCAL
void DSCAL(int *n, double *a, double *x, int *incx)

_ratparams::pw
int pw
Definition: struct.h:115

_ratparams::method
int method
Definition: struct.h:116

internal_proto.h
This file contains function prototypes and constant definitions internally used in EVSL...

min
#define min(a, b)
Definition: def.h:62

_ratparams::ASIGBsol
EVSLASIGMABSol * ASIGBsol
Definition: struct.h:127

weights
void weights(int n, complex double *zk, int *mulp, double lambda, complex double *omega)
Compute the LS weight for each multiple pole.
Definition: ratfilter.c:169

Malloc
#define Malloc(base, nmem, type)
Definition: def.h:22

evslstat
evslStat evslstat
global statistics of EVSL
Definition: evsl.c:21

struct.h
structs used in evsl

_EVSLASIGMABSol
user-provided function and data for solving (A - SIGMA*B) x = b
Definition: struct.h:102

_evslstat::n_ratAv
size_t n_ratAv
Definition: struct.h:220

_ratparams::aa
double aa
Definition: struct.h:118

DAXPY
void DAXPY(int *n, double *alpha, double *x, int *incx, double *y, int *incy)

max
#define max(a, b)
Definition: def.h:56

scaleweigthts
int scaleweigthts(int n, double a, double b, complex double *zk, int *mulp, complex double *omegaM)
Compute the weights and pole locations on [a, b].
Definition: ratfilter.c:313

blaslapack.h
Defs for blaslapack routines.

integg2
complex double integg2(complex double s1, complex double s2, complex double *alp, int k1, complex double *bet, int k2, double a, double b)
Integration of 1/[(z-s1)^k1 (z-s2)^k2] from a to b.
Definition: ratfilter.c:129

pfe2
void pfe2(complex double s1, complex double s2, int k1, int k2, complex double *alp, complex double *bet)
Get the fraction expansion of 1/[(z-s1)^k1 (z-s2)^k2].
Definition: ratfilter.c:95

evsldata
evslData evsldata
global variable of EVSL
Definition: evsl.c:15

_ratparams::beta
double beta
Definition: struct.h:117

set_ratf_def
void set_ratf_def(ratparams *rat)
Sets default values for ratparams struct.
Definition: ratfilter.c:345

M_PI
#define M_PI
Definition: def.h:13

_ratparams::mulp
int * mulp
Definition: struct.h:122

find_ratf
int find_ratf(double *intv, ratparams *rat)
Definition: ratfilter.c:375

contQuad
void contQuad(int method, int n, complex double *zk)
Compute the locations of the poles.
Definition: ratfilter.c:23

ratf2p2
void ratf2p2(int n, int *mulp, complex double *zk, complex double *alp, int m, double *z, double *xx)
Compute the function value of the multiple pole rational filter at real locations.
Definition: ratfilter.c:69

RatFiltApply
void RatFiltApply(int n, ratparams *rat, double *b, double *x, double *w6)
Apply rational filter R to a vector b.
Definition: ratfilter.c:448

_ratparams::omega
complex double * omega
Definition: struct.h:125

evsl_timer
double evsl_timer()
evsl timer for mac
Definition: mactime.c:14

_ratparams::bb
double bb
Definition: struct.h:119

_ratparams
parameters for rational filter
Definition: struct.h:112

ZGESV
void ZGESV(int *n, int *nrow, complex double *A, int *m, int *ipiv, complex double *rhs, int *k, int *INFO)