NFFT 3.2.3 API Reference - mpolar_fft

Go to the documentation of this file.
 /*
  * Copyright (c) 2002, 2012 Jens Keiner, Stefan Kunis, Daniel Potts
  *
  * This program is free software; you can redistribute it and/or modify it under
  * the terms of the GNU General Public License as published by the Free Software
  * Foundation; either version 2 of the License, or (at your option) any later
  * version.
  *
  * This program is distributed in the hope that it will be useful, but WITHOUT
  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
  * FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more
  * details.
  *
  * You should have received a copy of the GNU General Public License along with
  * this program; if not, write to the Free Software Foundation, Inc., 51
  * Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
  */
 
 /* $Id: mpolar_fft_test.c 3896 2012-10-10 12:19:26Z tovo $ */
 
 #include "config.h"
 
 #include <math.h>
 #include <stdlib.h>
 #ifdef HAVE_COMPLEX_H
 #include <complex.h>
 #endif
 
 #include "nfft3util.h"
 #include "nfft3.h"
 #include "infft.h"
 
 /* Result of the most recent nfft_elapsed_seconds() measurement. It is
  * overwritten by mpolar_dft(), mpolar_fft(), inverse_mpolar_fft() and
  * comparison_fft(), and read back by the callers to report timings. */
 double GLOBAL_elapsed_time;
 
 static int mpolar_grid(int T, int R, double *x, double *w)
 {
   int t, r;
   double W;
   int R2=2*ceil(sqrt(2.0)*R/2);
   double xx, yy;
   int M=0;
 
   for(t=-T/2; t<T/2; t++)
   {
     for(r=-R2/2; r<R2/2; r++)
     {
       xx = (double)r/R*cos(PI*t/T);
       yy = (double)r/R*sin(PI*t/T);
 
       if ( ((-0.5-1.0/(double)R)<=xx) & (xx<=(0.5+1.0/(double)R)) &
         ((-0.5-1.0/(double)R)<=yy) & (yy<=(0.5+1.0/(double)R)) )
       {
         x[2*M+0] = xx;
         x[2*M+1] = yy;
 
         if (r==0)
           w[M] = 1.0/4.0;
         else
           w[M] = fabs((double)r);
 
         M++; 
       }
     }
   }
 
    W=0.0;
    for (t=0; t<M; t++)
       W+=w[t];
 
    for (t=0; t<M; t++)
     w[t]/=W;
 
   return M;                             
 }
 
 static int mpolar_dft(fftw_complex *f_hat, int NN, fftw_complex *f, int T, int R, int m)
 {
   ticks t0, t1;
   int j,k;                              
   nfft_plan my_nfft_plan;               
   double *x, *w;                        
   int N[2],n[2];
   int M;                                
   N[0]=NN; n[0]=2*N[0];                 
   N[1]=NN; n[1]=2*N[1];                 
   x = (double *)nfft_malloc(5*(T/2)*R*(sizeof(double)));
   if (x==NULL)
     return -1;
 
   w = (double *)nfft_malloc(5*(T*R)/4*(sizeof(double)));
   if (w==NULL)
     return -1;
 
   M=mpolar_grid(T,R,x,w);
   nfft_init_guru(&my_nfft_plan, 2, N, M, n, m,
                   PRE_PHI_HUT| PRE_PSI| MALLOC_X | MALLOC_F_HAT| MALLOC_F| FFTW_INIT | FFT_OUT_OF_PLACE,
                   FFTW_MEASURE| FFTW_DESTROY_INPUT);
 
   for(j=0;j<my_nfft_plan.M_total;j++)
   {
     my_nfft_plan.x[2*j+0] = x[2*j+0];
     my_nfft_plan.x[2*j+1] = x[2*j+1];
   }
 
   for(k=0;k<my_nfft_plan.N_total;k++)
     my_nfft_plan.f_hat[k] = f_hat[k];
 
   t0 = getticks();
 
   nfft_trafo_direct(&my_nfft_plan);
 
   t1 = getticks();
   GLOBAL_elapsed_time = nfft_elapsed_seconds(t1,t0);
 
   for(j=0;j<my_nfft_plan.M_total;j++)
     f[j] = my_nfft_plan.f[j];
 
   nfft_finalize(&my_nfft_plan);
   nfft_free(x);
   nfft_free(w);
 
   return EXIT_SUCCESS;
 }
 
 static int mpolar_fft(fftw_complex *f_hat, int NN, fftw_complex *f, int T, int R, int m)
 {
   ticks t0, t1;
   int j,k;                              
   nfft_plan my_nfft_plan;               
   double *x, *w;                        
   int N[2],n[2];
   int M;                                
   N[0]=NN; n[0]=2*N[0];                 
   N[1]=NN; n[1]=2*N[1];                 
   x = (double *)nfft_malloc(5*T*R/2*(sizeof(double)));
   if (x==NULL)
     return -1;
 
   w = (double *)nfft_malloc(5*T*R/4*(sizeof(double)));
   if (w==NULL)
     return -1;
 
   M=mpolar_grid(T,R,x,w);
   nfft_init_guru(&my_nfft_plan, 2, N, M, n, m,
                   PRE_PHI_HUT| PRE_PSI| MALLOC_X | MALLOC_F_HAT| MALLOC_F| FFTW_INIT | FFT_OUT_OF_PLACE,
                   FFTW_MEASURE| FFTW_DESTROY_INPUT);
 
   for(j=0;j<my_nfft_plan.M_total;j++)
   {
     my_nfft_plan.x[2*j+0] = x[2*j+0];
     my_nfft_plan.x[2*j+1] = x[2*j+1];
   }
 
   if(my_nfft_plan.nfft_flags & PRE_LIN_PSI)
     nfft_precompute_lin_psi(&my_nfft_plan);
 
   if(my_nfft_plan.nfft_flags & PRE_PSI)
     nfft_precompute_psi(&my_nfft_plan);
 
   if(my_nfft_plan.nfft_flags & PRE_FULL_PSI)
     nfft_precompute_full_psi(&my_nfft_plan);
 
   for(k=0;k<my_nfft_plan.N_total;k++)
     my_nfft_plan.f_hat[k] = f_hat[k];
 
   t0 = getticks();
 
   nfft_trafo(&my_nfft_plan);
 
   t1 = getticks();
   GLOBAL_elapsed_time = nfft_elapsed_seconds(t1,t0);
 
   for(j=0;j<my_nfft_plan.M_total;j++)
     f[j] = my_nfft_plan.f[j];
 
   nfft_finalize(&my_nfft_plan);
   nfft_free(x);
   nfft_free(w);
 
   return EXIT_SUCCESS;
 }
 
 static int inverse_mpolar_fft(fftw_complex *f, int T, int R, fftw_complex *f_hat, int NN, int max_i, int m)
 {
   ticks t0, t1;
   int j,k;                              
   nfft_plan my_nfft_plan;               
   solver_plan_complex my_infft_plan;             
   double *x, *w;                        
   int l;                                
   int N[2],n[2];
   int M;                                
   N[0]=NN; n[0]=2*N[0];                 
   N[1]=NN; n[1]=2*N[1];                 
   x = (double *)nfft_malloc(5*T*R/2*(sizeof(double)));
   if (x==NULL)
     return -1;
 
   w = (double *)nfft_malloc(5*T*R/4*(sizeof(double)));
   if (w==NULL)
     return -1;
 
   M=mpolar_grid(T,R,x,w);
   nfft_init_guru(&my_nfft_plan, 2, N, M, n, m,
                   PRE_PHI_HUT| PRE_PSI| MALLOC_X | MALLOC_F_HAT| MALLOC_F| FFTW_INIT | FFT_OUT_OF_PLACE,
                   FFTW_MEASURE| FFTW_DESTROY_INPUT);
 
     solver_init_advanced_complex(&my_infft_plan,(nfft_mv_plan_complex*)(&my_nfft_plan), CGNR | PRECOMPUTE_WEIGHT );
 
   for(j=0;j<my_nfft_plan.M_total;j++)
   {
     my_nfft_plan.x[2*j+0] = x[2*j+0];
     my_nfft_plan.x[2*j+1] = x[2*j+1];
     my_infft_plan.y[j]    = f[j];
     my_infft_plan.w[j]    = w[j];
   }
 
   if(my_nfft_plan.nfft_flags & PRE_LIN_PSI)
     nfft_precompute_lin_psi(&my_nfft_plan);
 
   if(my_nfft_plan.nfft_flags & PRE_PSI)
     nfft_precompute_psi(&my_nfft_plan);
 
   if(my_nfft_plan.nfft_flags & PRE_FULL_PSI)
     nfft_precompute_full_psi(&my_nfft_plan);
 
 
  if(my_infft_plan.flags & PRECOMPUTE_DAMP)
    for(j=0;j<my_nfft_plan.N[0];j++)
      for(k=0;k<my_nfft_plan.N[1];k++)
      {
         my_infft_plan.w_hat[j*my_nfft_plan.N[1]+k]=
           (sqrt(pow(j-my_nfft_plan.N[0]/2,2)+pow(k-my_nfft_plan.N[1]/2,2))>(my_nfft_plan.N[0]/2)?0:1);
      }
 
   for(k=0;k<my_nfft_plan.N_total;k++)
       my_infft_plan.f_hat_iter[k] = 0.0 + _Complex_I*0.0;
 
   t0 = getticks();
 
   solver_before_loop_complex(&my_infft_plan);
 
   if (max_i<1)
   {
     l=1;
     for(k=0;k<my_nfft_plan.N_total;k++)
       my_infft_plan.f_hat_iter[k] = my_infft_plan.p_hat_iter[k];
   }
   else
   {
     for(l=1;l<=max_i;l++)
     {
       solver_loop_one_step_complex(&my_infft_plan);
     }
   }
 
   t1 = getticks();
   GLOBAL_elapsed_time = nfft_elapsed_seconds(t1,t0);
 
   for(k=0;k<my_nfft_plan.N_total;k++)
     f_hat[k] = my_infft_plan.f_hat_iter[k];
 
   solver_finalize_complex(&my_infft_plan);
   nfft_finalize(&my_nfft_plan);
   nfft_free(x);
   nfft_free(w);
 
   return EXIT_SUCCESS;
 }
 
 static int comparison_fft(FILE *fp, int N, int T, int R)
 {
   ticks t0, t1;
   fftw_plan my_fftw_plan;
   fftw_complex *f_hat,*f;
   int m,k;
   double t_fft, t_dft_mpolar;
 
   f_hat = (fftw_complex *)nfft_malloc(sizeof(fftw_complex)*N*N);
   f     = (fftw_complex *)nfft_malloc(sizeof(fftw_complex)*(T*R/4)*5);
 
   my_fftw_plan = fftw_plan_dft_2d(N,N,f_hat,f,FFTW_BACKWARD,FFTW_MEASURE);
 
   for(k=0; k<N*N; k++)
     f_hat[k] = (((double)rand())/RAND_MAX) + _Complex_I* (((double)rand())/RAND_MAX);
 
   t0 = getticks();
   for(m=0;m<65536/N;m++)
     {
       fftw_execute(my_fftw_plan);
       /* touch */
       f_hat[2]=2*f_hat[0];
     }
   t1 = getticks();
   GLOBAL_elapsed_time = nfft_elapsed_seconds(t1,t0);
   t_fft=N*GLOBAL_elapsed_time/65536;
 
   if(N<256)
     {
       mpolar_dft(f_hat,N,f,T,R,1);
       t_dft_mpolar=GLOBAL_elapsed_time;
     }
 
   for (m=3; m<=9; m+=3)
     {
       if((m==3)&&(N<256))
         fprintf(fp,"%d\t&\t&\t%1.1e&\t%1.1e&\t%d\t",N,t_fft,t_dft_mpolar,m);
       else
         if(m==3)
     fprintf(fp,"%d\t&\t&\t%1.1e&\t       &\t%d\t",N,t_fft,m);
   else
     fprintf(fp,"  \t&\t&\t       &\t       &\t%d\t",m);
 
       printf("N=%d\tt_fft=%1.1e\tt_dft_mpolar=%1.1e\tm=%d\t",N,t_fft,t_dft_mpolar,m);
 
       mpolar_fft(f_hat,N,f,T,R,m);
       fprintf(fp,"%1.1e&\t",GLOBAL_elapsed_time);
       printf("t_mpolar=%1.1e\t",GLOBAL_elapsed_time);
       inverse_mpolar_fft(f,T,R,f_hat,N,2*m,m);
       if(m==9)
   fprintf(fp,"%1.1e\\\\\\hline\n",GLOBAL_elapsed_time);
       else
   fprintf(fp,"%1.1e\\\\\n",GLOBAL_elapsed_time);
       printf("t_impolar=%1.1e\n",GLOBAL_elapsed_time);
     }
 
   fflush(fp);
 
   nfft_free(f);
   nfft_free(f_hat);
 
   return EXIT_SUCCESS;
 }
 
 int main(int argc,char **argv)
 {
   int N;                                
   int T, R;                             
   int M;                                
   double *x, *w;                        
   fftw_complex *f_hat, *f, *f_direct, *f_tilde;
   int k;
   int max_i;                            
   int m;
   double temp1, temp2, E_max=0.0;
   FILE *fp1, *fp2;
   char filename[30];
   int logN;
 
   if( argc!=4 )
   {
     printf("mpolar_fft_test N T R \n");
     printf("\n");
     printf("N          mpolar FFT of size NxN    \n");
     printf("T          number of slopes          \n");
     printf("R          number of offsets         \n");
 
     printf("\nHence, comparison FFTW, mpolar FFT and inverse mpolar FFT\n");
     fp1=fopen("mpolar_comparison_fft.dat","w");
     if (fp1==NULL)
   return(-1);
     for (logN=4; logN<=8; logN++)
   comparison_fft(fp1,(1U<< logN), 3*(1U<< logN), 3*(1U<< (logN-1)));
     fclose(fp1);
 
     exit(-1);
   }
 
   N = atoi(argv[1]);
   T = atoi(argv[2]);
   R = atoi(argv[3]);
   printf("N=%d, modified polar grid with T=%d, R=%d => ",N,T,R);
 
   x = (double *)nfft_malloc(5*T*R/2*(sizeof(double)));
   w = (double *)nfft_malloc(5*T*R/4*(sizeof(double)));
 
   f_hat    = (fftw_complex *)nfft_malloc(sizeof(fftw_complex)*N*N);
   f        = (fftw_complex *)nfft_malloc(sizeof(fftw_complex)*1.25*T*R);  /* 4/pi*log(1+sqrt(2)) = 1.122... < 1.25 */
   f_direct = (fftw_complex *)nfft_malloc(sizeof(fftw_complex)*1.25*T*R);
   f_tilde  = (fftw_complex *)nfft_malloc(sizeof(fftw_complex)*N*N);
 
   M=mpolar_grid(T,R,x,w); printf("M=%d.\n",M);
 
   fp1=fopen("input_data_r.dat","r");
   fp2=fopen("input_data_i.dat","r");
   if ((fp1==NULL) || (fp2==NULL))
     return(-1);
   for(k=0;k<N*N;k++)
   {
     fscanf(fp1,"%le ",&temp1);
     fscanf(fp2,"%le ",&temp2);
     f_hat[k]=temp1+ _Complex_I*temp2;
   }
   fclose(fp1);
   fclose(fp2);
 
       mpolar_dft(f_hat,N,f_direct,T,R,1);
   //  mpolar_fft(f_hat,N,f_direct,T,R,12);
 
   printf("\nTest of the mpolar FFT: \n");
   fp1=fopen("mpolar_fft_error.dat","w+");
   for (m=1; m<=12; m++)
   {
     mpolar_fft(f_hat,N,f,T,R,m);
 
     E_max=X(error_l_infty_complex)(f_direct,f,M);
     printf("m=%2d: E_max = %e\n",m,E_max);
     fprintf(fp1,"%e\n",E_max);
   }
   fclose(fp1);
 
   for (m=3; m<=9; m+=3)
   {
     printf("\nTest of the inverse mpolar FFT for m=%d: \n",m);
     sprintf(filename,"mpolar_ifft_error%d.dat",m);
     fp1=fopen(filename,"w+");
     for (max_i=0; max_i<=20; max_i+=2)
     {
       inverse_mpolar_fft(f_direct,T,R,f_tilde,N,max_i,m);
 
       E_max=X(error_l_infty_complex)(f_hat,f_tilde,N*N);
       printf("%3d iterations: E_max = %e\n",max_i,E_max);
       fprintf(fp1,"%e\n",E_max);
     }
     fclose(fp1);
   }
 
   nfft_free(x);
   nfft_free(w);
   nfft_free(f_hat);
   nfft_free(f);
   nfft_free(f_direct);
   nfft_free(f_tilde);
 
   return 0;
 }
 /* \} */