# include # include # include # include # include using namespace std; int main ( void ); void ccopy ( int n, float x[], float y[] ); void cfft2 ( int n, float x[], float y[], float w[], float sgn ); void cffti ( int n, float w[] ); double cpu_time ( void ); float ggl ( float *ds ); void step ( int n, int mj, float a[], float b[], float c[], float d[], float w[], float sgn ); //****************************************************************************80 int main ( void ) //****************************************************************************80 // // Purpose: // // MAIN is the main program for FFT. // // Discussion: // // The complex data in an N vector is stored as pairs of values in a // real vector of length 2*N. // // Modified: // // 16 July 2008 // // Author: // // C original version by Wesley Petersen // C++ version by John Burkardt // // Reference: // // Wesley Petersen, Peter Arbenz, // Introduction to Parallel Computing - A practical guide with examples in C, // Oxford University Press, // ISBN: 0-19-851576-6, // LC: QA76.58.P47. // { double ctime; double ctime1; double ctime2; float error; int first; int flops; float fnm1; int i; int icase; int it; int ln2; double mflops; int n; int nits = 10000; static float seed; float sgn; float *w; float *x; float *y; float *z; float z0; float z1; cout << "\n"; cout << "FFT\n"; cout << " C++ version\n"; cout << "\n"; cout << " Demonstrate an implementation of the Fast Fourier Transform\n"; cout << " of a complex data vector.\n"; // // Prepare for tests. // cout << "\n"; cout << " Accuracy check:\n"; cout << "\n"; cout << " FFT ( FFT ( X(1:N) ) ) == N * X(1:N)\n"; cout << "\n"; cout << " N Error Time MFLOPS\n"; cout << "\n"; seed = 331.0; n = 1; // // LN2 is the log base 2 of N. Each increase of LN2 doubles N. // for ( ln2 = 1; ln2 <= 20; ln2++ ) { n = 2 * n; // // Allocate storage for the complex arrays W, X, Y, Z. // // We handle the complex arithmetic, // and store a complex number as a pair of floats, a complex vector as a doubly // dimensioned array whose second dimension is 2. // w = new float[ n]; x = new float[2*n]; y = new float[2*n]; z = new float[2*n]; first = 1; for ( icase = 0; icase < 2; icase++ ) { if ( first ) { for ( i = 0; i < 2 * n; i = i + 2 ) { z0 = ggl ( &seed ); z1 = ggl ( &seed ); x[i] = z0; z[i] = z0; x[i+1] = z1; z[i+1] = z1; } } else { for ( i = 0; i < 2 * n; i = i + 2 ) { z0 = 0.0; z1 = 0.0; x[i] = z0; z[i] = z0; x[i+1] = z1; z[i+1] = z1; } } // // Initialize the sine and cosine tables. // cffti ( n, w ); // // Transform forward, back // if ( first ) { sgn = + 1.0; cfft2 ( n, x, y, w, sgn ); sgn = - 1.0; cfft2 ( n, y, x, w, sgn ); // // Results should be same as initial multiplied by N. // fnm1 = 1.0 / ( float ) n; error = 0.0; for ( i = 0; i < 2 * n; i = i + 2 ) { error = error + pow ( z[i] - fnm1 * x[i], 2 ) + pow ( z[i+1] - fnm1 * x[i+1], 2 ); } error = sqrt ( fnm1 * error ); cout << " " << setw(12) << n << " " << setw(12) << error; first = 0; } else { ctime1 = cpu_time ( ); for ( it = 0; it < nits; it++ ) { sgn = + 1.0; cfft2 ( n, x, y, w, sgn ); sgn = - 1.0; cfft2 ( n, y, x, w, sgn ); } ctime2 = cpu_time ( ); ctime = ctime2 - ctime1; flops = 2 * nits * ( 5 * n * ln2 ); mflops = ( double ) ( flops ) / 1.0E+06 / ctime; cout << " " << setw(12) << ctime / ( double ) ( 2 * nits ) << " " << setw(12) << mflops << "\n"; } } if ( ( ln2 % 4 ) == 0 ) { nits = nits / 10; } if ( nits < 1 ) { nits = 1; } delete [] w; delete [] x; delete [] y; delete [] z; } cout << "\n"; cout << "FFT:\n"; cout << " Normal end of execution.\n"; return 0; } //****************************************************************************80 void ccopy ( int n, float x[], float y[] ) //****************************************************************************80 // // Purpose: // // CCOPY copies a complex vector. // // Discussion: // // The "complex" vector A[N] is actually stored as a float vector B[2*N]. // // The "complex" vector entry A[I] is stored as: // // B[I*2+0], the real part, // B[I*2+1], the imaginary part. // // Modified: // // 27 April 2008 // // Author: // // C original version by Wesley Petersen // C++ version by John Burkardt // // Reference: // // Wesley Petersen, Peter Arbenz, // Introduction to Parallel Computing - A practical guide with examples in C, // Oxford University Press, // ISBN: 0-19-851576-6, // LC: QA76.58.P47. // // Parameters: // // Input, int N, the length of the "complex" array. // // Input, "complex X[N]", the array to be copied. // // Output, "complex Y[N]", a copy of X. // { int i; for ( i = 0; i < n; i++ ) { y[i*2+0] = x[i*2+0]; y[i*2+1] = x[i*2+1]; } return; } //****************************************************************************80 void cfft2 ( int n, float x[], float y[], float w[], float sgn ) //****************************************************************************80 // // Purpose: // // CFFT2 performs a complex Fast Fourier Transform. // // Modified: // // 27 April 2008 // // Author: // // C original version by Wesley Petersen // C++ version by John Burkardt // // Reference: // // Wesley Petersen, Peter Arbenz, // Introduction to Parallel Computing - A practical guide with examples in C, // Oxford University Press, // ISBN: 0-19-851576-6, // LC: QA76.58.P47. // // Parameters: // // Input, int N, the size of the array to be transformed. // // Input/output, float X[2*N], the data to be transformed. // On output, the contents of X have been overwritten by work information. // // Output, float Y[2*N], the forward or backward FFT of X. // // Input, float W[N], a table of sines and cosines. // // Input, float SGN, is +1 for a "forward" FFT and -1 for a "backward" FFT. // { int j; int m; int mj; int tgle; m = ( int ) ( log ( ( float ) n ) / log ( 1.99 ) ); mj = 1; // // Toggling switch for work array. // tgle = 1; step ( n, mj, &x[0*2+0], &x[(n/2)*2+0], &y[0*2+0], &y[mj*2+0], w, sgn ); if ( n == 2 ) { return; } for ( j = 0; j < m - 2; j++ ) { mj = mj * 2; if ( tgle ) { step ( n, mj, &y[0*2+0], &y[(n/2)*2+0], &x[0*2+0], &x[mj*2+0], w, sgn ); tgle = 0; } else { step ( n, mj, &x[0*2+0], &x[(n/2)*2+0], &y[0*2+0], &y[mj*2+0], w, sgn ); tgle = 1; } } // // Last pass thru data: move y to x if needed // if ( tgle ) { ccopy ( n, y, x ); } mj = n / 2; step ( n, mj, &x[0*2+0], &x[(n/2)*2+0], &y[0*2+0], &y[mj*2+0], w, sgn ); return; } //****************************************************************************80 void cffti ( int n, float w[] ) //****************************************************************************80 // // Purpose: // // CFFTI sets up sine and cosine tables needed for the FFT calculation. // // Modified: // // 27 April 2008 // // Author: // // C original version by Wesley Petersen // C++ version by John Burkardt // // Reference: // // Wesley Petersen, Peter Arbenz, // Introduction to Parallel Computing - A practical guide with examples in C, // Oxford University Press, // ISBN: 0-19-851576-6, // LC: QA76.58.P47. // // Parameters: // // Input, int N, the size of the array to be transformed. // // Output, float W[N], a table of sines and cosines. // { float arg; float aw; int i; int n2; const float pi = 3.141592653589793; n2 = n / 2; aw = 2.0 * pi / ( ( float ) n ); for ( i = 0; i < n2; i++ ) { arg = aw * ( ( float ) i ); w[i*2+0] = cos ( arg ); w[i*2+1] = sin ( arg ); } return; } //****************************************************************************80 double cpu_time ( void ) //****************************************************************************80 // // Purpose: // // CPU_TIME reports the elapsed CPU time. // // Modified: // // 27 September 2005 // // Author: // // John Burkardt // // Parameters: // // Output, double CPU_TIME, the current total elapsed CPU time in second. // { double value; value = ( double ) clock ( ) / ( double ) CLOCKS_PER_SEC; return value; } //****************************************************************************80 float ggl ( float *seed ) //****************************************************************************80 // // Purpose: // // GGL generates uniformly distributed pseudorandom numbers. // // Modified: // // 16 July 2008 // // Author: // // C original version by Wesley Petersen, M Troyer, I Vattulainen // C++ version by John Burkardt // // Reference: // // Wesley Petersen, Peter Arbenz, // Introduction to Parallel Computing - A practical guide with examples in C, // Oxford University Press, // ISBN: 0-19-851576-6, // LC: QA76.58.P47. // // Parameters: // // Input/output, float *SEED, used as a seed for the sequence. // // Output, real GGL, the next pseudorandom value. // { double d2 = 0.2147483647e10; double t; float value; t = ( double ) *seed; t = fmod ( 16807.0 * t, d2 ); *seed = ( float ) t; value = ( float ) ( ( t - 1.0 ) / ( d2 - 1.0 ) ); return value; } //****************************************************************************80 void step ( int n, int mj, float a[], float b[], float c[], float d[], float w[], float sgn ) //****************************************************************************80 // // Purpose: // // STEP carries out one step of the workspace version of CFFT2. // // Modified: // // 27 April 2008 // // Author: // // C original version by Wesley Petersen // C++ version by John Burkardt // // Reference: // // Wesley Petersen, Peter Arbenz, // Introduction to Parallel Computing - A practical guide with examples in C, // Oxford University Press, // ISBN: 0-19-851576-6, // LC: QA76.58.P47. // { float ambr; float ambu; int j; int ja; int jb; int jc; int jd; int jw; int k; int lj; int mj2; float wjw[2]; mj2 = 2 * mj; lj = n / mj2; for ( j = 0; j < lj; j++ ) { jw = j * mj; ja = jw; jb = ja; jc = j * mj2; jd = jc; wjw[0] = w[jw*2+0]; wjw[1] = w[jw*2+1]; if ( sgn < 0.0 ) { wjw[1] = - wjw[1]; } for ( k = 0; k < mj; k++ ) { c[(jc+k)*2+0] = a[(ja+k)*2+0] + b[(jb+k)*2+0]; c[(jc+k)*2+1] = a[(ja+k)*2+1] + b[(jb+k)*2+1]; ambr = a[(ja+k)*2+0] - b[(jb+k)*2+0]; ambu = a[(ja+k)*2+1] - b[(jb+k)*2+1]; d[(jd+k)*2+0] = wjw[0] * ambr - wjw[1] * ambu; d[(jd+k)*2+1] = wjw[1] * ambr + wjw[0] * ambu; } } return; }