⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 rfftw_mpi_test.c

📁 FFTW, a collection of fast C routines to compute the Discrete Fourier Transform in one or more dime
💻 C
📖 第 1 页 / 共 2 页
字号:
{     WHEN_VERBOSE(2,		  printf("TEST CORRECTNESS (in place, FFTW_FORWARD, %s) "			 "n = %d  istride = %d  howmany = %d\n",			 SPECIFICP(0),			 n, istride, howmany));     test_in_place(n, istride, howmany, FFTW_FORWARD,		   validated_plan_forward, 0);          WHEN_VERBOSE(2,		  printf("TEST CORRECTNESS (in place, FFTW_BACKWARD, %s) "			 "n = %d  istride = %d  howmany = %d\n",			 SPECIFICP(0),			 n, istride, howmany));     test_in_place(n, istride, howmany, FFTW_BACKWARD,		   validated_plan_backward, 0);}void test_correctness(int n){}/************************************************* * multi-dimensional correctness tests *************************************************/void testnd_out_of_place(int rank, int *n, fftwnd_plan validated_plan){}void testnd_in_place(int rank, int *n, fftwnd_plan validated_plan,		     int alternate_api, int specific){     int local_nx, local_x_start, local_ny_after_transpose,          local_y_start_after_transpose, total_local_size;     int istride, ostride, howmany;     int N, dim, i, j, k;     int nc, nhc, nr;     fftw_real *in1, *out3, *work = 0;     fftw_complex *in2, *out1, *out2;     rfftwnd_mpi_plan p = 0, ip = 0;     int flags = measure_flag | wisdom_flag | FFTW_IN_PLACE;     if (specific || rank < 2)          return;     if (coinflip())	  flags |= FFTW_THREADSAFE;     N = nc = nr = nhc = 1;     for (dim = 0; dim < rank; ++dim)	  N *= n[dim];     if (rank > 0) {	  nr = n[rank - 1];	  nc = N / nr;	  nhc = nr / 2 + 1;     }     if (alternate_api && (rank == 2 || rank == 3)) {	  if (rank == 2) {	       p = rfftw2d_mpi_create_plan(MPI_COMM_WORLD,					   n[0], n[1], FFTW_REAL_TO_COMPLEX,					   flags);	       ip = rfftw2d_mpi_create_plan(MPI_COMM_WORLD,					    n[0], n[1], FFTW_COMPLEX_TO_REAL,					    flags);	  } else {	       p = rfftw3d_mpi_create_plan(MPI_COMM_WORLD,					   n[0], n[1], n[2],					   FFTW_REAL_TO_COMPLEX, flags);	       ip = rfftw3d_mpi_create_plan(MPI_COMM_WORLD,					    n[0], n[1], n[2],					    FFTW_COMPLEX_TO_REAL, flags);	  }     }     else {	  p = rfftwnd_mpi_create_plan(MPI_COMM_WORLD,				      rank, n, FFTW_REAL_TO_COMPLEX, flags);	  ip = rfftwnd_mpi_create_plan(MPI_COMM_WORLD, 				       rank, n, FFTW_COMPLEX_TO_REAL, flags);     }     CHECK(p != NULL && ip != NULL, "can't create plan");     rfftwnd_mpi_local_sizes(p, &local_nx, &local_x_start,			     &local_ny_after_transpose,			     &local_y_start_after_transpose,			     &total_local_size);          in1 = (fftw_real *) fftw_malloc(total_local_size				     * MAX_STRIDE * sizeof(fftw_real));     if (coinflip()) {          WHEN_VERBOSE(1, my_printf("w/work..."));	  work = (fftw_real *) fftw_malloc(total_local_size 					   * MAX_STRIDE * sizeof(fftw_real));     }     out3 = in1;     out1 = (fftw_complex *) in1;     in2 = (fftw_complex *) fftw_malloc(N * sizeof(fftw_complex));     out2 = (fftw_complex *) fftw_malloc(N * sizeof(fftw_complex));     for (i = 0; i < total_local_size * MAX_STRIDE; ++i)	  out3[i] = 0;     for (istride = 1; istride <= MAX_STRIDE; ++istride) {	  /* generate random inputs */	  for (i = 0; i < nc; ++i)	       for (j = 0; j < nr; ++j) {		    c_re(in2[i * nr + j]) = DRAND();		    c_im(in2[i * nr + j]) = 0.0;	       }	  for (i = 0; i < local_nx * (nc / n[0]); ++i)	       for (j = 0; j < nr; ++j) {		    for (k = 0; k < istride; ++k)			 in1[(i * nhc * 2 + j) * istride + k]			     = c_re((in2 + local_x_start * (N/n[0]))				     [i * nr + j]);	       }	  fftwnd(validated_plan, 1, in2, 1, 1, out2, 1, 1);	  howmany = ostride = istride;	  WHEN_VERBOSE(2, printf("\n    testing in-place stride %d...",				 istride));	  rfftwnd_mpi(p, howmany, in1, work, FFTW_NORMAL_ORDER);	  for (i = 0; i < local_nx * (nc / n[0]); ++i)	       for (k = 0; k < howmany; ++k)		    CHECK(compute_error_complex(out1 + i * nhc * ostride + k,						ostride,						out2 + local_x_start*(N/n[0])						+ i * nr, 1,						nhc) < TOLERANCE,			  "in-place (r2c): wrong answer");	  rfftwnd_mpi(ip, howmany, in1, work, FFTW_NORMAL_ORDER);	  for (i = 0; i < total_local_size * istride; ++i)	       out3[i] *= 1.0 / N;	  for (i = 0; i < local_nx * (nc / n[0]); ++i)	       for (k = 0; k < howmany; ++k)		    CHECK(compute_error(out3 + i * nhc * 2 * istride + k,					istride,					(fftw_real *)					(in2 + local_x_start*(N/n[0])					 + i * nr), 2,					nr) < TOLERANCE,			  "in-place (c2r): wrong answer (check 2)");     }     rfftwnd_mpi_destroy_plan(p);     rfftwnd_mpi_destroy_plan(ip);     fftw_free(work);     fftw_free(out2);     fftw_free(in2);     fftw_free(in1);}void testnd_correctness(struct size sz, fftw_direction dir,			int alt_api, int specific, int force_buf){     fftwnd_plan validated_plan;     if (dir != FFTW_FORWARD)	  return;     if (force_buf)	  return;     validated_plan = fftwnd_create_plan(sz.rank, sz.narray, 					 dir, measure_flag | wisdom_flag);     CHECK(validated_plan != NULL, "can't create plan");     testnd_in_place(sz.rank, sz.narray,		     validated_plan, alt_api, specific);     fftwnd_destroy_plan(validated_plan);}/************************************************* * planner tests *************************************************/void test_planner(int rank){     /*      * create and destroy many plans, at random.  Check the      * garbage-collecting allocator of twiddle factors      */     int i, dim;     int r, s;     rfftwnd_mpi_plan pnd[PLANNER_TEST_SIZE];     int *narr, maxdim;     chk_mem_leak = 0;     verbose--;     please_wait();     if (rank < 2)          rank = 2;     narr = (int *) fftw_malloc(rank * sizeof(int));     for (i = 0; i < PLANNER_TEST_SIZE; ++i) {          pnd[i] = (rfftwnd_mpi_plan) 0;     }     maxdim = (int) pow(8192, 1.0/rank);     for (i = 0; i < PLANNER_TEST_SIZE * PLANNER_TEST_SIZE; ++i) {          r = rand();          if (r < 0)               r = -r;          r = r % PLANNER_TEST_SIZE;          for (dim = 0; dim < rank; ++dim) {               do {                    s = rand();                    if (s < 0)                         s = -s;                    s = s % maxdim + 1;               } while (s == 0);               narr[dim] = s;          }	  if (rank > 1) {	       if (pnd[r])		    rfftwnd_mpi_destroy_plan(pnd[r]);	       	       pnd[r] = rfftwnd_mpi_create_plan(MPI_COMM_WORLD, rank, narr,					       random_dir(), measure_flag |					       wisdom_flag);	  }          if (i % (PLANNER_TEST_SIZE * PLANNER_TEST_SIZE / 20) == 0) {               WHEN_VERBOSE(0, my_printf("test planner: so far so good\n"));               WHEN_VERBOSE(0, my_printf("test planner: iteration %d"					 " out of %d\n",                              i, PLANNER_TEST_SIZE * PLANNER_TEST_SIZE));          }     }     for (i = 0; i < PLANNER_TEST_SIZE; ++i) {          if (pnd[i])               rfftwnd_mpi_destroy_plan(pnd[i]);     }     fftw_free(narr);     verbose++;     chk_mem_leak = 1;}/************************************************* * test initialization *************************************************/void test_init(int *argc, char ***argv){     unsigned int seed;     MPI_Init(argc,argv);     MPI_Comm_size(MPI_COMM_WORLD,&ncpus);     MPI_Comm_rank(MPI_COMM_WORLD,&my_cpu);     /* Only process 0 gets to do I/O: */     io_okay = my_cpu == 0;     /* Make sure all processes use the same seed for random numbers: */     seed = time(NULL);     MPI_Bcast(&seed, 1, MPI_INT, 0, MPI_COMM_WORLD);     srand(seed);     fftw_die_hook = fftw_mpi_die; /* call MPI_Abort on failure */}void test_finish(void){     MPI_Finalize();}void enter_paranoid_mode(void){}/* in MPI, only process 0 is guaranteed to have access to the argument list */int get_option(int argc, char **argv, char *argval, int argval_maxlen){     int c;     int arglen;     if (io_okay) {	  c = default_get_option(argc,argv,argval,argval_maxlen);	  arglen = strlen(argval) + 1;     }     MPI_Bcast(&c, 1, MPI_INT, 0, MPI_COMM_WORLD);     MPI_Bcast(&arglen, 1, MPI_INT, 0, MPI_COMM_WORLD);     MPI_Bcast(argval, arglen, MPI_CHAR, 0, MPI_COMM_WORLD);     return c;}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -