📄 rfftw_mpi_test.c
字号:
{ WHEN_VERBOSE(2, printf("TEST CORRECTNESS (in place, FFTW_FORWARD, %s) " "n = %d istride = %d howmany = %d\n", SPECIFICP(0), n, istride, howmany)); test_in_place(n, istride, howmany, FFTW_FORWARD, validated_plan_forward, 0); WHEN_VERBOSE(2, printf("TEST CORRECTNESS (in place, FFTW_BACKWARD, %s) " "n = %d istride = %d howmany = %d\n", SPECIFICP(0), n, istride, howmany)); test_in_place(n, istride, howmany, FFTW_BACKWARD, validated_plan_backward, 0);}void test_correctness(int n){}/************************************************* * multi-dimensional correctness tests *************************************************/void testnd_out_of_place(int rank, int *n, fftwnd_plan validated_plan){}void testnd_in_place(int rank, int *n, fftwnd_plan validated_plan, int alternate_api, int specific){ int local_nx, local_x_start, local_ny_after_transpose, local_y_start_after_transpose, total_local_size; int istride, ostride, howmany; int N, dim, i, j, k; int nc, nhc, nr; fftw_real *in1, *out3, *work = 0; fftw_complex *in2, *out1, *out2; rfftwnd_mpi_plan p = 0, ip = 0; int flags = measure_flag | wisdom_flag | FFTW_IN_PLACE; if (specific || rank < 2) return; if (coinflip()) flags |= FFTW_THREADSAFE; N = nc = nr = nhc = 1; for (dim = 0; dim < rank; ++dim) N *= n[dim]; if (rank > 0) { nr = n[rank - 1]; nc = N / nr; nhc = nr / 2 + 1; } if (alternate_api && (rank == 2 || rank == 3)) { if (rank == 2) { p = rfftw2d_mpi_create_plan(MPI_COMM_WORLD, n[0], n[1], FFTW_REAL_TO_COMPLEX, flags); ip = rfftw2d_mpi_create_plan(MPI_COMM_WORLD, n[0], n[1], FFTW_COMPLEX_TO_REAL, flags); } else { p = rfftw3d_mpi_create_plan(MPI_COMM_WORLD, n[0], n[1], n[2], FFTW_REAL_TO_COMPLEX, flags); ip = rfftw3d_mpi_create_plan(MPI_COMM_WORLD, n[0], n[1], n[2], FFTW_COMPLEX_TO_REAL, flags); } } else { p = rfftwnd_mpi_create_plan(MPI_COMM_WORLD, rank, n, FFTW_REAL_TO_COMPLEX, flags); ip = rfftwnd_mpi_create_plan(MPI_COMM_WORLD, rank, n, FFTW_COMPLEX_TO_REAL, flags); } CHECK(p != NULL && ip != NULL, "can't create plan"); rfftwnd_mpi_local_sizes(p, &local_nx, &local_x_start, &local_ny_after_transpose, &local_y_start_after_transpose, &total_local_size); in1 = (fftw_real *) fftw_malloc(total_local_size * MAX_STRIDE * sizeof(fftw_real)); if (coinflip()) { WHEN_VERBOSE(1, my_printf("w/work...")); work = (fftw_real *) fftw_malloc(total_local_size * MAX_STRIDE * sizeof(fftw_real)); } out3 = in1; out1 = (fftw_complex *) in1; in2 = (fftw_complex *) fftw_malloc(N * sizeof(fftw_complex)); out2 = (fftw_complex *) fftw_malloc(N * sizeof(fftw_complex)); for (i = 0; i < total_local_size * MAX_STRIDE; ++i) out3[i] = 0; for (istride = 1; istride <= MAX_STRIDE; ++istride) { /* generate random inputs */ for (i = 0; i < nc; ++i) for (j = 0; j < nr; ++j) { c_re(in2[i * nr + j]) = DRAND(); c_im(in2[i * nr + j]) = 0.0; } for (i = 0; i < local_nx * (nc / n[0]); ++i) for (j = 0; j < nr; ++j) { for (k = 0; k < istride; ++k) in1[(i * nhc * 2 + j) * istride + k] = c_re((in2 + local_x_start * (N/n[0])) [i * nr + j]); } fftwnd(validated_plan, 1, in2, 1, 1, out2, 1, 1); howmany = ostride = istride; WHEN_VERBOSE(2, printf("\n testing in-place stride %d...", istride)); rfftwnd_mpi(p, howmany, in1, work, FFTW_NORMAL_ORDER); for (i = 0; i < local_nx * (nc / n[0]); ++i) for (k = 0; k < howmany; ++k) CHECK(compute_error_complex(out1 + i * nhc * ostride + k, ostride, out2 + local_x_start*(N/n[0]) + i * nr, 1, nhc) < TOLERANCE, "in-place (r2c): wrong answer"); rfftwnd_mpi(ip, howmany, in1, work, FFTW_NORMAL_ORDER); for (i = 0; i < total_local_size * istride; ++i) out3[i] *= 1.0 / N; for (i = 0; i < local_nx * (nc / n[0]); ++i) for (k = 0; k < howmany; ++k) CHECK(compute_error(out3 + i * nhc * 2 * istride + k, istride, (fftw_real *) (in2 + local_x_start*(N/n[0]) + i * nr), 2, nr) < TOLERANCE, "in-place (c2r): wrong answer (check 2)"); } rfftwnd_mpi_destroy_plan(p); rfftwnd_mpi_destroy_plan(ip); fftw_free(work); fftw_free(out2); fftw_free(in2); fftw_free(in1);}void testnd_correctness(struct size sz, fftw_direction dir, int alt_api, int specific, int force_buf){ fftwnd_plan validated_plan; if (dir != FFTW_FORWARD) return; if (force_buf) return; validated_plan = fftwnd_create_plan(sz.rank, sz.narray, dir, measure_flag | wisdom_flag); CHECK(validated_plan != NULL, "can't create plan"); testnd_in_place(sz.rank, sz.narray, validated_plan, alt_api, specific); fftwnd_destroy_plan(validated_plan);}/************************************************* * planner tests *************************************************/void test_planner(int rank){ /* * create and destroy many plans, at random. Check the * garbage-collecting allocator of twiddle factors */ int i, dim; int r, s; rfftwnd_mpi_plan pnd[PLANNER_TEST_SIZE]; int *narr, maxdim; chk_mem_leak = 0; verbose--; please_wait(); if (rank < 2) rank = 2; narr = (int *) fftw_malloc(rank * sizeof(int)); for (i = 0; i < PLANNER_TEST_SIZE; ++i) { pnd[i] = (rfftwnd_mpi_plan) 0; } maxdim = (int) pow(8192, 1.0/rank); for (i = 0; i < PLANNER_TEST_SIZE * PLANNER_TEST_SIZE; ++i) { r = rand(); if (r < 0) r = -r; r = r % PLANNER_TEST_SIZE; for (dim = 0; dim < rank; ++dim) { do { s = rand(); if (s < 0) s = -s; s = s % maxdim + 1; } while (s == 0); narr[dim] = s; } if (rank > 1) { if (pnd[r]) rfftwnd_mpi_destroy_plan(pnd[r]); pnd[r] = rfftwnd_mpi_create_plan(MPI_COMM_WORLD, rank, narr, random_dir(), measure_flag | wisdom_flag); } if (i % (PLANNER_TEST_SIZE * PLANNER_TEST_SIZE / 20) == 0) { WHEN_VERBOSE(0, my_printf("test planner: so far so good\n")); WHEN_VERBOSE(0, my_printf("test planner: iteration %d" " out of %d\n", i, PLANNER_TEST_SIZE * PLANNER_TEST_SIZE)); } } for (i = 0; i < PLANNER_TEST_SIZE; ++i) { if (pnd[i]) rfftwnd_mpi_destroy_plan(pnd[i]); } fftw_free(narr); verbose++; chk_mem_leak = 1;}/************************************************* * test initialization *************************************************/void test_init(int *argc, char ***argv){ unsigned int seed; MPI_Init(argc,argv); MPI_Comm_size(MPI_COMM_WORLD,&ncpus); MPI_Comm_rank(MPI_COMM_WORLD,&my_cpu); /* Only process 0 gets to do I/O: */ io_okay = my_cpu == 0; /* Make sure all processes use the same seed for random numbers: */ seed = time(NULL); MPI_Bcast(&seed, 1, MPI_INT, 0, MPI_COMM_WORLD); srand(seed); fftw_die_hook = fftw_mpi_die; /* call MPI_Abort on failure */}void test_finish(void){ MPI_Finalize();}void enter_paranoid_mode(void){}/* in MPI, only process 0 is guaranteed to have access to the argument list */int get_option(int argc, char **argv, char *argval, int argval_maxlen){ int c; int arglen; if (io_okay) { c = default_get_option(argc,argv,argval,argval_maxlen); arglen = strlen(argval) + 1; } MPI_Bcast(&c, 1, MPI_INT, 0, MPI_COMM_WORLD); MPI_Bcast(&arglen, 1, MPI_INT, 0, MPI_COMM_WORLD); MPI_Bcast(argval, arglen, MPI_CHAR, 0, MPI_COMM_WORLD); return c;}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -