⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 fftw_mpi.h

📁 FFTW, a collection of fast C routines to compute the Discrete Fourier Transform in one or more dimensions
💻 H
字号:
/* * Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA * */#ifndef FFTW_MPI_H#define FFTW_MPI_H#include "fftw.h"#include <mpi.h> /* need access to the MPI type definitions */#ifdef __cplusplusextern "C" {#endif /* __cplusplus *//***********************************************************************/typedef fftw_real TRANSPOSE_EL_TYPE;typedef struct {     int block_num, dest_pe, send_size, recv_size;} transpose_mpi_exchange;typedef struct {     MPI_Comm comm;     int n_pes, my_pe;          int nx,ny,local_nx,local_ny;     transpose_mpi_exchange *exchange;     int num_steps, send_block_size, recv_block_size;     MPI_Datatype el_type;     MPI_Request request[2];     int *perm_block_dest;     int num_perm_blocks, perm_block_size;     int all_blocks_equal;     int *send_block_sizes, *send_block_offsets;     int *recv_block_sizes, *recv_block_offsets;     char *move;     int move_size;} transpose_mpi_plan_struct;typedef transpose_mpi_plan_struct *transpose_mpi_plan;extern void transpose_mpi_get_local_size(int n, int my_pe, int n_pes,					 int *local_n, int *local_start);extern int transpose_mpi_get_local_storage_size(int nx, int ny,						int my_pe, int n_pes);extern transpose_mpi_plan transpose_mpi_create_plan(int nx, int ny,						    MPI_Comm comm);extern void 
transpose_mpi_destroy_plan(transpose_mpi_plan p);extern void transpose_mpi(transpose_mpi_plan p, int el_size,			  TRANSPOSE_EL_TYPE *local_data,			  TRANSPOSE_EL_TYPE *work);typedef enum { BEFORE_TRANSPOSE, AFTER_TRANSPOSE } transpose_in_place_which;typedef enum { TRANSPOSE_SYNC, TRANSPOSE_ASYNC } transpose_sync_type;extern void transpose_in_place_local(transpose_mpi_plan p,                              int el_size, TRANSPOSE_EL_TYPE *local_data,                              transpose_in_place_which which);extern TRANSPOSE_EL_TYPE *transpose_allocate_send_buf(transpose_mpi_plan p,						      int el_size);extern void transpose_get_send_block(transpose_mpi_plan p, int step,				     int *block_y_start, int *block_ny);extern void transpose_start_exchange_step(transpose_mpi_plan p,					  int el_size,					  TRANSPOSE_EL_TYPE *local_data,					  TRANSPOSE_EL_TYPE *send_buf,					  int step,					  transpose_sync_type sync_type);extern void transpose_finish_exchange_step(transpose_mpi_plan p, int step);/***********************************************************************/typedef struct {     fftw_plan p_fft_x;  /* plan for first dimension */     fftwnd_plan p_fft;  /* plan for subsequent dimensions */     transpose_mpi_plan p_transpose, p_transpose_inv;     fftw_complex *work; /* extra workspace, if needed */} fftwnd_mpi_plan_data;typedef fftwnd_mpi_plan_data *fftwnd_mpi_plan;typedef enum {    FFTW_NORMAL_ORDER,    FFTW_TRANSPOSED_ORDER} fftwnd_mpi_output_order;extern fftwnd_mpi_plan fftwnd_mpi_create_plan(MPI_Comm comm,					      int rank, const int *n,					      fftw_direction dir,					      int flags);extern fftwnd_mpi_plan fftw2d_mpi_create_plan(MPI_Comm comm,					      int nx, int ny,					  fftw_direction dir, int flags);extern fftwnd_mpi_plan fftw3d_mpi_create_plan(MPI_Comm comm,					      int nx, int ny, int nz,					  fftw_direction dir, int flags);extern void fftwnd_mpi_destroy_plan(fftwnd_mpi_plan p);extern void fftwnd_mpi_local_sizes(fftwnd_mpi_plan p,				   int 
*local_nx,				   int *local_x_start,				   int *local_ny_after_transpose,				   int *local_y_start_after_transpose,				   int *total_local_size);extern void fftwnd_mpi(fftwnd_mpi_plan p,		       int n_fields,		       fftw_complex *local_data, fftw_complex *work,		       fftwnd_mpi_output_order output_order);extern void fftw_mpi_die(const char *error_string);/***********************************************************************/typedef struct fftw_mpi_twiddle_struct {     int rows, rowstart, cols, n;     fftw_complex *W;     int refcount;     struct fftw_mpi_twiddle_struct *next;} fftw_mpi_twiddle;typedef struct fftw_mpi_plan_struct {     int n, m, r, local_m, local_m_start, local_r, local_r_start;     fftw_complex *fft_work;     fftw_mpi_twiddle *tw;     transpose_mpi_plan p_transpose, p_transpose_inv;     fftw_plan pm, pr;     int flags;     fftw_direction dir;} *fftw_mpi_plan;/* new flags for the MPI planner: */#define FFTW_SCRAMBLED_INPUT (8192)#define FFTW_SCRAMBLED_OUTPUT (16384)extern void fftw_mpi_local_sizes(fftw_mpi_plan p,				 int *local_n,				 int *local_start,				 int *local_n_after_transform,				 int *local_start_after_transform,				 int *total_local_size);extern fftw_mpi_plan fftw_mpi_create_plan(MPI_Comm comm,					  int n,					  fftw_direction dir, int flags);extern void fftw_mpi_destroy_plan(fftw_mpi_plan p);extern void fftw_mpi(fftw_mpi_plan p, int n_fields,		     fftw_complex *local_data, fftw_complex *work);extern void fftw_mpi_print_plan(fftw_mpi_plan p);/***********************************************************************/#ifdef __cplusplus} /* extern "C" */#endif /* __cplusplus */#endif /* FFTW_MPI_H */

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -