/usr/include/fftw_mpi.h is in fftw-dev 2.1.5-4.2.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 | /*
* Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*
*/
#ifndef FFTW_MPI_H
#define FFTW_MPI_H
#include "fftw.h"
#include <mpi.h> /* need access to the MPI type definitions */
#ifdef __cplusplus
extern "C" {
#endif /* __cplusplus */
/***********************************************************************/
typedef fftw_real TRANSPOSE_EL_TYPE;
typedef struct {
int block_num, dest_pe, send_size, recv_size;
} transpose_mpi_exchange;
typedef struct {
MPI_Comm comm;
int n_pes, my_pe;
int nx,ny,local_nx,local_ny;
transpose_mpi_exchange *exchange;
int num_steps, send_block_size, recv_block_size;
MPI_Datatype el_type;
MPI_Request request[2];
int *perm_block_dest;
int num_perm_blocks, perm_block_size;
int all_blocks_equal;
int *send_block_sizes, *send_block_offsets;
int *recv_block_sizes, *recv_block_offsets;
char *move;
int move_size;
} transpose_mpi_plan_struct;
typedef transpose_mpi_plan_struct *transpose_mpi_plan;
extern void transpose_mpi_get_local_size(int n, int my_pe, int n_pes,
int *local_n, int *local_start);
extern int transpose_mpi_get_local_storage_size(int nx, int ny,
int my_pe, int n_pes);
extern transpose_mpi_plan transpose_mpi_create_plan(int nx, int ny,
MPI_Comm comm);
extern void transpose_mpi_destroy_plan(transpose_mpi_plan p);
extern void transpose_mpi(transpose_mpi_plan p, int el_size,
TRANSPOSE_EL_TYPE *local_data,
TRANSPOSE_EL_TYPE *work);
typedef enum { BEFORE_TRANSPOSE, AFTER_TRANSPOSE } transpose_in_place_which;
typedef enum { TRANSPOSE_SYNC, TRANSPOSE_ASYNC } transpose_sync_type;
extern void transpose_in_place_local(transpose_mpi_plan p,
int el_size, TRANSPOSE_EL_TYPE *local_data,
transpose_in_place_which which);
extern TRANSPOSE_EL_TYPE *transpose_allocate_send_buf(transpose_mpi_plan p,
int el_size);
extern void transpose_get_send_block(transpose_mpi_plan p, int step,
int *block_y_start, int *block_ny);
extern void transpose_start_exchange_step(transpose_mpi_plan p,
int el_size,
TRANSPOSE_EL_TYPE *local_data,
TRANSPOSE_EL_TYPE *send_buf,
int step,
transpose_sync_type sync_type);
extern void transpose_finish_exchange_step(transpose_mpi_plan p, int step);
/***********************************************************************/
typedef struct {
fftw_plan p_fft_x; /* plan for first dimension */
fftwnd_plan p_fft; /* plan for subsequent dimensions */
transpose_mpi_plan p_transpose, p_transpose_inv;
fftw_complex *work; /* extra workspace, if needed */
} fftwnd_mpi_plan_data;
typedef fftwnd_mpi_plan_data *fftwnd_mpi_plan;
typedef enum {
FFTW_NORMAL_ORDER,
FFTW_TRANSPOSED_ORDER
} fftwnd_mpi_output_order;
extern fftwnd_mpi_plan fftwnd_mpi_create_plan(MPI_Comm comm,
int rank, const int *n,
fftw_direction dir,
int flags);
extern fftwnd_mpi_plan fftw2d_mpi_create_plan(MPI_Comm comm,
int nx, int ny,
fftw_direction dir, int flags);
extern fftwnd_mpi_plan fftw3d_mpi_create_plan(MPI_Comm comm,
int nx, int ny, int nz,
fftw_direction dir, int flags);
extern void fftwnd_mpi_destroy_plan(fftwnd_mpi_plan p);
extern void fftwnd_mpi_local_sizes(fftwnd_mpi_plan p,
int *local_nx,
int *local_x_start,
int *local_ny_after_transpose,
int *local_y_start_after_transpose,
int *total_local_size);
extern void fftwnd_mpi(fftwnd_mpi_plan p,
int n_fields,
fftw_complex *local_data, fftw_complex *work,
fftwnd_mpi_output_order output_order);
extern void fftw_mpi_die(const char *error_string);
/***********************************************************************/
typedef struct fftw_mpi_twiddle_struct {
int rows, rowstart, cols, n;
fftw_complex *W;
int refcount;
struct fftw_mpi_twiddle_struct *next;
} fftw_mpi_twiddle;
typedef struct fftw_mpi_plan_struct {
int n, m, r, local_m, local_m_start, local_r, local_r_start;
fftw_complex *fft_work;
fftw_mpi_twiddle *tw;
transpose_mpi_plan p_transpose, p_transpose_inv;
fftw_plan pm, pr;
int flags;
fftw_direction dir;
} *fftw_mpi_plan;
/* new flags for the MPI planner: */
#define FFTW_SCRAMBLED_INPUT (8192)
#define FFTW_SCRAMBLED_OUTPUT (16384)
extern void fftw_mpi_local_sizes(fftw_mpi_plan p,
int *local_n,
int *local_start,
int *local_n_after_transform,
int *local_start_after_transform,
int *total_local_size);
extern fftw_mpi_plan fftw_mpi_create_plan(MPI_Comm comm,
int n,
fftw_direction dir, int flags);
extern void fftw_mpi_destroy_plan(fftw_mpi_plan p);
extern void fftw_mpi(fftw_mpi_plan p, int n_fields,
fftw_complex *local_data, fftw_complex *work);
extern void fftw_mpi_print_plan(fftw_mpi_plan p);
/***********************************************************************/
#ifdef __cplusplus
} /* extern "C" */
#endif /* __cplusplus */
#endif /* FFTW_MPI_H */
|