-
Notifications
You must be signed in to change notification settings - Fork 12
/
Copy pathtransform.hpp
318 lines (277 loc) · 11.8 KB
/
transform.hpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
/*
* Copyright (c) 2019 ETH Zurich, Simon Frasch
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* 1. Redistributions of source code must retain the above copyright notice,
* this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. Neither the name of the copyright holder nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef SPFFT_TRANSFORM_HPP
#define SPFFT_TRANSFORM_HPP
#include <memory>
#include "spfft/config.h"
#include "spfft/types.h"
#ifdef SPFFT_MPI
#include <mpi.h>
#endif
namespace spfft {
// Forward declarations of types that are not defined in this header. Within this header they are
// only named in friend declarations and as std::shared_ptr template arguments, so complete
// definitions are not required here.
template <typename T>
class SPFFT_NO_EXPORT TransformInternal;
class SPFFT_EXPORT Grid;
template <typename TransformType>
class SPFFT_NO_EXPORT MultiTransformInternal;
template <typename T>
class SPFFT_NO_EXPORT GridInternal;
/**
* A transform in double precision with fixed dimensions. Shares memory with other transforms
* created from the same Grid object.
*
* The class only holds a shared handle to its internal implementation, so copies of a Transform
* refer to the same internal transform. Use clone() to obtain an independent transform.
*/
class SPFFT_EXPORT Transform {
public:
/**
* Scalar type of the data handled by this transform (double precision).
*/
using ValueType = double;
/**
* Create a transform without a grid handle.
* Thread-safe if no FFTW calls are executed concurrently.
*
* @param[in] maxNumThreads The maximum number of threads to use.
* @param[in] processingUnit The processing unit type to use. Must be either SPFFT_PU_HOST or
* SPFFT_PU_GPU.
* @param[in] transformType The transform type (complex to complex or real to complex). Can be
* SPFFT_TRANS_C2C or SPFFT_TRANS_R2C.
* @param[in] dimX The dimension in x.
* @param[in] dimY The dimension in y.
* @param[in] dimZ The dimension in z.
* @param[in] numLocalElements The number of elements in frequency domain.
* @param[in] indexFormat The index format. Only SPFFT_INDEX_TRIPLETS currently supported.
* @param[in] indices Pointer to frequency indices. Centered indexing is allowed.
*/
Transform(int maxNumThreads, SpfftProcessingUnitType processingUnit,
SpfftTransformType transformType, int dimX, int dimY, int dimZ, int numLocalElements,
SpfftIndexFormatType indexFormat, const int* indices);
#ifdef SPFFT_MPI
/**
* Create a distributed transform without a grid handle.
* Thread-safe if no FFTW calls are executed concurrently.
* Only available if SPFFT_MPI is defined.
*
* @param[in] maxNumThreads The maximum number of threads to use.
* @param[in] comm The MPI communicator to use. Will be duplicated for internal use.
* @param[in] exchangeType The type of MPI exchange to use. Possible values are
* SPFFT_EXCH_DEFAULT, SPFFT_EXCH_BUFFERED, SPFFT_EXCH_COMPACT_BUFFERED and SPFFT_EXCH_UNBUFFERED.
* @param[in] processingUnit The processing unit type to use. Must be either SPFFT_PU_HOST or
* SPFFT_PU_GPU.
* @param[in] transformType The transform type (complex to complex or real to complex). Can be
* SPFFT_TRANS_C2C or SPFFT_TRANS_R2C.
* @param[in] dimX The dimension in x.
* @param[in] dimY The dimension in y.
* @param[in] dimZ The dimension in z.
* @param[in] localZLength The length in z in space domain of the local MPI rank.
* @param[in] numLocalElements The number of elements in frequency domain of the local MPI
* rank.
* @param[in] indexFormat The index format. Only SPFFT_INDEX_TRIPLETS currently supported.
* @param[in] indices Pointer to frequency indices. Centered indexing is allowed.
*/
Transform(int maxNumThreads, MPI_Comm comm, SpfftExchangeType exchangeType,
SpfftProcessingUnitType processingUnit, SpfftTransformType transformType, int dimX,
int dimY, int dimZ, int localZLength, int numLocalElements,
SpfftIndexFormatType indexFormat, const int* indices);
#endif
/**
* Default copy constructor.
* The copy refers to the same internal transform as the source (the handle is shared, not
* duplicated). Use clone() for an independent transform.
*/
Transform(const Transform&) = default;
/**
* Default move constructor.
*/
Transform(Transform&&) = default;
/**
* Default copy assignment operator.
* After assignment, both objects refer to the same internal transform. Use clone() for an
* independent transform.
*/
Transform& operator=(const Transform&) = default;
/**
* Default move assignment operator.
*/
Transform& operator=(Transform&&) = default;
/**
* Clone transform.
*
* @return Independent transform with the same parameters, but with new underlying grid.
*/
Transform clone() const;
/**
* Access a transform parameter.
* @return Type of transform.
*/
SpfftTransformType type() const;
/**
* Access a transform parameter.
* @return Dimension in x.
*/
int dim_x() const;
/**
* Access a transform parameter.
* @return Dimension in y.
*/
int dim_y() const;
/**
* Access a transform parameter.
* @return Dimension in z.
*/
int dim_z() const;
/**
* Access a transform parameter.
* @return Length in z of the space domain slice held by the local MPI rank.
*/
int local_z_length() const;
/**
* Access a transform parameter.
* @return Offset in z of the space domain slice held by the local MPI rank.
*/
int local_z_offset() const;
/**
* Access a transform parameter.
* @return Number of elements in the space domain slice held by the local MPI rank.
*/
int local_slice_size() const;
/**
* Access a transform parameter.
* @return Global number of elements in space domain. Equals dim_x() * dim_y() * dim_z().
*/
long long int global_size() const;
/**
* Access a transform parameter.
* @return Number of elements in frequency domain.
*/
int num_local_elements() const;
/**
* Access a transform parameter.
* @return Global number of elements in frequency domain.
*/
long long int num_global_elements() const;
/**
* Access a transform parameter.
* @return The processing unit used for calculations. Can be SPFFT_PU_HOST or SPFFT_PU_GPU.
*/
SpfftProcessingUnitType processing_unit() const;
/**
* Access a transform parameter.
* @return The GPU device id used. Always returns 0 if no GPU support is enabled.
*/
int device_id() const;
/**
* Access a transform parameter.
* @return The exact number of threads used by this transform. May be less than the maximum given
* to the constructor. Always 1, if not compiled with OpenMP support.
*/
int num_threads() const;
/**
* Access a transform parameter.
* @return The execution mode. Only affects execution on GPU. Defaults to SPFFT_EXEC_SYNCHRONOUS.
*/
SpfftExecType execution_mode() const;
/**
* Set a transform parameter.
* @param[in] mode The execution mode to change to. Only affects execution on GPU.
* Defaults to SPFFT_EXEC_SYNCHRONOUS.
*/
void set_execution_mode(SpfftExecType mode);
#ifdef SPFFT_MPI
/**
* Access a transform parameter.
* Only available if SPFFT_MPI is defined.
* @return The internal MPI communicator.
*/
MPI_Comm communicator() const;
#endif
/**
* Provides access to the space domain data.
*
* @param[in] dataLocation The processing unit to query for the data. Can be SPFFT_PU_HOST or
* SPFFT_PU_GPU (if GPU is set as processing unit).
* @return Pointer to space domain data on given processing unit. Alignment is guaranteed to
* fulfill requirements for std::complex and C language complex types.
* @throw GenericError SpFFT error. Can be a derived type.
* @throw std::exception Error from standard library calls. Can be a derived type.
*/
double* space_domain_data(SpfftProcessingUnitType dataLocation);
/**
* Execute a forward transform from space domain to frequency domain.
* The input is taken from the space domain data of this transform at the given location.
*
* @param[in] inputLocation The processing unit, to take the input from. Can be SPFFT_PU_HOST or
* SPFFT_PU_GPU (if GPU is set as processing unit).
* @param[out] output Pointer to memory, where the frequency domain elements are written to. Can
* be located at Host or GPU memory (if GPU is set as processing unit).
* @param[in] scaling Controls scaling of output. SPFFT_NO_SCALING to disable or
* SPFFT_FULL_SCALING to scale by factor 1 / (dim_x() * dim_y() * dim_z()).
* @throw GenericError SpFFT error. Can be a derived type.
* @throw std::exception Error from standard library calls. Can be a derived type.
*/
void forward(SpfftProcessingUnitType inputLocation, double* output,
SpfftScalingType scaling = SPFFT_NO_SCALING);
/**
* Execute a forward transform from space domain to frequency domain.
* The input is read from caller-provided memory.
*
* @param[in] input Pointer to memory, to read space domain data from. Can
* be located at Host or GPU memory (if GPU is set as processing unit).
* @param[out] output Pointer to memory, where the frequency domain elements are written to. Can
* be located at Host or GPU memory (if GPU is set as processing unit).
* @param[in] scaling Controls scaling of output. SPFFT_NO_SCALING to disable or
* SPFFT_FULL_SCALING to scale by factor 1 / (dim_x() * dim_y() * dim_z()).
* @throw GenericError SpFFT error. Can be a derived type.
* @throw std::exception Error from standard library calls. Can be a derived type.
*/
void forward(const double* input, double* output, SpfftScalingType scaling = SPFFT_NO_SCALING);
/**
* Execute a backward transform from frequency domain to space domain.
* The result is placed in the space domain data of this transform at the given location.
*
* @param[in] input Input data in frequency domain. Must match the indices provided at transform
* creation. Can be located at Host or GPU memory, if GPU is set as processing unit.
* @param[in] outputLocation The processing unit, to place the output at. Can be SPFFT_PU_HOST or
* SPFFT_PU_GPU (if GPU is set as processing unit).
* @throw GenericError SpFFT error. Can be a derived type.
* @throw std::exception Error from standard library calls. Can be a derived type.
*/
void backward(const double* input, SpfftProcessingUnitType outputLocation);
/**
* Execute a backward transform from frequency domain to space domain.
* The result is written to caller-provided memory.
*
* @param[in] input Input data in frequency domain. Must match the indices provided at transform
* creation. Can be located at Host or GPU memory, if GPU is set as processing unit.
* @param[out] output Pointer to memory to write output in space domain to. Can be located at
* Host or GPU memory, if GPU is set as processing unit.
* @throw GenericError SpFFT error. Can be a derived type.
* @throw std::exception Error from standard library calls. Can be a derived type.
*/
void backward(const double* input, double* output);
private:
/*! \cond PRIVATE */
// Friends are granted access to the private constructors and the internal handle below.
friend Grid;
friend MultiTransformInternal<Transform>;
// Construct a transform on top of an existing internal grid. Not exported from the library.
// NOTE(review): presumably the path used by Grid to create transforms that share its memory -
// confirm against the implementation.
SPFFT_NO_EXPORT Transform(const std::shared_ptr<GridInternal<double>>& grid,
SpfftProcessingUnitType processingUnit,
SpfftTransformType transformType, int dimX, int dimY, int dimZ,
int localZLength, int numLocalElements,
SpfftIndexFormatType indexFormat, const int* indices);
// Wrap an already existing internal transform. Explicit to avoid implicit conversion from a
// shared_ptr. Not exported from the library.
SPFFT_NO_EXPORT explicit Transform(std::shared_ptr<TransformInternal<double>> transform);
// Shared handle to the internal implementation; the only data member, so defaulted copies
// share it.
std::shared_ptr<TransformInternal<double>> transform_;
/*! \endcond */
};
} // namespace spfft
#endif