Added multi-GPU reductions. Tested to work with 1-2 GPUs with power of two grid dimensions. Requires more testing in special cases (when using exotic grid dimensions and a large number of GPUs)
This commit is contained in:
@@ -51,10 +51,16 @@ AcResult boundcondStep(const Device device, const StreamType stream_type,
|
||||
const int3& start, const int3& end);
|
||||
|
||||
/** */
|
||||
AcResult reduceScal(const Device device);
|
||||
AcResult reduceScal(const Device device, const StreamType stream_type, const ReductionType rtype,
|
||||
const VertexBufferHandle vtxbuf_handle, AcReal* result);
|
||||
|
||||
/** */
|
||||
AcResult reduceVec(const Device device);
|
||||
AcResult reduceVec(const Device device, const StreamType stream_type,
|
||||
const ReductionType rtype,
|
||||
const VertexBufferHandle vec0,
|
||||
const VertexBufferHandle vec1,
|
||||
const VertexBufferHandle vec2,
|
||||
AcReal* result);
|
||||
|
||||
/** */
|
||||
AcResult rkStep(const Device device, const StreamType stream_type, const int step_number,
|
||||
|
Reference in New Issue
Block a user