Tinker9 70bd052 (Thu Nov 9 12:11:35 2023 -0800)
Loading...
Searching...
No Matches
parallelcu.h
#pragma once
#include <cstddef>

/// Declarations of the `_cu`-suffixed parallel array helpers.
///
/// Only declarations live in this header; the template definitions are not
/// visible here, so the behavioral notes below are inferred from the names
/// and signatures and should be confirmed against the implementation.
namespace tinker {
/// Presumably returns the sum of the `nelem` elements of `a`
/// (inferred from the name -- confirm against the definition).
/// @tparam T      Element type; also the return type.
/// @param  a      Pointer to the read-only input elements.
/// @param  nelem  Element count.
/// @param  queue  Integer queue identifier; its meaning is defined by the
///                implementation (NOTE(review): looks like an asynchronous
///                queue/stream id -- confirm).
template <class T>
T reduceSum_cu(const T* a, std::size_t nelem, int queue);

/// Presumably a multi-component sum that writes `HN` results into `h_ans`
/// (inferred from the name -- confirm against the definition).
/// @tparam HT     Element type of the fixed-size result array.
/// @tparam HN     Length of the result array, deduced from the argument.
/// @tparam DPTR   Type of the input handle `v` (left generic by this header).
/// @param  h_ans  Reference to an `HT[HN]` array receiving the results.
/// @param  v      Input data handle.
/// @param  nelem  Element count.
/// @param  queue  Integer queue identifier (see reduceSum_cu).
template <class HT, std::size_t HN, class DPTR>
void reduceSum2_cu(HT (&h_ans)[HN], DPTR v, std::size_t nelem, int queue);

/// Counterpart of reduceSum_cu that takes an output pointer instead of
/// returning a value. Parameters are unnamed in the declaration; by analogy
/// with reduceSum_cu they are presumably (result, input, element count,
/// queue) -- TODO confirm. The name suggests the result stays on the device.
template <class T>
void reduceSumOnDevice_cu(T*, const T*, std::size_t, int);

/// Counterpart of reduceSum2_cu with the same parameter types. Parameters
/// are unnamed; presumably (result array, input handle, element count,
/// queue) -- TODO confirm where the results are stored.
template <class HT, std::size_t HN, class DPTR>
void reduceSum2OnDevice_cu(HT (&)[HN], DPTR, std::size_t, int);

/// Presumably computes the dot product of `a` and `b` over `nelem` elements
/// and stores it through `ans` (inferred from the name -- confirm).
/// @param ans    Pointer receiving the result.
/// @param a      Pointer to the first read-only input.
/// @param b      Pointer to the second read-only input.
/// @param nelem  Element count.
/// @param queue  Integer queue identifier (see reduceSum_cu).
template <class T>
void dotProd_cu(T* ans, const T* a, const T* b, std::size_t nelem, int queue);

/// Presumably multiplies each of the `nelem` elements of `dst` by `scal`
/// in place (inferred from the name -- confirm).
/// @param dst    Pointer to the mutable array.
/// @param scal   Scalar factor, passed by value.
/// @param nelem  Element count.
/// @param queue  Integer queue identifier (see reduceSum_cu).
template <class T>
void scaleArray_cu(T* dst, T scal, std::size_t nelem, int queue);
} // namespace tinker
Definition: testrt.h:9
void dotProd_cu(T *ans, const T *a, const T *b, size_t nelem, int queue)
void reduceSum2_cu(HT(&h_ans)[HN], DPTR v, size_t nelem, int queue)
void reduceSumOnDevice_cu(T *, const T *, size_t, int)
void scaleArray_cu(T *dst, T scal, size_t nelem, int queue)
void reduceSum2OnDevice_cu(HT(&)[HN], DPTR, size_t, int)
T reduceSum_cu(const T *a, size_t nelem, int queue)