|
20 | 20 | //------------------------------------------------------------------------------ |
21 | 21 | // Interp |
22 | 22 | //------------------------------------------------------------------------------ |
23 | | -extern "C" __global__ void InterpAtPoints(const CeedInt num_elem, const CeedScalarCPU *__restrict__ c_B, const CeedInt *__restrict__ points_per_elem, |
24 | | - const CeedScalarCPU *__restrict__ d_X, const CeedScalarCPU *__restrict__ d_U, |
25 | | - CeedScalarCPU *__restrict__ d_V) { |
| 23 | +extern "C" __global__ void InterpAtPoints(const CeedInt num_elem, const CeedScalarBase *__restrict__ c_B, const CeedInt *__restrict__ points_per_elem, |
| 24 | + const CeedScalarBase *__restrict__ d_X, const CeedScalarBase *__restrict__ d_U, |
| 25 | + CeedScalarBase *__restrict__ d_V) { |
26 | 26 | extern __shared__ CeedScalar slice[]; |
27 | 27 |
|
28 | 28 | SharedData_Cuda data; |
@@ -76,9 +76,9 @@ extern "C" __global__ void InterpAtPoints(const CeedInt num_elem, const CeedScal |
76 | 76 | } |
77 | 77 | } |
78 | 78 |
|
79 | | -extern "C" __global__ void InterpTransposeAtPoints(const CeedInt num_elem, const CeedScalarCPU *__restrict__ c_B, |
80 | | - const CeedInt *__restrict__ points_per_elem, const CeedScalarCPU *__restrict__ d_X, |
81 | | - const CeedScalarCPU *__restrict__ d_U, CeedScalarCPU *__restrict__ d_V) { |
| 79 | +extern "C" __global__ void InterpTransposeAtPoints(const CeedInt num_elem, const CeedScalarBase *__restrict__ c_B, |
| 80 | + const CeedInt *__restrict__ points_per_elem, const CeedScalarBase *__restrict__ d_X, |
| 81 | + const CeedScalarBase *__restrict__ d_U, CeedScalarBase *__restrict__ d_V) { |
82 | 82 | extern __shared__ CeedScalar slice[]; |
83 | 83 |
|
84 | 84 | SharedData_Cuda data; |
@@ -146,9 +146,9 @@ extern "C" __global__ void InterpTransposeAtPoints(const CeedInt num_elem, const |
146 | 146 | } |
147 | 147 | } |
148 | 148 |
|
149 | | -extern "C" __global__ void InterpTransposeAddAtPoints(const CeedInt num_elem, const CeedScalarCPU *__restrict__ c_B, |
150 | | - const CeedInt *__restrict__ points_per_elem, const CeedScalarCPU *__restrict__ d_X, |
151 | | - const CeedScalarCPU *__restrict__ d_U, CeedScalarCPU *__restrict__ d_V) { |
| 149 | +extern "C" __global__ void InterpTransposeAddAtPoints(const CeedInt num_elem, const CeedScalarBase *__restrict__ c_B, |
| 150 | + const CeedInt *__restrict__ points_per_elem, const CeedScalarBase *__restrict__ d_X, |
| 151 | + const CeedScalarBase *__restrict__ d_U, CeedScalarBase *__restrict__ d_V) { |
152 | 152 | extern __shared__ CeedScalar slice[]; |
153 | 153 |
|
154 | 154 | SharedData_Cuda data; |
@@ -208,9 +208,9 @@ extern "C" __global__ void InterpTransposeAddAtPoints(const CeedInt num_elem, co |
208 | 208 | //------------------------------------------------------------------------------ |
209 | 209 | // Grad |
210 | 210 | //------------------------------------------------------------------------------ |
211 | | -extern "C" __global__ void GradAtPoints(const CeedInt num_elem, const CeedScalarCPU *__restrict__ c_B, const CeedInt *__restrict__ points_per_elem, |
212 | | - const CeedScalarCPU *__restrict__ d_X, const CeedScalarCPU *__restrict__ d_U, |
213 | | - CeedScalarCPU *__restrict__ d_V) { |
| 211 | +extern "C" __global__ void GradAtPoints(const CeedInt num_elem, const CeedScalarBase *__restrict__ c_B, const CeedInt *__restrict__ points_per_elem, |
| 212 | + const CeedScalarBase *__restrict__ d_X, const CeedScalarBase *__restrict__ d_U, |
| 213 | + CeedScalarBase *__restrict__ d_V) { |
214 | 214 | extern __shared__ CeedScalar slice[]; |
215 | 215 |
|
216 | 216 | SharedData_Cuda data; |
@@ -264,9 +264,9 @@ extern "C" __global__ void GradAtPoints(const CeedInt num_elem, const CeedScalar |
264 | 264 | } |
265 | 265 | } |
266 | 266 |
|
267 | | -extern "C" __global__ void GradTransposeAtPoints(const CeedInt num_elem, const CeedScalarCPU *__restrict__ c_B, |
268 | | - const CeedInt *__restrict__ points_per_elem, const CeedScalarCPU *__restrict__ d_X, |
269 | | - const CeedScalarCPU *__restrict__ d_U, CeedScalarCPU *__restrict__ d_V) { |
| 267 | +extern "C" __global__ void GradTransposeAtPoints(const CeedInt num_elem, const CeedScalarBase *__restrict__ c_B, |
| 268 | + const CeedInt *__restrict__ points_per_elem, const CeedScalarBase *__restrict__ d_X, |
| 269 | + const CeedScalarBase *__restrict__ d_U, CeedScalarBase *__restrict__ d_V) { |
270 | 270 | extern __shared__ CeedScalar slice[]; |
271 | 271 |
|
272 | 272 | SharedData_Cuda data; |
@@ -335,9 +335,9 @@ extern "C" __global__ void GradTransposeAtPoints(const CeedInt num_elem, const C |
335 | 335 | } |
336 | 336 | } |
337 | 337 |
|
338 | | -extern "C" __global__ void GradTransposeAddAtPoints(const CeedInt num_elem, const CeedScalarCPU *__restrict__ c_B, |
339 | | - const CeedInt *__restrict__ points_per_elem, const CeedScalarCPU *__restrict__ d_X, |
340 | | - const CeedScalarCPU *__restrict__ d_U, CeedScalarCPU *__restrict__ d_V) { |
| 338 | +extern "C" __global__ void GradTransposeAddAtPoints(const CeedInt num_elem, const CeedScalarBase *__restrict__ c_B, |
| 339 | + const CeedInt *__restrict__ points_per_elem, const CeedScalarBase *__restrict__ d_X, |
| 340 | + const CeedScalarBase *__restrict__ d_U, CeedScalarBase *__restrict__ d_V) { |
341 | 341 | extern __shared__ CeedScalar slice[]; |
342 | 342 |
|
343 | 343 | SharedData_Cuda data; |
|
0 commit comments