@@ -40,7 +40,7 @@ inline __device__ void ChebyshevDerivativeAtPoint(const CeedScalar x, CeedScalar
4040// ------------------------------------------------------------------------------
4141// 1D interpolate to points
4242// ------------------------------------------------------------------------------
43- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
43+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
4444inline __device__ void InterpAtPoints1d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_C, const CeedScalar *r_X,
4545 CeedScalar *__restrict__ r_V) {
4646 CeedScalar chebyshev_x[Q_1D];
@@ -61,7 +61,7 @@ inline __device__ void InterpAtPoints1d(SharedData_Cuda &data, const CeedInt p,
6161// ------------------------------------------------------------------------------
6262// 1D interpolate transpose
6363// ------------------------------------------------------------------------------
64- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
64+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
6565inline __device__ void InterpTransposeAtPoints1d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_U, const CeedScalar *r_X,
6666 CeedScalar *__restrict__ r_C) {
6767 CeedScalar chebyshev_x[Q_1D];
@@ -86,7 +86,7 @@ inline __device__ void InterpTransposeAtPoints1d(SharedData_Cuda &data, const Ce
8686// ------------------------------------------------------------------------------
8787// 1D derivatives at points
8888// ------------------------------------------------------------------------------
89- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
89+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
9090inline __device__ void GradAtPoints1d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_C, const CeedScalar *r_X,
9191 CeedScalar *__restrict__ r_V) {
9292 CeedScalar chebyshev_x[Q_1D];
@@ -107,7 +107,7 @@ inline __device__ void GradAtPoints1d(SharedData_Cuda &data, const CeedInt p, co
107107// ------------------------------------------------------------------------------
108108// 1D derivatives transpose
109109// ------------------------------------------------------------------------------
110- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
110+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
111111inline __device__ void GradTransposeAtPoints1d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_U, const CeedScalar *r_X,
112112 CeedScalar *__restrict__ r_C) {
113113 CeedScalar chebyshev_x[Q_1D];
@@ -136,7 +136,7 @@ inline __device__ void GradTransposeAtPoints1d(SharedData_Cuda &data, const Ceed
136136// ------------------------------------------------------------------------------
137137// 2D interpolate to points
138138// ------------------------------------------------------------------------------
139- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
139+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
140140inline __device__ void InterpAtPoints2d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_C, const CeedScalar *r_X,
141141 CeedScalar *__restrict__ r_V) {
142142 for (CeedInt i = 0 ; i < NUM_COMP; i++) r_V[i] = 0.0 ;
@@ -166,7 +166,7 @@ inline __device__ void InterpAtPoints2d(SharedData_Cuda &data, const CeedInt p,
166166// ------------------------------------------------------------------------------
167167// 2D interpolate transpose
168168// ------------------------------------------------------------------------------
169- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
169+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
170170inline __device__ void InterpTransposeAtPoints2d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_U, const CeedScalar *r_X,
171171 CeedScalar *__restrict__ r_C) {
172172 for (CeedInt comp = 0 ; comp < NUM_COMP; comp++) {
@@ -204,7 +204,7 @@ inline __device__ void InterpTransposeAtPoints2d(SharedData_Cuda &data, const Ce
204204// ------------------------------------------------------------------------------
205205// 2D derivatives at points
206206// ------------------------------------------------------------------------------
207- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
207+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
208208inline __device__ void GradAtPoints2d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_C, const CeedScalar *r_X,
209209 CeedScalar *__restrict__ r_V) {
210210 for (CeedInt i = 0 ; i < NUM_COMP * 2 ; i++) r_V[i] = 0.0 ;
@@ -238,7 +238,7 @@ inline __device__ void GradAtPoints2d(SharedData_Cuda &data, const CeedInt p, co
238238// ------------------------------------------------------------------------------
239239// 2D derivatives transpose
240240// ------------------------------------------------------------------------------
241- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
241+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
242242inline __device__ void GradTransposeAtPoints2d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_U, const CeedScalar *r_X,
243243 CeedScalar *__restrict__ r_C) {
244244 for (CeedInt comp = 0 ; comp < NUM_COMP; comp++) {
@@ -284,7 +284,7 @@ inline __device__ void GradTransposeAtPoints2d(SharedData_Cuda &data, const Ceed
284284// ------------------------------------------------------------------------------
285285// 3D interpolate to points
286286// ------------------------------------------------------------------------------
287- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
287+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
288288inline __device__ void InterpAtPoints3d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_C, const CeedScalar *r_X,
289289 CeedScalar *__restrict__ r_V) {
290290 for (CeedInt i = 0 ; i < NUM_COMP; i++) r_V[i] = 0.0 ;
@@ -319,7 +319,7 @@ inline __device__ void InterpAtPoints3d(SharedData_Cuda &data, const CeedInt p,
319319// ------------------------------------------------------------------------------
320320// 3D interpolate transpose
321321// ------------------------------------------------------------------------------
322- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
322+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
323323inline __device__ void InterpTransposeAtPoints3d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_U, const CeedScalar *r_X,
324324 CeedScalar *__restrict__ r_C) {
325325 for (CeedInt comp = 0 ; comp < NUM_COMP; comp++) {
@@ -362,7 +362,7 @@ inline __device__ void InterpTransposeAtPoints3d(SharedData_Cuda &data, const Ce
362362// ------------------------------------------------------------------------------
363363// 3D derivatives at points
364364// ------------------------------------------------------------------------------
365- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
365+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
366366inline __device__ void GradAtPoints3d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_C, const CeedScalar *r_X,
367367 CeedScalar *__restrict__ r_V) {
368368 for (CeedInt i = 0 ; i < NUM_COMP * 3 ; i++) r_V[i] = 0.0 ;
@@ -402,7 +402,7 @@ inline __device__ void GradAtPoints3d(SharedData_Cuda &data, const CeedInt p, co
402402// ------------------------------------------------------------------------------
403403// 3D derivatives transpose
404404// ------------------------------------------------------------------------------
405- template <int NUM_COMP, int NUM_POINTS, int Q_1D>
405+ template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D>
406406inline __device__ void GradTransposeAtPoints3d (SharedData_Cuda &data, const CeedInt p, const CeedScalar *__restrict__ r_U, const CeedScalar *r_X,
407407 CeedScalar *__restrict__ r_C) {
408408 for (CeedInt comp = 0 ; comp < NUM_COMP; comp++) {
0 commit comments