@@ -181,9 +181,9 @@ static int CeedBasisApplyAtPointsCore_Cuda(CeedBasis basis, bool apply_add, cons
181181
182182 if (data -> moduleAtPoints ) CeedCallCuda (ceed , cuModuleUnload (data -> moduleAtPoints ));
183183 CeedCallBackend (CeedBasisGetNumComponents (basis , & num_comp ));
184- CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , & data -> moduleAtPoints , 9 , "BASIS_Q_1D" , Q_1d , "BASIS_P_1D" , P_1d , "BASIS_BUF_LEN" ,
185- Q_1d * CeedIntPow (Q_1d > P_1d ? Q_1d : P_1d , dim - 1 ), "BASIS_DIM" , dim , "BASIS_NUM_COMP" , num_comp ,
186- "BASIS_NUM_NODES" , CeedIntPow (P_1d , dim ), "BASIS_NUM_QPTS" , CeedIntPow (Q_1d , dim ), "BASIS_NUM_PTS" ,
184+ CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , "basis_at_points" , & data -> moduleAtPoints , 9 , "BASIS_Q_1D" , Q_1d , "BASIS_P_1D" , P_1d ,
185+ "BASIS_BUF_LEN" , Q_1d * CeedIntPow (Q_1d > P_1d ? Q_1d : P_1d , dim - 1 ), "BASIS_DIM" , dim , "BASIS_NUM_COMP" ,
186+ num_comp , "BASIS_NUM_NODES" , CeedIntPow (P_1d , dim ), "BASIS_NUM_QPTS" , CeedIntPow (Q_1d , dim ), "BASIS_NUM_PTS" ,
187187 max_num_points , "POINTS_BUFF_LEN" , CeedIntPow (Q_1d , dim - 1 )));
188188 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> moduleAtPoints , "InterpAtPoints" , & data -> InterpAtPoints ));
189189 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> moduleAtPoints , "InterpTransposeAtPoints" , & data -> InterpTransposeAtPoints ));
@@ -421,9 +421,9 @@ int CeedBasisCreateTensorH1_Cuda(CeedInt dim, CeedInt P_1d, CeedInt Q_1d, const
421421 const char basis_kernel_source [] = "// Tensor basis source\n#include <ceed/jit-source/cuda/cuda-ref-basis-tensor.h>\n" ;
422422
423423 CeedCallBackend (CeedBasisGetNumComponents (basis , & num_comp ));
424- CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , & data -> module , 7 , "BASIS_Q_1D" , Q_1d , "BASIS_P_1D" , P_1d , "BASIS_BUF_LEN" ,
425- Q_1d * CeedIntPow (Q_1d > P_1d ? Q_1d : P_1d , dim - 1 ), "BASIS_DIM" , dim , "BASIS_NUM_COMP" , num_comp ,
426- "BASIS_NUM_NODES" , CeedIntPow (P_1d , dim ), "BASIS_NUM_QPTS" , CeedIntPow (Q_1d , dim )));
424+ CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , "basis_h1_tensor" , & data -> module , 7 , "BASIS_Q_1D" , Q_1d , "BASIS_P_1D" , P_1d ,
425+ "BASIS_BUF_LEN" , Q_1d * CeedIntPow (Q_1d > P_1d ? Q_1d : P_1d , dim - 1 ), "BASIS_DIM" , dim , "BASIS_NUM_COMP" ,
426+ num_comp , "BASIS_NUM_NODES" , CeedIntPow (P_1d , dim ), "BASIS_NUM_QPTS" , CeedIntPow (Q_1d , dim )));
427427 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Interp" , & data -> Interp ));
428428 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Grad" , & data -> Grad ));
429429 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Weight" , & data -> Weight ));
@@ -477,8 +477,8 @@ int CeedBasisCreateH1_Cuda(CeedElemTopology topo, CeedInt dim, CeedInt num_nodes
477477 const char basis_kernel_source [] = "// Nontensor basis source\n#include <ceed/jit-source/cuda/cuda-ref-basis-nontensor.h>\n" ;
478478
479479 CeedCallBackend (CeedBasisGetNumComponents (basis , & num_comp ));
480- CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , & data -> module , 5 , "BASIS_Q" , num_qpts , "BASIS_P" , num_nodes , "BASIS_Q_COMP_INTERP" ,
481- q_comp_interp , "BASIS_Q_COMP_DERIV" , q_comp_grad , "BASIS_NUM_COMP" , num_comp ));
480+ CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , "basis_h1_nontensor" , & data -> module , 5 , "BASIS_Q" , num_qpts , "BASIS_P" , num_nodes ,
481+ "BASIS_Q_COMP_INTERP" , q_comp_interp , "BASIS_Q_COMP_DERIV" , q_comp_grad , "BASIS_NUM_COMP" , num_comp ));
482482 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Interp" , & data -> Interp ));
483483 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "InterpTranspose" , & data -> InterpTranspose ));
484484 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Deriv" , & data -> Deriv ));
@@ -532,8 +532,8 @@ int CeedBasisCreateHdiv_Cuda(CeedElemTopology topo, CeedInt dim, CeedInt num_nod
532532 const char basis_kernel_source [] = "// Nontensor basis source\n#include <ceed/jit-source/cuda/cuda-ref-basis-nontensor.h>\n" ;
533533
534534 CeedCallBackend (CeedBasisGetNumComponents (basis , & num_comp ));
535- CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , & data -> module , 5 , "BASIS_Q" , num_qpts , "BASIS_P" , num_nodes , "BASIS_Q_COMP_INTERP" ,
536- q_comp_interp , "BASIS_Q_COMP_DERIV" , q_comp_div , "BASIS_NUM_COMP" , num_comp ));
535+ CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , "basis_h_div" , & data -> module , 5 , "BASIS_Q" , num_qpts , "BASIS_P" , num_nodes ,
536+ "BASIS_Q_COMP_INTERP" , q_comp_interp , "BASIS_Q_COMP_DERIV" , q_comp_div , "BASIS_NUM_COMP" , num_comp ));
537537 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Interp" , & data -> Interp ));
538538 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "InterpTranspose" , & data -> InterpTranspose ));
539539 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Deriv" , & data -> Deriv ));
@@ -587,8 +587,8 @@ int CeedBasisCreateHcurl_Cuda(CeedElemTopology topo, CeedInt dim, CeedInt num_no
587587 const char basis_kernel_source [] = "// Nontensor basis source\n#include <ceed/jit-source/cuda/cuda-ref-basis-nontensor.h>\n" ;
588588
589589 CeedCallBackend (CeedBasisGetNumComponents (basis , & num_comp ));
590- CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , & data -> module , 5 , "BASIS_Q" , num_qpts , "BASIS_P" , num_nodes , "BASIS_Q_COMP_INTERP" ,
591- q_comp_interp , "BASIS_Q_COMP_DERIV" , q_comp_curl , "BASIS_NUM_COMP" , num_comp ));
590+ CeedCallBackend (CeedCompile_Cuda (ceed , basis_kernel_source , "basis_h_curl" , & data -> module , 5 , "BASIS_Q" , num_qpts , "BASIS_P" , num_nodes ,
591+ "BASIS_Q_COMP_INTERP" , q_comp_interp , "BASIS_Q_COMP_DERIV" , q_comp_curl , "BASIS_NUM_COMP" , num_comp ));
592592 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Interp" , & data -> Interp ));
593593 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "InterpTranspose" , & data -> InterpTranspose ));
594594 CeedCallBackend (CeedGetKernel_Cuda (ceed , data -> module , "Deriv" , & data -> Deriv ));
0 commit comments