CEED
diff --git a/‎backends/cuda-gen/ceed-cuda-gen-operator-build.cpp‎
Lines changed: 19 additions & 19 deletions b/‎backends/cuda-gen/ceed-cuda-gen-operator-build.cpp‎
Lines changed: 19 additions & 19 deletions
diff --git a/‎backends/cuda/ceed-cuda-compile.cpp‎
Lines changed: 11 additions & 3 deletions b/‎backends/cuda/ceed-cuda-compile.cpp‎
Lines changed: 11 additions & 3 deletions
diff --git a/‎backends/hip-gen/ceed-hip-gen-operator-build.cpp‎
Lines changed: 2 additions & 2 deletions b/‎backends/hip-gen/ceed-hip-gen-operator-build.cpp‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎include/ceed-impl.h‎
Lines changed: 1 addition & 1 deletion b/‎include/ceed-impl.h‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎include/ceed/ceed-f32.h‎
Lines changed: 10 additions & 0 deletions b/‎include/ceed/ceed-f32.h‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎include/ceed/ceed-f64.h‎
Lines changed: 3 additions & 1 deletion b/‎include/ceed/ceed-f64.h‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎include/ceed/ceed.h‎
Lines changed: 3 additions & 2 deletions b/‎include/ceed/ceed.h‎
Lines changed: 3 additions & 2 deletions
diff --git a/‎include/ceed/types.h‎
Lines changed: 4 additions & 2 deletions b/‎include/ceed/types.h‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎interface/ceed-operator.c‎
Lines changed: 15 additions & 11 deletions b/‎interface/ceed-operator.c‎
Lines changed: 15 additions & 11 deletions
diff --git a/‎interface/ceed-types.c‎
Lines changed: 5 additions & 0 deletions b/‎interface/ceed-types.c‎
Lines changed: 5 additions & 0 deletions
@@ -1572,17 +1572,17 @@ extern "C" int CeedOperatorBuildKernel_Cuda_gen(CeedOperator op, bool *is_good_b
 
   // Compile
   {
-    bool          is_compile_good = false;
-    const CeedInt T_1d            = CeedIntMax(is_all_tensor ? Q_1d : Q, data->max_P_1d);
-    bool          use_mixed_precision;
+    bool           is_compile_good = false;
+    const CeedInt  T_1d            = CeedIntMax(is_all_tensor ? Q_1d : Q, data->max_P_1d);
+    CeedScalarType precision;
 
     // Check for mixed precision
-    CeedCallBackend(CeedOperatorGetMixedPrecision(op, &use_mixed_precision));
+    CeedCallBackend(CeedOperatorGetPrecision(op, &precision));
 
     data->thread_1d = T_1d;
-    if (use_mixed_precision) {
-      CeedCallBackend(
-          CeedTryCompile_Cuda(ceed, code.str().c_str(), &is_compile_good, &data->module, 2, "OP_T_1D", T_1d, "CEED_JIT_MIXED_PRECISION", 1));
+    if (precision != CEED_SCALAR_TYPE) {
+      CeedCallBackend(CeedTryCompile_Cuda(ceed, code.str().c_str(), &is_compile_good, &data->module, 2, "OP_T_1D", T_1d, "CEED_JIT_PRECISION",
+                                          CeedScalarTypes[precision]));
     } else {
       CeedCallBackend(CeedTryCompile_Cuda(ceed, code.str().c_str(), &is_compile_good, &data->module, 1, "OP_T_1D", T_1d));
     }
@@ -2052,18 +2052,18 @@ static int CeedOperatorBuildKernelAssemblyAtPoints_Cuda_gen(CeedOperator op, boo
 
   // Compile
   {
-    bool          is_compile_good = false;
-    const CeedInt T_1d            = CeedIntMax(is_all_tensor ? Q_1d : Q, data->max_P_1d);
-    bool          use_mixed_precision;
+    bool           is_compile_good = false;
+    const CeedInt  T_1d            = CeedIntMax(is_all_tensor ? Q_1d : Q, data->max_P_1d);
+    CeedScalarType precision;
 
     // Check for mixed precision
-    CeedCallBackend(CeedOperatorGetMixedPrecision(op, &use_mixed_precision));
+    CeedCallBackend(CeedOperatorGetPrecision(op, &precision));
 
     data->thread_1d = T_1d;
-    if (use_mixed_precision) {
+    if (precision != CEED_SCALAR_TYPE) {
       CeedCallBackend(CeedTryCompile_Cuda(ceed, code.str().c_str(), &is_compile_good,
                                           is_full ? &data->module_assemble_full : &data->module_assemble_diagonal, 2, "OP_T_1D", T_1d,
-                                          "CEED_JIT_MIXED_PRECISION", 1));
+                                          "CEED_JIT_PRECISION", CeedScalarTypes[precision]));
     } else {
       CeedCallBackend(CeedTryCompile_Cuda(ceed, code.str().c_str(), &is_compile_good,
                                           is_full ? &data->module_assemble_full : &data->module_assemble_diagonal, 1, "OP_T_1D", T_1d));
@@ -2642,17 +2642,17 @@ extern "C" int CeedOperatorBuildKernelLinearAssembleQFunction_Cuda_gen(CeedOpera
 
   // Compile
   {
-    bool          is_compile_good = false;
-    const CeedInt T_1d            = CeedIntMax(is_all_tensor ? Q_1d : Q, data->max_P_1d);
-    bool          use_mixed_precision;
+    bool           is_compile_good = false;
+    const CeedInt  T_1d            = CeedIntMax(is_all_tensor ? Q_1d : Q, data->max_P_1d);
+    CeedScalarType precision;
 
     // Check for mixed precision
-    CeedCallBackend(CeedOperatorGetMixedPrecision(op, &use_mixed_precision));
+    CeedCallBackend(CeedOperatorGetPrecision(op, &precision));
 
     data->thread_1d = T_1d;
-    if (use_mixed_precision) {
+    if (precision != CEED_SCALAR_TYPE) {
       CeedCallBackend(CeedTryCompile_Cuda(ceed, code.str().c_str(), &is_compile_good, &data->module_assemble_qfunction, 2, "OP_T_1D", T_1d,
-                                          "CEED_JIT_MIXED_PRECISION", 1));
+                                          "CEED_JIT_PRECISION", CeedScalarTypes[precision]));
     } else {
       CeedCallBackend(CeedTryCompile_Cuda(ceed, code.str().c_str(), &is_compile_good, &data->module_assemble_qfunction, 1, "OP_T_1D", T_1d));
     }
 
@@ -52,12 +52,20 @@ static int CeedCompileCore_Cuda(Ceed ceed, const char *source, const bool throw_
   // Get kernel specific options, such as kernel constants
   if (num_defines > 0) {
     char *name;
-    int   val;
 
     for (int i = 0; i < num_defines; i++) {
       name = va_arg(args, char *);
-      val  = va_arg(args, int);
-      code << "#define " << name << " " << val << "\n";
+      if (!strcmp(name, "CEED_JIT_PRECISION")) {
+        char *val;
+
+        val = va_arg(args, char *);
+        code << "#define " << name << " " << val << "\n";
+      } else {
+        int val;
+
+        val = va_arg(args, int);
+        code << "#define " << name << " " << val << "\n";
+      }
     }
   }
 
 
@@ -2483,8 +2483,8 @@ extern "C" int CeedOperatorBuildKernelLinearAssembleQFunction_Hip_gen(CeedOperat
       CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[f], &field_size));
       CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[f], &eval_mode));
       if (eval_mode == CEED_EVAL_GRAD) {
-        code << tab << "CeedScalar r_q_in_" << f << "[num_comp_in_" << f << "*" << "dim_in_" << f << "*"
-             << (is_all_tensor && (max_dim >= 3) ? "Q_1d" : "1") << "] = {0.};\n";
+        code << tab << "CeedScalar r_q_in_" << f << "[num_comp_in_" << f << "*"
+             << "dim_in_" << f << "*" << (is_all_tensor && (max_dim >= 3) ? "Q_1d" : "1") << "] = {0.};\n";
       } else {
         code << tab << "CeedScalar r_q_in_" << f << "[num_comp_in_" << f << "*" << (is_all_tensor && (max_dim >= 3) ? "Q_1d" : "1") << "] = {0.};\n";
       }
 
@@ -381,7 +381,7 @@ struct CeedOperator_private {
   bool                      is_composite;
   bool                      is_at_points;
   bool                      has_restriction;
-  bool                      use_mixed_precision;
+  CeedScalarType            precision;
   CeedQFunctionAssemblyData qf_assembled;
   CeedOperatorAssemblyData  op_assembled;
   CeedOperator             *sub_operators;
 
@@ -18,8 +18,18 @@
 
 /// Set base scalar type to FP32. (See CeedScalarType enum in ceed.h for all options.)
 #define CEED_SCALAR_TYPE CEED_SCALAR_FP32
+#if defined(CEED_RUNNING_JIT_PASS) && defined(CEED_JIT_PRECISION) && (CEED_JIT_PRECISION != CEED_SCALAR_TYPE)
+#if CEED_JIT_PRECISION == CEED_SCALAR_FP64
+typedef double CeedScalar;
+typedef float  CeedScalarCPU;
+
+/// Machine epsilon
+static const CeedScalar CEED_EPSILON = DBL_EPSILON;
+#endif  // CEED_JIT_PRECISION
+#else  // not a JIT pass, or JIT precision equals the base scalar type
 typedef float      CeedScalar;
 typedef CeedScalar CeedScalarCPU;
 
 /// Machine epsilon
 static const CeedScalar CEED_EPSILON = FLT_EPSILON;
+#endif  // CEED_RUNNING_JIT_PASS && CEED_JIT_PRECISION
@@ -18,12 +18,14 @@
 
 /// Set base scalar type to FP64. (See CeedScalarType enum in ceed.h for all options.)
 #define CEED_SCALAR_TYPE CEED_SCALAR_FP64
-#if defined(CEED_RUNNING_JIT_PASS) && defined(CEED_JIT_MIXED_PRECISION)
+#if defined(CEED_RUNNING_JIT_PASS) && defined(CEED_JIT_PRECISION) && (CEED_JIT_PRECISION != CEED_SCALAR_TYPE)
+#if CEED_JIT_PRECISION == CEED_SCALAR_FP32
 typedef float  CeedScalar;
 typedef double CeedScalarCPU;
 
 /// Machine epsilon
 static const CeedScalar CEED_EPSILON = FLT_EPSILON;
+#endif  // CEED_JIT_PRECISION
 #else
 typedef double     CeedScalar;
 typedef CeedScalar CeedScalarCPU;
 
@@ -178,6 +178,7 @@ CEED_EXTERN const char *const  CeedEvalModes[];
 CEED_EXTERN const char *const  CeedQuadModes[];
 CEED_EXTERN const char *const  CeedElemTopologies[];
 CEED_EXTERN const char *const  CeedContextFieldTypes[];
+CEED_EXTERN const char *const  CeedScalarTypes[];
 
 CEED_EXTERN int CeedGetPreferredMemType(Ceed ceed, CeedMemType *type);
 
@@ -427,8 +428,8 @@ CEED_EXTERN int  CeedOperatorCheckReady(CeedOperator op);
 CEED_EXTERN int  CeedOperatorGetActiveVectorLengths(CeedOperator op, CeedSize *input_size, CeedSize *output_size);
 CEED_EXTERN int  CeedOperatorSetQFunctionAssemblyReuse(CeedOperator op, bool reuse_assembly_data);
 CEED_EXTERN int  CeedOperatorSetQFunctionAssemblyDataUpdateNeeded(CeedOperator op, bool needs_data_update);
-CEED_EXTERN int  CeedOperatorSetMixedPrecision(CeedOperator op);
-CEED_EXTERN int  CeedOperatorGetMixedPrecision(CeedOperator op, bool *use_mixed_precision);
+CEED_EXTERN int  CeedOperatorSetPrecision(CeedOperator op, CeedScalarType precision);
+CEED_EXTERN int  CeedOperatorGetPrecision(CeedOperator op, CeedScalarType *precision);
 CEED_EXTERN int  CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request);
 CEED_EXTERN int  CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr,
                                                                   CeedRequest *request);
 
@@ -118,10 +118,12 @@ typedef signed char CeedInt8;
 /// @ingroup Ceed
 typedef enum {
   /// Single precision
-  CEED_SCALAR_FP32,
+  CEED_SCALAR_FP32 = 0,
   /// Double precision
-  CEED_SCALAR_FP64
+  CEED_SCALAR_FP64 = 1
 } CeedScalarType;
+#define CEED_SCALAR_FP32 0  // macro mirror of the enumerator so `#if` can compare precisions (see ceed-f32.h / ceed-f64.h)
+#define CEED_SCALAR_FP64 1  // NOTE(review): these macros replace the enumerators with int literals; confirm C++ callers still compile
 /// Base scalar type for the library to use: change which header is included to change the precision.
 #include "ceed-f64.h"  // IWYU pragma: export
 
 
@@ -635,43 +635,45 @@ int CeedOperatorIsSetupDone(CeedOperator op, bool *is_setup_done) {
 }
 
 /**
-  @brief Set a `CeedOperator` to use reduced precision for operator application
+  @brief Set the floating point precision for `CeedOperator` application
 
-  @param[in] op `CeedOperator`
+  @param[in] op        `CeedOperator`
+  @param[in] precision `CeedScalarType` to use for operator application
 
   @return An error code: 0 - success, otherwise - failure
 
   @ref User
 **/
-int CeedOperatorSetMixedPrecision(CeedOperator op) {
+int CeedOperatorSetPrecision(CeedOperator op, CeedScalarType precision) {
   bool is_immutable, is_composite, supports_mixed_precision;
   Ceed ceed;
 
   CeedCall(CeedOperatorGetCeed(op, &ceed));
   CeedCall(CeedOperatorIsImmutable(op, &is_immutable));
-  CeedCheck(!is_immutable, ceed, CEED_ERROR_INCOMPATIBLE, "CeedOperatorSetMixedPrecision must be called before operator is finalized");
+  CeedCheck(!is_immutable, ceed, CEED_ERROR_INCOMPATIBLE, "CeedOperatorSetPrecision must be called before operator is finalized");
   CeedCall(CeedOperatorIsComposite(op, &is_composite));
-  CeedCheck(!is_composite, ceed, CEED_ERROR_INCOMPATIBLE, "CeedOperatorSetMixedPrecision should be set on single operators");
+  CeedCheck(!is_composite, ceed, CEED_ERROR_INCOMPATIBLE, "CeedOperatorSetPrecision should be set on single operators");
   CeedCall(CeedGetSupportsMixedPrecision(ceed, &supports_mixed_precision));
-  CeedCheck(supports_mixed_precision, ceed, CEED_ERROR_UNSUPPORTED, "Backend does not implement mixed precision operators");
+  CeedCheck(precision == CEED_SCALAR_TYPE || supports_mixed_precision, ceed, CEED_ERROR_UNSUPPORTED,
+            "Backend does not implement mixed precision operators");
 
-  op->use_mixed_precision = true;
+  op->precision = precision;
   CeedCallBackend(CeedDestroy(&ceed));
   return CEED_ERROR_SUCCESS;
 }
 
 /**
-  @brief Get whether a `CeedOperator` is set to use reduced precision for operator application
+  @brief Get the floating point precision used for `CeedOperator` application
 
-  @param[in]  op                  `CeedOperator`
-  @param[out] use_mixed_precision Variable to store `CeedQFunction`
+  @param[in]  op        `CeedOperator`
+  @param[out] precision Variable to store operator precision
 
   @return An error code: 0 - success, otherwise - failure
 
   @ref User
 **/
-int CeedOperatorGetMixedPrecision(CeedOperator op, bool *use_mixed_precision) {
-  *use_mixed_precision = op->use_mixed_precision;
+int CeedOperatorGetPrecision(CeedOperator op, CeedScalarType *precision) {
+  *precision = op->precision;
   return CEED_ERROR_SUCCESS;
 }
 
@@ -809,6 +811,7 @@ int CeedOperatorCreate(Ceed ceed, CeedQFunction qf, CeedQFunction dqf, CeedQFunc
   (*op)->ref_count   = 1;
   (*op)->input_size  = -1;
   (*op)->output_size = -1;
+  (*op)->precision   = CEED_SCALAR_TYPE;
   CeedCall(CeedQFunctionReferenceCopy(qf, &(*op)->qf));
   if (dqf && dqf != CEED_QFUNCTION_NONE) CeedCall(CeedQFunctionReferenceCopy(dqf, &(*op)->dqf));
   if (dqfT && dqfT != CEED_QFUNCTION_NONE) CeedCall(CeedQFunctionReferenceCopy(dqfT, &(*op)->dqfT));
@@ -853,6 +856,7 @@ int CeedOperatorCreateAtPoints(Ceed ceed, CeedQFunction qf, CeedQFunction dqf, C
   (*op)->is_at_points = true;
   (*op)->input_size   = -1;
   (*op)->output_size  = -1;
+  (*op)->precision    = CEED_SCALAR_TYPE;
   CeedCall(CeedQFunctionReferenceCopy(qf, &(*op)->qf));
   if (dqf && dqf != CEED_QFUNCTION_NONE) CeedCall(CeedQFunctionReferenceCopy(dqf, &(*op)->dqf));
   if (dqfT && dqfT != CEED_QFUNCTION_NONE) CeedCall(CeedQFunctionReferenceCopy(dqfT, &(*op)->dqfT));
 
@@ -64,3 +64,8 @@ const char *const CeedFESpaces[] = {
     [CEED_FE_SPACE_HDIV]  = "H(div) space",
     [CEED_FE_SPACE_HCURL] = "H(curl) space",
 };
+
+const char *const CeedScalarTypes[] = {
+    [CEED_SCALAR_FP32] = "CEED_SCALAR_FP32",
+    [CEED_SCALAR_FP64] = "CEED_SCALAR_FP64",  // must spell the enumerator: CUDA JIT emits this string as the CEED_JIT_PRECISION value
+};