File tree Expand file tree Collapse file tree
runtime/libs/circle-schema Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -87,6 +87,13 @@ enum TensorType : byte {
8787 GGML_Q8_1 = - 5 ,
8888
8989 // MX dtypes
90+ // Current restrictions of MX dtypes
91+ // - MX dtypes are not used for model I/O
92+ // - MX dtypes are used for activations, not for constant inputs (e.g. weights)
93+ // - MX dtype parameters (block size, exponent scale, etc.) follow the
94+ // OCP Microscaling Formats Specification
95+ // - The model does not contain exponent scale data.
96+ // A backend should define and use it internally if needed
9097 MXFP4 = - 6 ,
9198 MXINT8 = - 7 ,
9299}
Original file line number Diff line number Diff line change @@ -87,6 +87,13 @@ enum TensorType : byte {
8787 GGML_Q8_1 = - 5 ,
8888
8989 // MX dtypes
90+ // Current restrictions of MX dtypes
91+ // - MX dtypes are not used for model I/O
92+ // - MX dtypes are used for activations, not for constant inputs (e.g. weights)
93+ // - MX dtype parameters (block size, exponent scale, etc.) follow the
94+ // OCP Microscaling Formats Specification
95+ // - The model does not contain exponent scale data.
96+ // A backend should define and use it internally if needed
9097 MXFP4 = - 6 ,
9198 MXINT8 = - 7 ,
9299}
Original file line number Diff line number Diff line change @@ -87,6 +87,13 @@ enum TensorType : byte {
8787 GGML_Q8_1 = - 5 ,
8888
8989 // MX dtypes
90+ // Current restrictions of MX dtypes
91+ // - MX dtypes are not used for model I/O
92+ // - MX dtypes are used for activations, not for constant inputs (e.g. weights)
93+ // - MX dtype parameters (block size, exponent scale, etc.) follow the
94+ // OCP Microscaling Formats Specification
95+ // - The model does not contain exponent scale data.
96+ // A backend should define and use it internally if needed
9097 MXFP4 = - 6 ,
9198 MXINT8 = - 7 ,
9299}
You can’t perform that action at this time.
0 commit comments