@@ -103,6 +103,7 @@ Status FirefoxMatMulInteger8::Compute(OpKernelContext* ctx) const {
103103 gemm_shape.BIsSigned = b_is_signed;
104104
105105 const size_t batch_size = helper.OutputOffsets ().size ();
106+
106107 std::vector<MLAS_GEMM_QUANT_DATA_PARAMS> gemm_data_vec (batch_size);
107108
108109 for (size_t batch = 0 ; batch < batch_size; batch++) {
@@ -118,7 +119,6 @@ Status FirefoxMatMulInteger8::Compute(OpKernelContext* ctx) const {
118119 gemm_params.B = b_data + helper.RightOffsets ()[batch];
119120 gemm_params.C = y_data + helper.OutputOffsets ()[batch];
120121 }
121-
122122 #if 0
123123 std::cout << "Matrix A (sample):\n";
124124 for (size_t i = 0; i < 5; ++i) {
@@ -147,7 +147,6 @@ Status FirefoxMatMulInteger8::Compute(OpKernelContext* ctx) const {
147147 } else {
148148 std::cout << "b_zero_point is null\n";
149149 }
150-
151150 #endif
152151 // auto start_matmul = Clock::now();
153152 int8Multiply (
@@ -161,7 +160,7 @@ Status FirefoxMatMulInteger8::Compute(OpKernelContext* ctx) const {
161160 reinterpret_cast <float *>(y_data)
162161 );
163162 // auto end_matmul = Clock::now();
164- // auto matmul_time = std::chrono::duration_cast<Microseconds>(end_matmul - start_matmul).count();
163+ // auto matmul_time = std::chrono::duration_cast<Microseconds>(end_matmul - start_matmul).count();
165164
166165 // rowsA = M
167166 // width = K
@@ -191,20 +190,18 @@ Status FirefoxMatMulInteger8::Compute(OpKernelContext* ctx) const {
191190 outputPtr[rowIndex * colsB + colIndex] = tempResult;
192191 }
193192 }
194- #endif
195193
196- /*
197194 // Mlas (will fallback if we don't meet requirements)
198195 auto start_mblas = Clock::now();
199196 MlasGemmBatch(gemm_shape, gemm_data_vec.data(), batch_size, ctx->GetOperatorThreadPool());
200197 auto end_mblas = Clock::now();
201198 auto mblas_time = std::chrono::duration_cast<Microseconds>(end_mblas - start_mblas).count();
202- */
203199 // Output timing results
204- // std::cout << "Timing (microseconds):\n";
205- // std::cout << "MatMulFull: " << matmul_time << "\n";
206- // std::cout << "MlasGemmBatch: " << mblas_time << "\n";
200+ std::cout << "Timing (microseconds):\n";
201+ std::cout << "MatMulFull: " << matmul_time << "\n";
202+ std::cout << "MlasGemmBatch: " << mblas_time << "\n";
207203
204+ #endif
208205 return Status::OK ();
209206}
210207
0 commit comments