@@ -251,7 +251,6 @@ inline float euclidean_distance_squared<distance_comp_inner, float, ::std::int8_
251
251
int16x8_t vreg_b_s16_0 = vmovl_s8 (vget_low_s8 (vreg_b));
252
252
int16x8_t vreg_b_s16_1 = vmovl_s8 (vget_high_s8 (vreg_b));
253
253
254
- # if 1
255
254
vreg_a_s16_0 = vmulq_s16 (vreg_a_s16_0, vreg_b_s16_0);
256
255
vreg_a_s16_1 = vmulq_s16 (vreg_a_s16_1, vreg_b_s16_1);
257
256
@@ -264,24 +263,6 @@ inline float euclidean_distance_squared<distance_comp_inner, float, ::std::int8_
264
263
vreg_dsum_fp32_1 = vsubq_f32 (vreg_dsum_fp32_1, vreg_res_fp32_1);
265
264
vreg_dsum_fp32_2 = vsubq_f32 (vreg_dsum_fp32_2, vreg_res_fp32_2);
266
265
vreg_dsum_fp32_3 = vsubq_f32 (vreg_dsum_fp32_3, vreg_res_fp32_3);
267
- #else
268
- // TODO: WILL BE REMOVED BEFORE MERGE
269
- vreg_a_s16_0 = vnegq_s16 (vreg_a_s16_0);
270
- vreg_a_s16_1 = vnegq_s16 (vreg_a_s16_1);
271
-
272
- float32x4_t vreg_a_fp32_0 = vcvtq_f32_s32 (vmovl_s16 (vget_low_s16 (vreg_a_s16_0)));
273
- float32x4_t vreg_b_fp32_0 = vcvtq_f32_s32 (vmovl_s16 (vget_low_s16 (vreg_b_s16_0)));
274
- vreg_dsum_fp32_0 = vfmaq_f32 (vreg_dsum_fp32_0, vreg_a_fp32_0, vreg_b_fp32_0);
275
- float32x4_t vreg_a_fp32_1 = vcvtq_f32_s32 (vmovl_s16 (vget_high_s16 (vreg_a_s16_0)));
276
- float32x4_t vreg_b_fp32_1 = vcvtq_f32_s32 (vmovl_s16 (vget_high_s16 (vreg_b_s16_0)));
277
- vreg_dsum_fp32_1 = vfmaq_f32 (vreg_dsum_fp32_1, vreg_a_fp32_1, vreg_b_fp32_1);
278
- float32x4_t vreg_a_fp32_2 = vcvtq_f32_s32 (vmovl_s16 (vget_low_s16 (vreg_a_s16_1)));
279
- float32x4_t vreg_b_fp32_2 = vcvtq_f32_s32 (vmovl_s16 (vget_low_s16 (vreg_b_s16_1)));
280
- vreg_dsum_fp32_2 = vfmaq_f32 (vreg_dsum_fp32_2, vreg_a_fp32_2, vreg_b_fp32_2);
281
- float32x4_t vreg_a_fp32_3 = vcvtq_f32_s32 (vmovl_s16 (vget_high_s16 (vreg_a_s16_1)));
282
- float32x4_t vreg_b_fp32_3 = vcvtq_f32_s32 (vmovl_s16 (vget_high_s16 (vreg_b_s16_1)));
283
- vreg_dsum_fp32_3 = vfmaq_f32 (vreg_dsum_fp32_3, vreg_a_fp32_3, vreg_b_fp32_3);
284
- #endif
285
266
}
286
267
287
268
vreg_dsum_fp32_0 = vaddq_f32 (vreg_dsum_fp32_0, vreg_dsum_fp32_1);
0 commit comments