We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 20c1430, commit dbd3bda (full SHA abbreviated as dbd3bda)
1 file changed
src/embedding/simd.rs
@@ -386,7 +386,7 @@ pub mod f32_ops {
386
#[allow(unused_imports)]
387
use std::arch::x86_64::*;
388
389
- #[inline(always)]
+ #[inline]
390
#[target_feature(enable = "avx2")]
391
unsafe fn hsum_f32x8(v: __m256) -> f32 {
392
let v128 = _mm_add_ps(_mm256_castps256_ps128(v), _mm256_extractf128_ps(v, 1));
@@ -906,7 +906,7 @@ pub mod i8_ops {
906
907
908
909
910
911
unsafe fn hsum_i32x8(v: __m256i) -> i32 {
912
let v128 = _mm_add_epi32(_mm256_castsi256_si128(v), _mm256_extracti128_si256(v, 1));
0 commit comments