@@ -968,7 +968,7 @@ SIMSIMD_MAKE_DOTS_INNER(i8i8i32_neon, i8, i32, simsimd_b128_vec_t, simsimd_dot_i
968968// U8 GEMM: k_tile=16 (16 u8s = 16 bytes = NEON register width)
969969SIMSIMD_MAKE_DOTS_SERIAL_PACKED_SIZE (neon , u8 , i32 , 16 )
970970SIMSIMD_MAKE_DOTS_SERIAL_PACK (neon , u8 , i32 , 16 )
971- SIMSIMD_MAKE_DOTS_INNER (u8u8i32_neon , u8 , i32 , simsimd_b128_vec_t , simsimd_dot_u8x16_state_neon_t ,
971+ SIMSIMD_MAKE_DOTS_INNER (u8u8i32_neon , u8 , u32 , simsimd_b128_vec_t , simsimd_dot_u8x16_state_neon_t ,
972972 simsimd_dot_u8x16_init_neon , _simsimd_load_b128_neon , _simsimd_partial_load_b8x16_neon ,
973973 simsimd_dot_u8x16_update_neon , simsimd_dot_u8x16_finalize_neon ,
974974 /*k_tile=*/ 16 , /*MR=*/ 4 , /*MC=*/ 128 , /*NC=*/ 2048 , /*KC=*/ 256 )
@@ -1090,7 +1090,7 @@ SIMSIMD_MAKE_DOTS_INNER(i8i8i32_haswell, i8, i32, simsimd_b256_vec_t, simsimd_do
10901090// U8 GEMM: k_tile=32 (32 u8s = 32 bytes = AVX2 register width)
10911091SIMSIMD_MAKE_DOTS_SERIAL_PACKED_SIZE (haswell , u8 , i32 , 32 )
10921092SIMSIMD_MAKE_DOTS_SERIAL_PACK (haswell , u8 , i32 , 32 )
1093- SIMSIMD_MAKE_DOTS_INNER (u8u8i32_haswell , u8 , i32 , simsimd_b256_vec_t , simsimd_dot_u8x32_state_haswell_t ,
1093+ SIMSIMD_MAKE_DOTS_INNER (u8u8i32_haswell , u8 , u32 , simsimd_b256_vec_t , simsimd_dot_u8x32_state_haswell_t ,
10941094 simsimd_dot_u8x32_init_haswell , _simsimd_load_b256_haswell , _simsimd_partial_load_b8x32_haswell ,
10951095 simsimd_dot_u8x32_update_haswell , simsimd_dot_u8x32_finalize_haswell ,
10961096 /*k_tile=*/ 32 , /*MR=*/ 4 , /*MC=*/ 128 , /*NC=*/ 2048 , /*KC=*/ 256 )
@@ -1199,7 +1199,7 @@ SIMSIMD_MAKE_DOTS_INNER(i8i8i32_ice, i8, i32, simsimd_b512_vec_t, simsimd_dot_i8
11991199// U8 GEMM: k_tile=64 (64 u8s = 64 bytes = one 512-bit register = 1 cache line)
12001200SIMSIMD_MAKE_DOTS_SERIAL_PACKED_SIZE (ice , u8 , i32 , SIMSIMD_DOTS_SERIAL_TILE_K_U8 )
12011201SIMSIMD_MAKE_DOTS_SERIAL_PACK (ice , u8 , i32 , SIMSIMD_DOTS_SERIAL_TILE_K_U8 )
1202- SIMSIMD_MAKE_DOTS_INNER (u8u8i32_ice , u8 , i32 , simsimd_b512_vec_t , simsimd_dot_u8x64_state_ice_t ,
1202+ SIMSIMD_MAKE_DOTS_INNER (u8u8i32_ice , u8 , u32 , simsimd_b512_vec_t , simsimd_dot_u8x64_state_ice_t ,
12031203 simsimd_dot_u8x64_init_ice , _simsimd_load_b512_skylake , _simsimd_partial_load_b8x64_skylake ,
12041204 simsimd_dot_u8x64_update_ice , simsimd_dot_u8x64_finalize_ice ,
12051205 /*k_tile=*/ 64 , /*MR=*/ 4 , /*MC=*/ 128 , /*NC=*/ 2048 , /*KC=*/ 256 )
0 commit comments