{
u32 mask = pow2_mask (max_count - count);
u32 bmp =
- u32x16_is_equal_mask (u32x16_mask_load_zero (data, mask), splat);
+ u32x16_is_equal_mask (u32x16_mask_load_zero (data, mask), splat) &
+ mask;
return count + count_trailing_zeros (~bmp);
}
#elif defined(CLIB_HAVE_VEC256)
}
if (count == max_count)
return count;
-#if defined(CxLIB_HAVE_VEC256_MASK_LOAD_STORE)
+#if defined(CLIB_HAVE_VEC256_MASK_LOAD_STORE)
else
{
u32 mask = pow2_mask (max_count - count);
- u32 bmp = u32x8_is_equal_mask (u32x8_mask_load_zero (data, mask), splat);
+ u32 bmp =
+ u32x8_is_equal_mask (u32x8_mask_load_zero (data, mask), splat) & mask;
return count + count_trailing_zeros (~bmp);
}
#endif
else
{
u64 mask = pow2_mask (max_count - count);
- u64 bmp = u8x64_is_equal_mask (u8x64_mask_load_zero (data, mask), splat);
+ u64 bmp =
+ u8x64_is_equal_mask (u8x64_mask_load_zero (data, mask), splat) & mask;
return count + count_trailing_zeros (~bmp);
}
#endif
else
{
u32 mask = pow2_mask (max_count - count);
- u64 bmp = u8x32_msb_mask (u8x32_mask_load_zero (data, mask) == splat);
+ u64 bmp =
+ u8x32_msb_mask (u8x32_mask_load_zero (data, mask) == splat) & mask;
return count + count_trailing_zeros (~bmp);
}
#endif