Skip to content

Commit

Permalink
Merge pull request #6 from cgutman/fix_avx512_oob
Browse files Browse the repository at this point in the history
Fix memory corruption in AVX-512 codepath
  • Loading branch information
sleepybishop authored Jul 11, 2024
2 parents e9e242e + 740829b commit 19f07b5
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion deps/obl/oblas_lite.c
Original file line number Diff line number Diff line change
Expand Up @@ -73,7 +73,7 @@ void obl_axpyb32_ref(u8 *a, u32 *b, u8 u, unsigned k)
const __m128i uhi_128 = _mm_loadu_si128((__m128i *)u_hi); \
const __m512i urow_lo = _mm512_broadcast_i32x4(ulo_128); \
const __m512i urow_hi = _mm512_broadcast_i32x4(uhi_128); \
__m512i *ap = (__m512i *)a, *ae = (__m512i *)(a + k - (k % sizeof(__m256i))), *bp = (__m512i *)b; \
__m512i *ap = (__m512i *)a, *ae = (__m512i *)(a + k - (k % sizeof(__m512i))), *bp = (__m512i *)b; \
for (; ap < ae; ap++, bp++) { \
__m512i bx = _mm512_loadu_si512(bp); \
__m512i lo = _mm512_and_si512(bx, mask); \
Expand Down

0 comments on commit 19f07b5

Please sign in to comment.