Skip to content

Commit f371ecd

Browse files
authored
fix x86 conv int8 avx512vnni crash (#6038)
1 parent bb021da commit f371ecd

File tree

1 file changed

+6 -6 lines changed

1 file changed

+6 -6 lines changed

src/layer/x86/convolution_im2col_gemm_int8.h

+6 -6
Original file line number | Diff line number | Diff line change
@@ -385,10 +385,10 @@ static void convolution_im2col_input_tile_conv1x1s1d1_int8(const Mat& bottom_blo
385 385
int kk = 0;
386 386
for (; kk < max_kk / 8; kk++)
387 387
{
388-
__m128i _r01 = _mm_load_si128((const __m128i*)p0);
389-
__m128i _r23 = _mm_load_si128((const __m128i*)(p0 + 16));
390-
__m128i _r45 = _mm_load_si128((const __m128i*)(p0 + 32));
391-
__m128i _r67 = _mm_load_si128((const __m128i*)(p0 + 48));
388+
__m128i _r01 = _mm_loadu_si128((const __m128i*)p0);
389+
__m128i _r23 = _mm_loadu_si128((const __m128i*)(p0 + 16));
390+
__m128i _r45 = _mm_loadu_si128((const __m128i*)(p0 + 32));
391+
__m128i _r67 = _mm_loadu_si128((const __m128i*)(p0 + 48));
392 392

393 393
#if __AVX512VNNI__ || __AVXVNNI__
394 394
// 0011
@@ -506,8 +506,8 @@ static void convolution_im2col_input_tile_conv1x1s1d1_int8(const Mat& bottom_blo
506 506
int kk = 0;
507 507
for (; kk < max_kk / 8; kk++)
508 508
{
509-
__m128i _r01 = _mm_load_si128((const __m128i*)p0);
510-
__m128i _r23 = _mm_load_si128((const __m128i*)(p0 + 16));
509+
__m128i _r01 = _mm_loadu_si128((const __m128i*)p0);
510+
__m128i _r23 = _mm_loadu_si128((const __m128i*)(p0 + 16));
511 511

512 512
#if __AVX512VNNI__ || __AVXVNNI__
513 513
__m128i _t0 = _mm_unpacklo_epi32(_r01, _r23);

0 commit comments

Comments (0)