File tree: 1 file changed (6 additions, 6 deletions).
Columns: original file line number | diff line number | diff line change
@@ -385,10 +385,10 @@ static void convolution_im2col_input_tile_conv1x1s1d1_int8(const Mat& bottom_blo
385
385
int kk = 0 ;
386
386
for (; kk < max_kk / 8 ; kk++)
387
387
{
388
- __m128i _r01 = _mm_load_si128 ((const __m128i*)p0);
389
- __m128i _r23 = _mm_load_si128 ((const __m128i*)(p0 + 16 ));
390
- __m128i _r45 = _mm_load_si128 ((const __m128i*)(p0 + 32 ));
391
- __m128i _r67 = _mm_load_si128 ((const __m128i*)(p0 + 48 ));
388
+ __m128i _r01 = _mm_loadu_si128 ((const __m128i*)p0);
389
+ __m128i _r23 = _mm_loadu_si128 ((const __m128i*)(p0 + 16 ));
390
+ __m128i _r45 = _mm_loadu_si128 ((const __m128i*)(p0 + 32 ));
391
+ __m128i _r67 = _mm_loadu_si128 ((const __m128i*)(p0 + 48 ));
392
392
393
393
#if __AVX512VNNI__ || __AVXVNNI__
394
394
// 0011
@@ -506,8 +506,8 @@ static void convolution_im2col_input_tile_conv1x1s1d1_int8(const Mat& bottom_blo
506
506
int kk = 0 ;
507
507
for (; kk < max_kk / 8 ; kk++)
508
508
{
509
- __m128i _r01 = _mm_load_si128 ((const __m128i*)p0);
510
- __m128i _r23 = _mm_load_si128 ((const __m128i*)(p0 + 16 ));
509
+ __m128i _r01 = _mm_loadu_si128 ((const __m128i*)p0);
510
+ __m128i _r23 = _mm_loadu_si128 ((const __m128i*)(p0 + 16 ));
511
511
512
512
#if __AVX512VNNI__ || __AVXVNNI__
513
513
__m128i _t0 = _mm_unpacklo_epi32 (_r01, _r23);
You can’t perform that action at this time.
0 commit comments