Skip to content

Commit

Permalink
fix build
Browse files (browse the repository at this point in the history)
  • Loading branch information
nihui committed Jul 16, 2023
1 parent ea67d1b commit d31a804
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions src/layer/x86/convolution_packed_int8.h
Original file line number Diff line number Diff line change
@@ -633,10 +633,10 @@ static void convolution_transform_kernel_packed_int8(const Mat& kernel, Mat& ker
{
#if __AVX512F__
__m128i _w0 = _mm_cvtepi32_epi8(_mm_i32gather_epi32((const int*)(kptr0 + k), _vindex, sizeof(signed char)));
- _mm_storeu_si32(g00, _w0);
+ _mm_store_ss((float*)g00, _mm_castsi128_ps(_w0));
#elif __AVX2__
__m128i _w0 = _mm_shuffle_epi8(_mm_i32gather_epi32((const int*)(kptr0 + k), _vindex, sizeof(signed char)), _sindex8);
- _mm_storeu_si32(g00, _w0);
+ _mm_store_ss((float*)g00, _mm_castsi128_ps(_w0));
#else
const signed char* k0 = kptr0 + k;
const signed char* k1 = kptr1 + k;
@@ -757,10 +757,10 @@ static void convolution_transform_kernel_packed_int8(const Mat& kernel, Mat& ker
{
#if __AVX512F__
__m128i _w0 = _mm_cvtepi32_epi8(_mm_i32gather_epi32((const int*)(kptr0 + k), _vindex, sizeof(signed char)));
- _mm_storeu_si32(g00, _w0);
+ _mm_store_ss((float*)g00, _mm_castsi128_ps(_w0));
#elif __AVX2__
__m128i _w0 = _mm_shuffle_epi8(_mm_i32gather_epi32((const int*)(kptr0 + k), _vindex, sizeof(signed char)), _sindex8);
- _mm_storeu_si32(g00, _w0);
+ _mm_store_ss((float*)g00, _mm_castsi128_ps(_w0));
#else
const signed char* k0 = kptr0 + k;
const signed char* k1 = kptr1 + k;
Expand Down

0 comments on commit d31a804

Please sign in to comment.