Skip to content

Commit

Permalink
a
Browse files Browse the repository at this point in the history
  • Loading branch information
nihui committed Dec 12, 2024
1 parent 82f1a2b commit 494f042
Showing 1 changed file with 6 additions and 6 deletions.
12 changes: 6 additions & 6 deletions src/layer/x86/gemm_int8.h
Original file line number Diff line number Diff line change
Expand Up @@ -1403,7 +1403,7 @@ static void pack_A_tile_fp32_to_int8(const Mat& A, Mat& AT, int i, int max_ii, i
{
const float* p0 = (const float*)A + (i + ii) * A_hstep + k * elempack;

- __m512 _scales = _mm512_loadu_ps((const float*)scales + i + ii);
+ __m512 _scales = _mm512_load_ps((const float*)scales + i + ii);
#if __AVX512VNNI__
__m512i _v127 = _mm512_set1_epi8(127);
#endif // __AVX512VNNI__
Expand Down Expand Up @@ -1775,7 +1775,7 @@ static void pack_A_tile_fp32_to_int8(const Mat& A, Mat& AT, int i, int max_ii, i
{
const float* p0 = (const float*)A + (i + ii) * A_hstep + k * elempack;

- __m256 _scales = _mm256_loadu_ps((const float*)scales + i + ii);
+ __m256 _scales = _mm256_load_ps((const float*)scales + i + ii);
#if __AVX512VNNI__ || __AVXVNNI__
__m256i _v127 = _mm256_set1_epi8(127);
#endif // __AVX512VNNI__ || __AVXVNNI__
Expand Down Expand Up @@ -2099,7 +2099,7 @@ static void pack_A_tile_fp32_to_int8(const Mat& A, Mat& AT, int i, int max_ii, i
{
const float* p0 = (const float*)A + (i + ii) * A_hstep + k * elempack;

- __m128 _scales = _mm_loadu_ps((const float*)scales + i + ii);
+ __m128 _scales = _mm_load_ps((const float*)scales + i + ii);
#if __AVX512VNNI__ || __AVXVNNI__
__m128i _v127 = _mm_set1_epi8(127);
#endif // __AVX512VNNI__ || __AVXVNNI__
Expand Down Expand Up @@ -3144,7 +3144,7 @@ static void transpose_pack_A_tile_fp32_to_int8(const Mat& A, Mat& AT, int i, int
{
const float* p0 = (const float*)A + k * A_hstep + (i + ii) * elempack;

- __m512 _scales = _mm512_loadu_ps((const float*)scales + i + ii);
+ __m512 _scales = _mm512_load_ps((const float*)scales + i + ii);
#if __AVX512VNNI__
__m512i _v127 = _mm512_set1_epi8(127);
#endif
Expand Down Expand Up @@ -3604,7 +3604,7 @@ static void transpose_pack_A_tile_fp32_to_int8(const Mat& A, Mat& AT, int i, int
{
const float* p0 = (const float*)A + k * A_hstep + (i + ii) * elempack;

- __m256 _scales = _mm256_loadu_ps((const float*)scales + i + ii);
+ __m256 _scales = _mm256_load_ps((const float*)scales + i + ii);
#if __AVX512VNNI__ || __AVXVNNI__
__m256i _v127 = _mm256_set1_epi8(127);
#endif // __AVX512VNNI__ || __AVXVNNI__
Expand Down Expand Up @@ -4221,7 +4221,7 @@ static void transpose_pack_A_tile_fp32_to_int8(const Mat& A, Mat& AT, int i, int
}
if (elempack == 1)
{
- __m128 _scales = _mm_loadu_ps((const float*)scales + i + ii);
+ __m128 _scales = _mm_load_ps((const float*)scales + i + ii);

int kk = 0;
#if __AVX512VNNI__ || __AVXVNNI__
Expand Down

0 comments on commit 494f042

Please sign in to comment.