diff options
author | Jean-Marc Valin <jmvalin@jmvalin.ca> | 2023-10-08 00:45:39 +0300 |
---|---|---|
committer | Jean-Marc Valin <jmvalin@jmvalin.ca> | 2023-10-08 00:45:39 +0300 |
commit | 81624caf9ceb452fa8f909dcd8ad14511136da87 (patch) | |
tree | fe6cf26a9cd3f372f98bdc06d559c1544f294473 /celt | |
parent | 0563d71b255c2ef0cb65aab706ecbd44e0328c8d (diff) |
Silencing alignment warnings on x86 intrinsics
Those intrinsics don't actually require alignment, so we're OK.
Diffstat (limited to 'celt')
-rw-r--r-- | celt/x86/pitch_avx.c | 2 | ||||
-rw-r--r-- | celt/x86/vq_sse2.c | 8 | ||||
-rw-r--r-- | celt/x86/x86cpu.h | 2 |
3 files changed, 6 insertions, 6 deletions
diff --git a/celt/x86/pitch_avx.c b/celt/x86/pitch_avx.c index 1a667dd7..63dea97f 100644 --- a/celt/x86/pitch_avx.c +++ b/celt/x86/pitch_avx.c @@ -56,7 +56,7 @@ static void xcorr_kernel_avx(const float *x, const float *y, float sum[8], int l if (i != len) { static const int mask[15] = {-1, -1, -1, -1, -1, -1, -1, 0, 0, 0, 0, 0, 0, 0, 0}; __m256i m; - m = _mm256_loadu_si256((__m256i*)(mask + 7+i-len)); + m = _mm256_loadu_si256((__m256i*)(void*)(mask + 7+i-len)); x0 = _mm256_maskload_ps(x+i, m); xsum0 = _mm256_fmadd_ps(x0, _mm256_maskload_ps(y+i , m), xsum0); xsum1 = _mm256_fmadd_ps(x0, _mm256_maskload_ps(y+i+1, m), xsum1); diff --git a/celt/x86/vq_sse2.c b/celt/x86/vq_sse2.c index 77504286..4c4ebf8e 100644 --- a/celt/x86/vq_sse2.c +++ b/celt/x86/vq_sse2.c @@ -75,7 +75,7 @@ opus_val16 op_pvq_search_sse2(celt_norm *_X, int *iy, int K, int N, int arch) sums = _mm_add_ps(sums, x4); /* Clear y and iy in case we don't do the projection. */ _mm_storeu_ps(&y[j], _mm_setzero_ps()); - _mm_storeu_si128((__m128i*)&iy[j], _mm_setzero_si128()); + _mm_storeu_si128((__m128i*)(void*)&iy[j], _mm_setzero_si128()); _mm_storeu_ps(&X[j], x4); _mm_storeu_ps(&signy[j], s4); } @@ -116,7 +116,7 @@ opus_val16 op_pvq_search_sse2(celt_norm *_X, int *iy, int K, int N, int arch) rx4 = _mm_mul_ps(x4, rcp4); iy4 = _mm_cvttps_epi32(rx4); pulses_sum = _mm_add_epi32(pulses_sum, iy4); - _mm_storeu_si128((__m128i*)&iy[j], iy4); + _mm_storeu_si128((__m128i*)(void*)&iy[j], iy4); y4 = _mm_cvtepi32_ps(iy4); xy4 = _mm_add_ps(xy4, _mm_mul_ps(x4, y4)); yy4 = _mm_add_ps(yy4, _mm_mul_ps(y4, y4)); @@ -205,10 +205,10 @@ opus_val16 op_pvq_search_sse2(celt_norm *_X, int *iy, int K, int N, int arch) { __m128i y4; __m128i s4; - y4 = _mm_loadu_si128((__m128i*)&iy[j]); + y4 = _mm_loadu_si128((__m128i*)(void*)&iy[j]); s4 = _mm_castps_si128(_mm_loadu_ps(&signy[j])); y4 = _mm_xor_si128(_mm_add_epi32(y4, s4), s4); - _mm_storeu_si128((__m128i*)&iy[j], y4); + _mm_storeu_si128((__m128i*)(void*)&iy[j], y4); } RESTORE_STACK; 
return yy; diff --git a/celt/x86/x86cpu.h b/celt/x86/x86cpu.h index 8bd69551..fe46d1d9 100644 --- a/celt/x86/x86cpu.h +++ b/celt/x86/x86cpu.h @@ -68,6 +68,6 @@ int opus_select_arch(void); (_mm_cvtepi8_epi32(_mm_cvtsi32_si128(OP_LOADU_EPI32(x)))) #define OP_CVTEPI16_EPI32_M64(x) \ - (_mm_cvtepi16_epi32(_mm_loadl_epi64((__m128i *)(x)))) + (_mm_cvtepi16_epi32(_mm_loadl_epi64((__m128i *)(void*)(x)))) #endif |