cast ambiguous _mm_set1_epiNN() constants

author Johann <johannkoenig@google.com>

Tue, 30 Apr 2019 19:26:18 +0000 (12:26 -0700)

committer Johann <johannkoenig@google.com>

Tue, 30 Apr 2019 19:44:51 +0000 (12:44 -0700)
author Johann <johannkoenig@google.com>
Tue, 30 Apr 2019 19:26:18 +0000 (12:26 -0700)
committer Johann <johannkoenig@google.com>
Tue, 30 Apr 2019 19:44:51 +0000 (12:44 -0700)
diff --git a/vp9/encoder/x86/vp9_diamond_search_sad_avx.c b/vp9/encoder/x86/vp9_diamond_search_sad_avx.c

index 2f3c66c0835cf0d8d9253ee1ff6e2e9fa9c6074a..aa46c5889d3a884683e539fe58b6b2abd312fe76 100644 (file)
--- a/vp9/encoder/x86/vp9_diamond_search_sad_avx.c
+++ b/vp9/encoder/x86/vp9_diamond_search_sad_avx.c
@@ -160,7 +160,7 @@ int vp9_diamond_search_sad_avx(const MACROBLOCK *x,
        }
  
        // The inverse mask indicates which of the MVs are outside
-      v_outside_d = _mm_xor_si128(v_inside_d, _mm_set1_epi8(0xff));
+      v_outside_d = _mm_xor_si128(v_inside_d, _mm_set1_epi8((int8_t)0xff));
        // Shift right to keep the sign bit clear, we will use this later
        // to set the cost to the maximum value.
        v_outside_d = _mm_srli_epi32(v_outside_d, 1);
diff --git a/vp9/encoder/x86/vp9_highbd_block_error_intrin_sse2.c b/vp9/encoder/x86/vp9_highbd_block_error_intrin_sse2.c

index af04b6c524bb06250cb2811aa5b75701c2020e1e..d7aafe7b011ead1cd217fa9807672e550d781f4e 100644 (file)
--- a/vp9/encoder/x86/vp9_highbd_block_error_intrin_sse2.c
+++ b/vp9/encoder/x86/vp9_highbd_block_error_intrin_sse2.c
@@ -32,7 +32,7 @@ int64_t vp9_highbd_block_error_sse2(const tran_low_t *coeff,
      __m128i mm_dqcoeff2 = _mm_load_si128((const __m128i *)(dqcoeff + i + 4));
      // Check if any values require more than 15 bit
      max = _mm_set1_epi32(0x3fff);
-    min = _mm_set1_epi32(0xffffc000);
+    min = _mm_set1_epi32((int32_t)0xffffc000);
      cmp0 = _mm_xor_si128(_mm_cmpgt_epi32(mm_coeff, max),
                           _mm_cmplt_epi32(mm_coeff, min));
      cmp1 = _mm_xor_si128(_mm_cmpgt_epi32(mm_coeff2, max),
diff --git a/vpx_dsp/x86/fwd_txfm_impl_sse2.h b/vpx_dsp/x86/fwd_txfm_impl_sse2.h

index fd28d0d559d3cc58fd8a0b5216a3a1dea8e39356..d546f02a148fe8a43946c6538d984408eedb5049 100644 (file)
--- a/vpx_dsp/x86/fwd_txfm_impl_sse2.h
+++ b/vpx_dsp/x86/fwd_txfm_impl_sse2.h
@@ -93,9 +93,9 @@ void FDCT4x4_2D(const int16_t *input, tran_low_t *output, int stride) {
  #if DCT_HIGH_BIT_DEPTH
    // Check inputs small enough to use optimised code
    cmp0 = _mm_xor_si128(_mm_cmpgt_epi16(in0, _mm_set1_epi16(0x3ff)),
-                       _mm_cmplt_epi16(in0, _mm_set1_epi16(0xfc00)));
+                       _mm_cmplt_epi16(in0, _mm_set1_epi16((int16_t)0xfc00)));
    cmp1 = _mm_xor_si128(_mm_cmpgt_epi16(in1, _mm_set1_epi16(0x3ff)),
-                       _mm_cmplt_epi16(in1, _mm_set1_epi16(0xfc00)));
+                       _mm_cmplt_epi16(in1, _mm_set1_epi16((int16_t)0xfc00)));
    test = _mm_movemask_epi8(_mm_or_si128(cmp0, cmp1));
    if (test) {
      vpx_highbd_fdct4x4_c(input, output, stride);
diff --git a/vpx_dsp/x86/highbd_loopfilter_sse2.c b/vpx_dsp/x86/highbd_loopfilter_sse2.c

index f7fb40d5159f8dce875e07a110dd404a2be45802..d265fc1a92176cb0c0638f4008b178474ebf5d1d 100644 (file)
--- a/vpx_dsp/x86/highbd_loopfilter_sse2.c
+++ b/vpx_dsp/x86/highbd_loopfilter_sse2.c
@@ -764,8 +764,8 @@ void vpx_highbd_lpf_horizontal_4_sse2(uint16_t *s, int pitch,
      limit_v = _mm_unpacklo_epi8(_mm_load_si128((const __m128i *)limit), zero);
      thresh_v = _mm_unpacklo_epi8(_mm_load_si128((const __m128i *)thresh), zero);
      t80 = _mm_set1_epi16(0x80);
-    tff80 = _mm_set1_epi16(0xff80);
-    tffe0 = _mm_set1_epi16(0xffe0);
+    tff80 = _mm_set1_epi16((int16_t)0xff80);
+    tffe0 = _mm_set1_epi16((int16_t)0xffe0);
      t1f = _mm_srli_epi16(_mm_set1_epi16(0x1fff), 8);
      t7f = _mm_srli_epi16(_mm_set1_epi16(0x7fff), 8);
    } else if (bd == 10) {
@@ -776,8 +776,8 @@ void vpx_highbd_lpf_horizontal_4_sse2(uint16_t *s, int pitch,
      thresh_v = _mm_slli_epi16(
          _mm_unpacklo_epi8(_mm_load_si128((const __m128i *)thresh), zero), 2);
      t80 = _mm_slli_epi16(_mm_set1_epi16(0x80), 2);
-    tff80 = _mm_slli_epi16(_mm_set1_epi16(0xff80), 2);
-    tffe0 = _mm_slli_epi16(_mm_set1_epi16(0xffe0), 2);
+    tff80 = _mm_slli_epi16(_mm_set1_epi16((int16_t)0xff80), 2);
+    tffe0 = _mm_slli_epi16(_mm_set1_epi16((int16_t)0xffe0), 2);
      t1f = _mm_srli_epi16(_mm_set1_epi16(0x1fff), 6);
      t7f = _mm_srli_epi16(_mm_set1_epi16(0x7fff), 6);
    } else {  // bd == 12
@@ -788,8 +788,8 @@ void vpx_highbd_lpf_horizontal_4_sse2(uint16_t *s, int pitch,
      thresh_v = _mm_slli_epi16(
          _mm_unpacklo_epi8(_mm_load_si128((const __m128i *)thresh), zero), 4);
      t80 = _mm_slli_epi16(_mm_set1_epi16(0x80), 4);
-    tff80 = _mm_slli_epi16(_mm_set1_epi16(0xff80), 4);
-    tffe0 = _mm_slli_epi16(_mm_set1_epi16(0xffe0), 4);
+    tff80 = _mm_slli_epi16(_mm_set1_epi16((int16_t)0xff80), 4);
+    tffe0 = _mm_slli_epi16(_mm_set1_epi16((int16_t)0xffe0), 4);
      t1f = _mm_srli_epi16(_mm_set1_epi16(0x1fff), 4);
      t7f = _mm_srli_epi16(_mm_set1_epi16(0x7fff), 4);
    }
diff --git a/vpx_dsp/x86/loopfilter_avx2.c b/vpx_dsp/x86/loopfilter_avx2.c

index 85a7314269d6b41b6e25a38f59e8e3f780bfdfd9..be391992af88be9f959a16c5124637c416a0cc4a 100644 (file)
--- a/vpx_dsp/x86/loopfilter_avx2.c
+++ b/vpx_dsp/x86/loopfilter_avx2.c
@@ -52,7 +52,7 @@ void vpx_lpf_horizontal_16_avx2(unsigned char *s, int pitch,
      abs_p1p0 =
          _mm_or_si128(_mm_subs_epu8(q1p1, q0p0), _mm_subs_epu8(q0p0, q1p1));
      abs_q1q0 = _mm_srli_si128(abs_p1p0, 8);
-    fe = _mm_set1_epi8(0xfe);
+    fe = _mm_set1_epi8((int8_t)0xfe);
      ff = _mm_cmpeq_epi8(abs_p1p0, abs_p1p0);
      abs_p0q0 =
          _mm_or_si128(_mm_subs_epu8(q0p0, p0q0), _mm_subs_epu8(p0q0, q0p0));
@@ -84,7 +84,7 @@ void vpx_lpf_horizontal_16_avx2(unsigned char *s, int pitch,
    {
      const __m128i t4 = _mm_set1_epi8(4);
      const __m128i t3 = _mm_set1_epi8(3);
-    const __m128i t80 = _mm_set1_epi8(0x80);
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);
      const __m128i t1 = _mm_set1_epi16(0x1);
      __m128i qs1ps1 = _mm_xor_si128(q1p1, t80);
      __m128i qs0ps0 = _mm_xor_si128(q0p0, t80);
@@ -423,7 +423,7 @@ void vpx_lpf_horizontal_16_dual_avx2(unsigned char *s, int pitch,
          _mm_or_si128(_mm_subs_epu8(p1, p0), _mm_subs_epu8(p0, p1));
      const __m128i abs_q1q0 =
          _mm_or_si128(_mm_subs_epu8(q1, q0), _mm_subs_epu8(q0, q1));
-    const __m128i fe = _mm_set1_epi8(0xfe);
+    const __m128i fe = _mm_set1_epi8((int8_t)0xfe);
      const __m128i ff = _mm_cmpeq_epi8(abs_p1p0, abs_p1p0);
      __m128i abs_p0q0 =
          _mm_or_si128(_mm_subs_epu8(p0, q0), _mm_subs_epu8(q0, p0));
@@ -458,8 +458,8 @@ void vpx_lpf_horizontal_16_dual_avx2(unsigned char *s, int pitch,
    {
      const __m128i t4 = _mm_set1_epi8(4);
      const __m128i t3 = _mm_set1_epi8(3);
-    const __m128i t80 = _mm_set1_epi8(0x80);
-    const __m128i te0 = _mm_set1_epi8(0xe0);
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);
+    const __m128i te0 = _mm_set1_epi8((int8_t)0xe0);
      const __m128i t1f = _mm_set1_epi8(0x1f);
      const __m128i t1 = _mm_set1_epi8(0x1);
      const __m128i t7f = _mm_set1_epi8(0x7f);
diff --git a/vpx_dsp/x86/loopfilter_sse2.c b/vpx_dsp/x86/loopfilter_sse2.c

index 20dcb0d225e130683743c3371913f2de1fb8b34b..f90522cd7d08d524f65d7c14a484594e3d026127 100644 (file)
--- a/vpx_dsp/x86/loopfilter_sse2.c
+++ b/vpx_dsp/x86/loopfilter_sse2.c
@@ -61,7 +61,7 @@ static INLINE __m128i abs_diff(__m128i a, __m128i b) {
    do {                                                                      \
      const __m128i t3t4 =                                                    \
          _mm_set_epi8(3, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4, 4, 4, 4, 4, 4);       \
-    const __m128i t80 = _mm_set1_epi8(0x80);                                \
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);                        \
      __m128i filter, filter2filter1, work;                                   \
                                                                              \
      ps1ps0 = _mm_xor_si128(p1p0, t80); /* ^ 0x80 */                         \
@@ -263,7 +263,7 @@ void vpx_lpf_horizontal_16_sse2(unsigned char *s, int pitch,
      __m128i abs_p1q1, abs_p0q0, abs_q1q0, fe, ff, work;
      abs_p1p0 = abs_diff(q1p1, q0p0);
      abs_q1q0 = _mm_srli_si128(abs_p1p0, 8);
-    fe = _mm_set1_epi8(0xfe);
+    fe = _mm_set1_epi8((int8_t)0xfe);
      ff = _mm_cmpeq_epi8(abs_p1p0, abs_p1p0);
      abs_p0q0 = abs_diff(q0p0, p0q0);
      abs_p1q1 = abs_diff(q1p1, p1q1);
@@ -291,7 +291,7 @@ void vpx_lpf_horizontal_16_sse2(unsigned char *s, int pitch,
    {
      const __m128i t4 = _mm_set1_epi8(4);
      const __m128i t3 = _mm_set1_epi8(3);
-    const __m128i t80 = _mm_set1_epi8(0x80);
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);
      const __m128i t1 = _mm_set1_epi16(0x1);
      __m128i qs1ps1 = _mm_xor_si128(q1p1, t80);
      __m128i qs0ps0 = _mm_xor_si128(q0p0, t80);
@@ -628,7 +628,7 @@ void vpx_lpf_horizontal_16_dual_sse2(unsigned char *s, int pitch,
    {
      const __m128i abs_p1p0 = abs_diff(p1, p0);
      const __m128i abs_q1q0 = abs_diff(q1, q0);
-    const __m128i fe = _mm_set1_epi8(0xfe);
+    const __m128i fe = _mm_set1_epi8((int8_t)0xfe);
      const __m128i ff = _mm_cmpeq_epi8(zero, zero);
      __m128i abs_p0q0 = abs_diff(p0, q0);
      __m128i abs_p1q1 = abs_diff(p1, q1);
@@ -677,8 +677,8 @@ void vpx_lpf_horizontal_16_dual_sse2(unsigned char *s, int pitch,
    {
      const __m128i t4 = _mm_set1_epi8(4);
      const __m128i t3 = _mm_set1_epi8(3);
-    const __m128i t80 = _mm_set1_epi8(0x80);
-    const __m128i te0 = _mm_set1_epi8(0xe0);
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);
+    const __m128i te0 = _mm_set1_epi8((int8_t)0xe0);
      const __m128i t1f = _mm_set1_epi8(0x1f);
      const __m128i t1 = _mm_set1_epi8(0x1);
      const __m128i t7f = _mm_set1_epi8(0x7f);
@@ -954,7 +954,7 @@ void vpx_lpf_horizontal_8_sse2(unsigned char *s, int pitch,
    {
      // filter_mask and hev_mask
      const __m128i one = _mm_set1_epi8(1);
-    const __m128i fe = _mm_set1_epi8(0xfe);
+    const __m128i fe = _mm_set1_epi8((int8_t)0xfe);
      const __m128i ff = _mm_cmpeq_epi8(fe, fe);
      __m128i abs_p1q1, abs_p0q0, abs_q1q0, abs_p1p0, work;
      abs_p1p0 = abs_diff(q1p1, q0p0);
@@ -1054,7 +1054,7 @@ void vpx_lpf_horizontal_8_sse2(unsigned char *s, int pitch,
    {
      const __m128i t4 = _mm_set1_epi8(4);
      const __m128i t3 = _mm_set1_epi8(3);
-    const __m128i t80 = _mm_set1_epi8(0x80);
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);
      const __m128i t1 = _mm_set1_epi8(0x1);
      const __m128i ps1 =
          _mm_xor_si128(_mm_loadl_epi64((__m128i *)(s - 2 * pitch)), t80);
@@ -1180,7 +1180,7 @@ void vpx_lpf_horizontal_8_dual_sse2(
      const __m128i abs_q1q0 =
          _mm_or_si128(_mm_subs_epu8(q1, q0), _mm_subs_epu8(q0, q1));
      const __m128i one = _mm_set1_epi8(1);
-    const __m128i fe = _mm_set1_epi8(0xfe);
+    const __m128i fe = _mm_set1_epi8((int8_t)0xfe);
      const __m128i ff = _mm_cmpeq_epi8(abs_p1p0, abs_p1p0);
      __m128i abs_p0q0 =
          _mm_or_si128(_mm_subs_epu8(p0, q0), _mm_subs_epu8(q0, p0));
@@ -1292,8 +1292,8 @@ void vpx_lpf_horizontal_8_dual_sse2(
    {
      const __m128i t4 = _mm_set1_epi8(4);
      const __m128i t3 = _mm_set1_epi8(3);
-    const __m128i t80 = _mm_set1_epi8(0x80);
-    const __m128i te0 = _mm_set1_epi8(0xe0);
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);
+    const __m128i te0 = _mm_set1_epi8((int8_t)0xe0);
      const __m128i t1f = _mm_set1_epi8(0x1f);
      const __m128i t1 = _mm_set1_epi8(0x1);
      const __m128i t7f = _mm_set1_epi8(0x7f);
@@ -1425,7 +1425,7 @@ void vpx_lpf_horizontal_4_dual_sse2(unsigned char *s, int pitch,
          _mm_or_si128(_mm_subs_epu8(p1, p0), _mm_subs_epu8(p0, p1));
      const __m128i abs_q1q0 =
          _mm_or_si128(_mm_subs_epu8(q1, q0), _mm_subs_epu8(q0, q1));
-    const __m128i fe = _mm_set1_epi8(0xfe);
+    const __m128i fe = _mm_set1_epi8((int8_t)0xfe);
      const __m128i ff = _mm_cmpeq_epi8(abs_p1p0, abs_p1p0);
      __m128i abs_p0q0 =
          _mm_or_si128(_mm_subs_epu8(p0, q0), _mm_subs_epu8(q0, p0));
@@ -1461,8 +1461,8 @@ void vpx_lpf_horizontal_4_dual_sse2(unsigned char *s, int pitch,
    {
      const __m128i t4 = _mm_set1_epi8(4);
      const __m128i t3 = _mm_set1_epi8(3);
-    const __m128i t80 = _mm_set1_epi8(0x80);
-    const __m128i te0 = _mm_set1_epi8(0xe0);
+    const __m128i t80 = _mm_set1_epi8((int8_t)0x80);
+    const __m128i te0 = _mm_set1_epi8((int8_t)0xe0);
      const __m128i t1f = _mm_set1_epi8(0x1f);
      const __m128i t1 = _mm_set1_epi8(0x1);
      const __m128i t7f = _mm_set1_epi8(0x7f);
author	Johann <johannkoenig@google.com>
	Tue, 30 Apr 2019 19:26:18 +0000 (12:26 -0700)
committer	Johann <johannkoenig@google.com>
	Tue, 30 Apr 2019 19:44:51 +0000 (12:44 -0700)
vp9/encoder/x86/vp9_diamond_search_sad_avx.c		patch \| blob \| history
vp9/encoder/x86/vp9_highbd_block_error_intrin_sse2.c		patch \| blob \| history
vpx_dsp/x86/fwd_txfm_impl_sse2.h		patch \| blob \| history
vpx_dsp/x86/highbd_loopfilter_sse2.c		patch \| blob \| history
vpx_dsp/x86/loopfilter_avx2.c		patch \| blob \| history
vpx_dsp/x86/loopfilter_sse2.c		patch \| blob \| history