mem_sse2.h: storeu_uint32 -> storeu_int32

author James Zern <jzern@google.com>
Sat, 6 Nov 2021 23:43:11 +0000 (16:43 -0700)
committer James Zern <jzern@google.com>
Mon, 8 Nov 2021 21:43:09 +0000 (13:43 -0800)
diff --git a/vp8/common/x86/bilinear_filter_sse2.c b/vp8/common/x86/bilinear_filter_sse2.c

index 9bf65d8045e89d7514ab389673d8eab7455d86f3..ff6cbbd68c55ec64f72b5e3b4edafe60de42ff69 100644 (file)
--- a/vp8/common/x86/bilinear_filter_sse2.c
+++ b/vp8/common/x86/bilinear_filter_sse2.c
@@ -313,10 +313,10 @@ static INLINE void vertical_4x4(uint16_t *src, uint8_t *dst, const int stride,
        const __m128i compensated = _mm_add_epi16(sum, round_factor);
        const __m128i shifted = _mm_srai_epi16(compensated, VP8_FILTER_SHIFT);
        __m128i packed = _mm_packus_epi16(shifted, shifted);
-      storeu_uint32(dst, _mm_cvtsi128_si32(packed));
+      storeu_int32(dst, _mm_cvtsi128_si32(packed));
        packed = _mm_srli_si128(packed, 4);
        dst += stride;
-      storeu_uint32(dst, _mm_cvtsi128_si32(packed));
+      storeu_int32(dst, _mm_cvtsi128_si32(packed));
        dst += stride;
        src += 8;
      }
diff --git a/vpx_dsp/x86/loopfilter_sse2.c b/vpx_dsp/x86/loopfilter_sse2.c

index b6ff24834b9826434fcab212953939ab3b588ce2..347c9fdbe900f83cb82486683c2b288b1022c69b 100644 (file)
--- a/vpx_dsp/x86/loopfilter_sse2.c
+++ b/vpx_dsp/x86/loopfilter_sse2.c
@@ -211,21 +211,21 @@ void vpx_lpf_vertical_4_sse2(uint8_t *s, int pitch, const uint8_t *blimit,
    // 00 10 20 30 01 11 21 31  02 12 22 32 03 13 23 33
    ps1ps0 = _mm_unpacklo_epi8(ps1ps0, x0);
  
-  storeu_uint32(s + 0 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
+  storeu_int32(s + 0 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
    ps1ps0 = _mm_srli_si128(ps1ps0, 4);
-  storeu_uint32(s + 1 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
+  storeu_int32(s + 1 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
    ps1ps0 = _mm_srli_si128(ps1ps0, 4);
-  storeu_uint32(s + 2 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
+  storeu_int32(s + 2 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
    ps1ps0 = _mm_srli_si128(ps1ps0, 4);
-  storeu_uint32(s + 3 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
+  storeu_int32(s + 3 * pitch - 2, _mm_cvtsi128_si32(ps1ps0));
  
-  storeu_uint32(s + 4 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
+  storeu_int32(s + 4 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
    qs1qs0 = _mm_srli_si128(qs1qs0, 4);
-  storeu_uint32(s + 5 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
+  storeu_int32(s + 5 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
    qs1qs0 = _mm_srli_si128(qs1qs0, 4);
-  storeu_uint32(s + 6 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
+  storeu_int32(s + 6 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
    qs1qs0 = _mm_srli_si128(qs1qs0, 4);
-  storeu_uint32(s + 7 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
+  storeu_int32(s + 7 * pitch - 2, _mm_cvtsi128_si32(qs1qs0));
  }
  
  void vpx_lpf_horizontal_16_sse2(unsigned char *s, int pitch,
diff --git a/vpx_dsp/x86/mem_sse2.h b/vpx_dsp/x86/mem_sse2.h

index 258ab38e606ea770c56842e2ac5353d529b5a183..75fa2b0b72a6bb49a7efe7707af144dfa406400a 100644 (file)
--- a/vpx_dsp/x86/mem_sse2.h
+++ b/vpx_dsp/x86/mem_sse2.h
@@ -16,7 +16,7 @@
  
  #include "./vpx_config.h"
  
-static INLINE void storeu_uint32(void *dst, uint32_t v) {
+static INLINE void storeu_int32(void *dst, int32_t v) {
    memcpy(dst, &v, sizeof(v));
  }
author	James Zern <jzern@google.com>
	Sat, 6 Nov 2021 23:43:11 +0000 (16:43 -0700)
committer	James Zern <jzern@google.com>
	Mon, 8 Nov 2021 21:43:09 +0000 (13:43 -0800)
vp8/common/x86/bilinear_filter_sse2.c		patch | blob | history
vpx_dsp/x86/loopfilter_sse2.c		patch | blob | history
vpx_dsp/x86/mem_sse2.h		patch | blob | history