Giving consistent names to IDCT/IWHT functions.

author Dmitry Kovalev <dkovalev@google.com>

Fri, 4 Oct 2013 21:17:06 +0000 (14:17 -0700)

committer Dmitry Kovalev <dkovalev@google.com>

Fri, 4 Oct 2013 21:17:06 +0000 (14:17 -0700)
author Dmitry Kovalev <dkovalev@google.com>
Fri, 4 Oct 2013 21:17:06 +0000 (14:17 -0700)
committer Dmitry Kovalev <dkovalev@google.com>
Fri, 4 Oct 2013 21:17:06 +0000 (14:17 -0700)
diff --git a/test/fdct4x4_test.cc b/test/fdct4x4_test.cc

index ea40ca62aeae7de2858ea6aca8625cb2a130f78e..d34c79112360f4d57472f1bb68c8552a456d4819 100644 (file)
--- a/test/fdct4x4_test.cc
+++ b/test/fdct4x4_test.cc
@@ -31,7 +31,7 @@ void fdct4x4(int16_t *in, int16_t *out, uint8_t* /*dst*/,
  }
  void idct4x4_add(int16_t* /*in*/, int16_t *out, uint8_t *dst,
                   int stride, int /*tx_type*/) {
-  vp9_short_idct4x4_add_c(out, dst, stride >> 1);
+  vp9_idct4x4_16_add_c(out, dst, stride >> 1);
  }
  void fht4x4(int16_t *in, int16_t *out, uint8_t* /*dst*/,
              int stride, int tx_type) {
diff --git a/vp9/common/arm/neon/vp9_short_idct4x4_1_add_neon.asm b/vp9/common/arm/neon/vp9_short_idct4x4_1_add_neon.asm

index 869ee5f3f6aea6b975ec5aaf794d21f6c9e10629..0d4a721c4d329dc3c289659883097df2a2657af4 100644 (file)
--- a/vp9/common/arm/neon/vp9_short_idct4x4_1_add_neon.asm
+++ b/vp9/common/arm/neon/vp9_short_idct4x4_1_add_neon.asm
@@ -8,21 +8,21 @@
  ;
  
  
-    EXPORT  |vp9_short_idct4x4_1_add_neon|
+    EXPORT  |vp9_idct4x4_1_add_neon|
      ARM
      REQUIRE8
      PRESERVE8
  
      AREA ||.text||, CODE, READONLY, ALIGN=2
  
-;void vp9_short_idct4x4_1_add_neon(int16_t *input, uint8_t *dest,
+;void vp9_idct4x4_1_add_neon(int16_t *input, uint8_t *dest,
  ;                                  int dest_stride)
  ;
  ; r0  int16_t input
  ; r1  uint8_t *dest
  ; r2  int dest_stride)
  
-|vp9_short_idct4x4_1_add_neon| PROC
+|vp9_idct4x4_1_add_neon| PROC
      ldrsh            r0, [r0]
  
      ; generate cospi_16_64 = 11585
@@ -63,6 +63,6 @@
      vst1.32          {d7[1]}, [r12]
  
      bx               lr
-    ENDP             ; |vp9_short_idct4x4_1_add_neon|
+    ENDP             ; |vp9_idct4x4_1_add_neon|
  
      END
diff --git a/vp9/common/arm/neon/vp9_short_idct4x4_add_neon.asm b/vp9/common/arm/neon/vp9_short_idct4x4_add_neon.asm

index 640fb93569cd19674e22eab4ed7dc1aaff37b534..00283fc8d780b2c19fafcca398b2f0a2eed4c604 100644 (file)
--- a/vp9/common/arm/neon/vp9_short_idct4x4_add_neon.asm
+++ b/vp9/common/arm/neon/vp9_short_idct4x4_add_neon.asm
@@ -8,7 +8,7 @@
  ;  be found in the AUTHORS file in the root of the source tree.
  ;
  
-    EXPORT  |vp9_short_idct4x4_add_neon|
+    EXPORT  |vp9_idct4x4_16_add_neon|
      ARM
      REQUIRE8
      PRESERVE8
@@ -16,13 +16,13 @@
      AREA ||.text||, CODE, READONLY, ALIGN=2
  
      AREA     Block, CODE, READONLY ; name this block of code
-;void vp9_short_idct4x4_add_neon(int16_t *input, uint8_t *dest, int dest_stride)
+;void vp9_idct4x4_16_add_neon(int16_t *input, uint8_t *dest, int dest_stride)
  ;
  ; r0  int16_t input
  ; r1  uint8_t *dest
  ; r2  int dest_stride)
  
-|vp9_short_idct4x4_add_neon| PROC
+|vp9_idct4x4_16_add_neon| PROC
  
      ; The 2D transform is done with two passes which are actually pretty
      ; similar. We first transform the rows. This is done by transposing
@@ -185,6 +185,6 @@
      vst1.32 {d26[1]}, [r1], r2
      vst1.32 {d26[0]}, [r1]  ; no post-increment
      bx              lr
-    ENDP  ; |vp9_short_idct4x4_add_neon|
+    ENDP  ; |vp9_idct4x4_16_add_neon|
  
      END
diff --git a/vp9/common/vp9_idct.c b/vp9/common/vp9_idct.c

index 99d84c9cad16e689f77758bda0881cccdcdd21ee..46363700764d4b5b0231d9cd4570dcbec7604c82 100644 (file)
--- a/vp9/common/vp9_idct.c
+++ b/vp9/common/vp9_idct.c
@@ -18,7 +18,7 @@
  #include "vp9/common/vp9_common.h"
  #include "vp9/common/vp9_idct.h"
  
-void vp9_short_iwalsh4x4_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
+void vp9_iwht4x4_16_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
  /* 4-point reversible, orthonormal inverse Walsh-Hadamard in 3.5 adds,
     0.5 shifts per pixel. */
    int i;
@@ -70,7 +70,7 @@ void vp9_short_iwalsh4x4_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
    }
  }
  
-void vp9_short_iwalsh4x4_1_add_c(int16_t *in, uint8_t *dest, int dest_stride) {
+void vp9_iwht4x4_1_add_c(int16_t *in, uint8_t *dest, int dest_stride) {
    int i;
    int a1, e1;
    int16_t tmp[4];
@@ -116,7 +116,7 @@ void vp9_idct4_1d_c(int16_t *input, int16_t *output) {
    output[3] = step[0] - step[3];
  }
  
-void vp9_short_idct4x4_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
+void vp9_idct4x4_16_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
    int16_t out[4 * 4];
    int16_t *outptr = out;
    int i, j;
@@ -140,7 +140,7 @@ void vp9_short_idct4x4_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
    }
  }
  
-void vp9_short_idct4x4_1_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
+void vp9_idct4x4_1_add_c(int16_t *input, uint8_t *dest, int dest_stride) {
    int i;
    int a1;
    int16_t out = dct_const_round_shift(input[0] * cospi_16_64);
@@ -1286,20 +1286,19 @@ void vp9_short_idct32x32_1_add_c(int16_t *input, uint8_t *dest,
  }
  
  // idct
-void vp9_idct_add(int16_t *input, uint8_t *dest, int stride, int eob) {
+void vp9_idct4x4_add(int16_t *input, uint8_t *dest, int stride, int eob) {
    if (eob > 1)
-    vp9_short_idct4x4_add(input, dest, stride);
+    vp9_idct4x4_16_add(input, dest, stride);
    else
-    vp9_short_idct4x4_1_add(input, dest, stride);
+    vp9_idct4x4_1_add(input, dest, stride);
  }
  
  
-void vp9_idct_add_lossless(int16_t *input, uint8_t *dest, int stride,
-                             int eob) {
+void vp9_iwht4x4_add(int16_t *input, uint8_t *dest, int stride, int eob) {
    if (eob > 1)
-    vp9_short_iwalsh4x4_add(input, dest, stride);
+    vp9_iwht4x4_16_add(input, dest, stride);
    else
-    vp9_short_iwalsh4x4_1_add_c(input, dest, stride);
+    vp9_iwht4x4_1_add(input, dest, stride);
  }
  
  void vp9_idct_add_8x8(int16_t *input, uint8_t *dest, int stride, int eob) {
@@ -1348,7 +1347,7 @@ void vp9_idct_add_32x32(int16_t *input, uint8_t *dest, int stride, int eob) {
  void vp9_iht_add(TX_TYPE tx_type, int16_t *input, uint8_t *dest, int stride,
                     int eob) {
    if (tx_type == DCT_DCT)
-    vp9_idct_add(input, dest, stride, eob);
+    vp9_idct4x4_add(input, dest, stride, eob);
    else
      vp9_short_iht4x4_add(input, dest, stride, tx_type);
  }
diff --git a/vp9/common/vp9_idct.h b/vp9/common/vp9_idct.h

index 0ef905cc8e9501a2c13dfd1378cca4548f3ee376..a15b6d36f4032cad57e03557c4f4d25c06052b7d 100644 (file)
--- a/vp9/common/vp9_idct.h
+++ b/vp9/common/vp9_idct.h
@@ -88,9 +88,8 @@ typedef struct {
  } transform_2d;
  
  
-void vp9_idct_add(int16_t *input, uint8_t *dest, int stride, int eob);
-void vp9_idct_add_lossless(int16_t *input, uint8_t *dest,
-                           int stride, int eob);
+void vp9_idct4x4_add(int16_t *input, uint8_t *dest, int stride, int eob);
+void vp9_iwht4x4_add(int16_t *input, uint8_t *dest, int stride, int eob);
  void vp9_idct_add_8x8(int16_t *input, uint8_t *dest, int stride, int eob);
  void vp9_idct_add_16x16(int16_t *input, uint8_t *dest, int stride, int eob);
  void vp9_idct_add_32x32(int16_t *input, uint8_t *dest, int stride, int eob);
diff --git a/vp9/common/vp9_rtcd_defs.sh b/vp9/common/vp9_rtcd_defs.sh

index 61be7c6b78ad4316710c384c152f8ec426365ddd..58b7ee7b88d3312ed08cff0adfd89bcf71cf64f4 100644 (file)
--- a/vp9/common/vp9_rtcd_defs.sh
+++ b/vp9/common/vp9_rtcd_defs.sh
@@ -267,11 +267,11 @@ specialize vp9_convolve8_avg_vert ssse3 neon dspr2
  #
  # dct
  #
-prototype void vp9_short_idct4x4_1_add "int16_t *input, uint8_t *dest, int dest_stride"
-specialize vp9_short_idct4x4_1_add sse2 neon
+prototype void vp9_idct4x4_1_add "int16_t *input, uint8_t *dest, int dest_stride"
+specialize vp9_idct4x4_1_add sse2 neon
  
-prototype void vp9_short_idct4x4_add "int16_t *input, uint8_t *dest, int dest_stride"
-specialize vp9_short_idct4x4_add sse2 neon
+prototype void vp9_idct4x4_16_add "int16_t *input, uint8_t *dest, int dest_stride"
+specialize vp9_idct4x4_16_add sse2 neon
  
  prototype void vp9_short_idct8x8_1_add "int16_t *input, uint8_t *dest, int dest_stride"
  specialize vp9_short_idct8x8_1_add sse2 neon
@@ -310,11 +310,11 @@ prototype void vp9_idct4_1d "int16_t *input, int16_t *output"
  specialize vp9_idct4_1d sse2
  # dct and add
  
-prototype void vp9_short_iwalsh4x4_1_add "int16_t *input, uint8_t *dest, int dest_stride"
-specialize vp9_short_iwalsh4x4_1_add
+prototype void vp9_iwht4x4_1_add "int16_t *input, uint8_t *dest, int dest_stride"
+specialize vp9_iwht4x4_1_add
  
-prototype void vp9_short_iwalsh4x4_add "int16_t *input, uint8_t *dest, int dest_stride"
-specialize vp9_short_iwalsh4x4_add
+prototype void vp9_iwht4x4_16_add "int16_t *input, uint8_t *dest, int dest_stride"
+specialize vp9_iwht4x4_16_add
  
  #
  # Encoder functions below this point.
diff --git a/vp9/common/x86/vp9_idct_intrin_sse2.c b/vp9/common/x86/vp9_idct_intrin_sse2.c

index d00993c4793b5ce3989b1be78878145f4648bb92..f03af33782e434a1ba991ccc5f2a52e0be1ce5a2 100644 (file)
--- a/vp9/common/x86/vp9_idct_intrin_sse2.c
+++ b/vp9/common/x86/vp9_idct_intrin_sse2.c
@@ -15,7 +15,7 @@
  #include "vp9/common/vp9_common.h"
  #include "vp9/common/vp9_idct.h"
  
-void vp9_short_idct4x4_add_sse2(int16_t *input, uint8_t *dest, int stride) {
+void vp9_idct4x4_16_add_sse2(int16_t *input, uint8_t *dest, int stride) {
    const __m128i zero = _mm_setzero_si128();
    const __m128i eight = _mm_set1_epi16(8);
    const __m128i cst = _mm_setr_epi16((int16_t)cospi_16_64, (int16_t)cospi_16_64,
@@ -148,7 +148,7 @@ void vp9_short_idct4x4_add_sse2(int16_t *input, uint8_t *dest, int stride) {
    RECON_AND_STORE4X4(dest, input3);
  }
  
-void vp9_short_idct4x4_1_add_sse2(int16_t *input, uint8_t *dest, int stride) {
+void vp9_idct4x4_1_add_sse2(int16_t *input, uint8_t *dest, int stride) {
    __m128i dc_value;
    const __m128i zero = _mm_setzero_si128();
    int a;
diff --git a/vp9/decoder/vp9_decodframe.c b/vp9/decoder/vp9_decodframe.c

index da6711e3c877c7e8055f6a0630fb1cf9c147fbeb..c4073e1ce46a07e17543da1c7c0bc4d0427d0a37 100644 (file)
--- a/vp9/decoder/vp9_decodframe.c
+++ b/vp9/decoder/vp9_decodframe.c
@@ -490,8 +490,7 @@ static void setup_quantization(VP9D_COMP *pbi, struct vp9_read_bit_buffer *rb) {
                   cm->uv_dc_delta_q == 0 &&
                   cm->uv_ac_delta_q == 0;
  
-  xd->itxm_add = xd->lossless ? vp9_idct_add_lossless
-                              : vp9_idct_add;
+  xd->itxm_add = xd->lossless ? vp9_iwht4x4_add : vp9_idct4x4_add;
  }
  
  static INTERPOLATIONFILTERTYPE read_interp_filter_type(
diff --git a/vp9/encoder/vp9_encodeframe.c b/vp9/encoder/vp9_encodeframe.c

index 4fde38d3f1ba5eaf8ce3510bcac9d2fc1bcf353d..c9da9cc2750007cfb29a0a494df150ebeb251b14 100644 (file)
--- a/vp9/encoder/vp9_encodeframe.c
+++ b/vp9/encoder/vp9_encodeframe.c
@@ -1868,8 +1868,8 @@ static void switch_lossless_mode(VP9_COMP *cpi, int lossless) {
      // printf("Switching to lossless\n");
      cpi->mb.fwd_txm8x4 = vp9_short_walsh8x4;
      cpi->mb.fwd_txm4x4 = vp9_short_walsh4x4;
-    cpi->mb.e_mbd.inv_txm4x4_1_add = vp9_short_iwalsh4x4_1_add;
-    cpi->mb.e_mbd.inv_txm4x4_add = vp9_short_iwalsh4x4_add;
+    cpi->mb.e_mbd.inv_txm4x4_1_add = vp9_iwht4x4_1_add;
+    cpi->mb.e_mbd.inv_txm4x4_add = vp9_iwht4x4_16_add;
      cpi->mb.optimize = 0;
      cpi->common.lf.filter_level = 0;
      cpi->zbin_mode_boost_enabled = 0;
@@ -1878,8 +1878,8 @@ static void switch_lossless_mode(VP9_COMP *cpi, int lossless) {
      // printf("Not lossless\n");
      cpi->mb.fwd_txm8x4 = vp9_short_fdct8x4;
      cpi->mb.fwd_txm4x4 = vp9_short_fdct4x4;
-    cpi->mb.e_mbd.inv_txm4x4_1_add = vp9_short_idct4x4_1_add;
-    cpi->mb.e_mbd.inv_txm4x4_add = vp9_short_idct4x4_add;
+    cpi->mb.e_mbd.inv_txm4x4_1_add = vp9_idct4x4_1_add;
+    cpi->mb.e_mbd.inv_txm4x4_add = vp9_idct4x4_16_add;
    }
  }
  
diff --git a/vp9/encoder/vp9_onyx_if.c b/vp9/encoder/vp9_onyx_if.c

index 753afbc78d1fb47264e321934abe6aace8dcdb12..501100b3f082b35ca021a7115ee321ffb0445bef 100644 (file)
--- a/vp9/encoder/vp9_onyx_if.c
+++ b/vp9/encoder/vp9_onyx_if.c
@@ -1260,11 +1260,11 @@ void vp9_change_config(VP9_PTR ptr, VP9_CONFIG *oxcf) {
  
    cpi->oxcf.lossless = oxcf->lossless;
    if (cpi->oxcf.lossless) {
-    cpi->mb.e_mbd.inv_txm4x4_1_add    = vp9_short_iwalsh4x4_1_add;
-    cpi->mb.e_mbd.inv_txm4x4_add      = vp9_short_iwalsh4x4_add;
+    cpi->mb.e_mbd.inv_txm4x4_1_add    = vp9_iwht4x4_1_add;
+    cpi->mb.e_mbd.inv_txm4x4_add      = vp9_iwht4x4_16_add;
    } else {
-    cpi->mb.e_mbd.inv_txm4x4_1_add    = vp9_short_idct4x4_1_add;
-    cpi->mb.e_mbd.inv_txm4x4_add      = vp9_short_idct4x4_add;
+    cpi->mb.e_mbd.inv_txm4x4_1_add    = vp9_idct4x4_1_add;
+    cpi->mb.e_mbd.inv_txm4x4_add      = vp9_idct4x4_16_add;
    }
  
    cpi->baseline_gf_interval = DEFAULT_GF_INTERVAL;
author	Dmitry Kovalev <dkovalev@google.com>
	Fri, 4 Oct 2013 21:17:06 +0000 (14:17 -0700)
committer	Dmitry Kovalev <dkovalev@google.com>
	Fri, 4 Oct 2013 21:17:06 +0000 (14:17 -0700)
test/fdct4x4_test.cc		patch \| blob \| history
vp9/common/arm/neon/vp9_short_idct4x4_1_add_neon.asm		patch \| blob \| history
vp9/common/arm/neon/vp9_short_idct4x4_add_neon.asm		patch \| blob \| history
vp9/common/vp9_idct.c		patch \| blob \| history
vp9/common/vp9_idct.h		patch \| blob \| history
vp9/common/vp9_rtcd_defs.sh		patch \| blob \| history
vp9/common/x86/vp9_idct_intrin_sse2.c		patch \| blob \| history
vp9/decoder/vp9_decodframe.c		patch \| blob \| history
vp9/encoder/vp9_encodeframe.c		patch \| blob \| history
vp9/encoder/vp9_onyx_if.c		patch \| blob \| history