Fix frame sizes in pkt to support spatial layers.

author Jerome Jiang <jianj@google.com>

Mon, 22 Jan 2018 23:34:59 +0000 (15:34 -0800)

committer Jerome Jiang <jianj@google.com>

Tue, 23 Jan 2018 05:05:39 +0000 (21:05 -0800)
author Jerome Jiang <jianj@google.com>
Mon, 22 Jan 2018 23:34:59 +0000 (15:34 -0800)
committer Jerome Jiang <jianj@google.com>
Tue, 23 Jan 2018 05:05:39 +0000 (21:05 -0800)
diff --git a/test/datarate_test.cc b/test/datarate_test.cc

index 40eb972c083659a729ebca20224d40e310fc376c..a3d1530d8035dd8f24ac8f210fdd9bb2db03716e 100644 (file)
--- a/test/datarate_test.cc
+++ b/test/datarate_test.cc
@@ -1351,6 +1351,14 @@ class DatarateOnePassCbrSvc
                << "Buffer Underrun at frame " << pkt->data.frame.pts;
          }
        }
+
+      ASSERT_EQ(pkt->data.frame.width[sl],
+                top_sl_width_ * svc_params_.scaling_factor_num[sl] /
+                    svc_params_.scaling_factor_den[sl]);
+
+      ASSERT_EQ(pkt->data.frame.height[sl],
+                top_sl_height_ * svc_params_.scaling_factor_num[sl] /
+                    svc_params_.scaling_factor_den[sl]);
      }
    }
  
@@ -1393,6 +1401,8 @@ class DatarateOnePassCbrSvc
    int number_temporal_layers_;
    int layer_target_avg_bandwidth_[VPX_MAX_LAYERS];
    bool dynamic_drop_layer_;
+  unsigned int top_sl_width_;
+  unsigned int top_sl_height_;
  };
  static void assign_layer_bitrates(vpx_codec_enc_cfg_t *const enc_cfg,
                                    const vpx_svc_extra_cfg_t *svc_params,
@@ -1486,6 +1496,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc2SL1TLScreenContent1) {
    number_spatial_layers_ = cfg_.ss_number_layers;
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::Y4mVideoSource video("niklas_1280_720_30.y4m", 0, 60);
+  top_sl_width_ = 1280;
+  top_sl_height_ = 720;
    cfg_.rc_target_bitrate = 500;
    ResetModel();
    tune_content_ = 1;
@@ -1527,6 +1539,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc2SL3TL) {
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::I420VideoSource video("niklas_640_480_30.yuv", 640, 480, 30, 1,
                                         0, 400);
+  top_sl_width_ = 640;
+  top_sl_height_ = 480;
    // TODO(marpan): Check that effective_datarate for each layer hits the
    // layer target_bitrate.
    for (int i = 200; i <= 800; i += 200) {
@@ -1577,6 +1591,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc2SL3TLDenoiserOn) {
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::I420VideoSource video("niklas_640_480_30.yuv", 640, 480, 30, 1,
                                         0, 400);
+  top_sl_width_ = 640;
+  top_sl_height_ = 480;
    // TODO(marpan): Check that effective_datarate for each layer hits the
    // layer target_bitrate.
    // For SVC, noise_sen = 1 means denoising only the top spatial layer
@@ -1633,6 +1649,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc2SL3TLSmallKf) {
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::I420VideoSource video("niklas_640_480_30.yuv", 640, 480, 30, 1,
                                         0, 400);
+  top_sl_width_ = 640;
+  top_sl_height_ = 480;
    // For this 3 temporal layer case, pattern repeats every 4 frames, so choose
    // 4 key neighboring key frame periods (so key frame will land on 0-2-1-2).
    for (int j = 64; j <= 67; j++) {
@@ -1675,6 +1693,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc2SL3TL4Threads) {
    number_spatial_layers_ = cfg_.ss_number_layers;
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::Y4mVideoSource video("niklas_1280_720_30.y4m", 0, 60);
+  top_sl_width_ = 1280;
+  top_sl_height_ = 720;
    cfg_.rc_target_bitrate = 800;
    ResetModel();
    assign_layer_bitrates(&cfg_, &svc_params_, cfg_.ss_number_layers,
@@ -1722,6 +1742,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc3SL3TL) {
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::I420VideoSource video("niklas_640_480_30.yuv", 640, 480, 30, 1,
                                         0, 400);
+  top_sl_width_ = 640;
+  top_sl_height_ = 480;
    cfg_.rc_target_bitrate = 800;
    ResetModel();
    assign_layer_bitrates(&cfg_, &svc_params_, cfg_.ss_number_layers,
@@ -1769,6 +1791,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc3SL_to_2SL_dynamic) {
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::I420VideoSource video("niklas_640_480_30.yuv", 640, 480, 30, 1,
                                         0, 400);
+  top_sl_width_ = 640;
+  top_sl_height_ = 480;
    cfg_.rc_target_bitrate = 800;
    ResetModel();
    dynamic_drop_layer_ = true;
@@ -1812,6 +1836,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc3SL3TLSmallKf) {
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::I420VideoSource video("niklas_640_480_30.yuv", 640, 480, 30, 1,
                                         0, 400);
+  top_sl_width_ = 640;
+  top_sl_height_ = 480;
    // For this 3 temporal layer case, pattern repeats every 4 frames, so choose
    // 4 key neighboring key frame periods (so key frame will land on 0-2-1-2).
    for (int j = 32; j <= 35; j++) {
@@ -1856,6 +1882,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc3SL3TL4threads) {
    number_spatial_layers_ = cfg_.ss_number_layers;
    number_temporal_layers_ = cfg_.ts_number_layers;
    ::libvpx_test::Y4mVideoSource video("niklas_1280_720_30.y4m", 0, 60);
+  top_sl_width_ = 1280;
+  top_sl_height_ = 720;
    cfg_.rc_target_bitrate = 800;
    ResetModel();
    assign_layer_bitrates(&cfg_, &svc_params_, cfg_.ss_number_layers,
@@ -1911,6 +1939,8 @@ TEST_P(DatarateOnePassCbrSvc, OnePassCbrSvc2SL1TL5x5MultipleRuns) {
    bits_in_buffer_model_[1] =
        cfg_.layer_target_bitrate[1] * cfg_.rc_buf_initial_sz;
    ::libvpx_test::Y4mVideoSource video("niklas_1280_720_30.y4m", 0, 60);
+  top_sl_width_ = 1280;
+  top_sl_height_ = 720;
    ASSERT_NO_FATAL_FAILURE(RunLoop(&video));
    CheckLayerRateTargeting(&cfg_, number_spatial_layers_,
                            number_temporal_layers_, file_datarate_, 0.78, 1.15);
diff --git a/test/resize_test.cc b/test/resize_test.cc

index 39952074b1cf44a360d510032b76ef08046b7072..5f80af6fb17e38d2c90a2d42edb17ad4c029118c 100644 (file)
--- a/test/resize_test.cc
+++ b/test/resize_test.cc
@@ -278,10 +278,10 @@ class ResizeTest
    }
  
    virtual void FramePktHook(const vpx_codec_cx_pkt_t *pkt) {
-    ASSERT_NE(static_cast<int>(pkt->data.frame.width), 0);
-    ASSERT_NE(static_cast<int>(pkt->data.frame.height), 0);
-    encode_frame_width_.push_back(pkt->data.frame.width);
-    encode_frame_height_.push_back(pkt->data.frame.height);
+    ASSERT_NE(static_cast<int>(pkt->data.frame.width[0]), 0);
+    ASSERT_NE(static_cast<int>(pkt->data.frame.height[0]), 0);
+    encode_frame_width_.push_back(pkt->data.frame.width[0]);
+    encode_frame_height_.push_back(pkt->data.frame.height[0]);
    }
  
    unsigned int GetFrameWidth(size_t idx) const {
@@ -485,10 +485,10 @@ class ResizeRealtimeTest
    }
  
    virtual void FramePktHook(const vpx_codec_cx_pkt_t *pkt) {
-    ASSERT_NE(static_cast<int>(pkt->data.frame.width), 0);
-    ASSERT_NE(static_cast<int>(pkt->data.frame.height), 0);
-    encode_frame_width_.push_back(pkt->data.frame.width);
-    encode_frame_height_.push_back(pkt->data.frame.height);
+    ASSERT_NE(static_cast<int>(pkt->data.frame.width[0]), 0);
+    ASSERT_NE(static_cast<int>(pkt->data.frame.height[0]), 0);
+    encode_frame_width_.push_back(pkt->data.frame.width[0]);
+    encode_frame_height_.push_back(pkt->data.frame.height[0]);
    }
  
    unsigned int GetMismatchFrames() { return mismatch_nframes_; }
diff --git a/vp8/vp8_cx_iface.c b/vp8/vp8_cx_iface.c

index 5870cc38aa8707718afa779601509282deb93fe6..b30befcc474cafe3800ed88212269376c34d0da2 100644 (file)
--- a/vp8/vp8_cx_iface.c
+++ b/vp8/vp8_cx_iface.c
@@ -911,8 +911,8 @@ static vpx_codec_err_t vp8e_encode(vpx_codec_alg_priv_t *ctx,
              (unsigned long)((delta * ctx->cfg.g_timebase.den + round) /
                              ctx->cfg.g_timebase.num / 10000000);
          pkt.data.frame.flags = lib_flags << 16;
-        pkt.data.frame.width = cpi->common.Width;
-        pkt.data.frame.height = cpi->common.Height;
+        pkt.data.frame.width[0] = cpi->common.Width;
+        pkt.data.frame.height[0] = cpi->common.Height;
  
          if (lib_flags & FRAMEFLAGS_KEY) {
            pkt.data.frame.flags |= VPX_FRAME_IS_KEY;
diff --git a/vp9/vp9_cx_iface.c b/vp9/vp9_cx_iface.c

index 5bfe9aa057973fbb7308b0e95c93d8648b37d1d2..3778c5a164f455540b9bb0fb429ae58b6b10b88e 100644 (file)
--- a/vp9/vp9_cx_iface.c
+++ b/vp9/vp9_cx_iface.c
@@ -1234,6 +1234,8 @@ static vpx_codec_err_t encoder_encode(vpx_codec_alg_priv_t *ctx,
            ctx->pending_frame_magnitude |= size;
            cx_data += size;
            cx_data_sz -= size;
+          pkt.data.frame.width[cpi->svc.spatial_layer_id] = cpi->common.width;
+          pkt.data.frame.height[cpi->svc.spatial_layer_id] = cpi->common.height;
  
            if (ctx->output_cx_pkt_cb.output_cx_pkt) {
              pkt.kind = VPX_CODEC_CX_FRAME_PKT;
@@ -1260,8 +1262,8 @@ static vpx_codec_err_t encoder_encode(vpx_codec_alg_priv_t *ctx,
          pkt.data.frame.duration = (unsigned long)ticks_to_timebase_units(
              timebase, dst_end_time_stamp - dst_time_stamp);
          pkt.data.frame.flags = get_frame_pkt_flags(cpi, lib_flags);
-        pkt.data.frame.width = cpi->common.width;
-        pkt.data.frame.height = cpi->common.height;
+        pkt.data.frame.width[cpi->svc.spatial_layer_id] = cpi->common.width;
+        pkt.data.frame.height[cpi->svc.spatial_layer_id] = cpi->common.height;
  
          if (ctx->pending_cx_data) {
            if (size) ctx->pending_frame_sizes[ctx->pending_frame_count++] = size;
diff --git a/vpx/vpx_encoder.h b/vpx/vpx_encoder.h

index de964eb46fe157160f0376a4fe4f10922571c6dd..5e1bca72cdb729e9edd00ae88666dc9cda276f02 100644 (file)
--- a/vpx/vpx_encoder.h
+++ b/vpx/vpx_encoder.h
@@ -182,8 +182,10 @@ typedef struct vpx_codec_cx_pkt {
         * Only applicable when "output partition" mode is enabled. First
         * partition has id 0.*/
        int partition_id;
-      unsigned int width;               /**< frame width */
-      unsigned int height;              /**< frame height */
+      /*!\brief Width and height of frames in this packet. VP8 will only use the
+       * first one.*/
+      unsigned int width[VPX_SS_MAX_LAYERS];  /**< frame width */
+      unsigned int height[VPX_SS_MAX_LAYERS]; /**< frame height */
      } frame;                            /**< data for compressed frame packet */
      vpx_fixed_buf_t twopass_stats;      /**< data for two-pass packet */
      vpx_fixed_buf_t firstpass_mb_stats; /**< first pass mb packet */
author	Jerome Jiang <jianj@google.com>
	Mon, 22 Jan 2018 23:34:59 +0000 (15:34 -0800)
committer	Jerome Jiang <jianj@google.com>
	Tue, 23 Jan 2018 05:05:39 +0000 (21:05 -0800)
test/datarate_test.cc		patch | blob | history
test/resize_test.cc		patch | blob | history
vp8/vp8_cx_iface.c		patch | blob | history
vp9/vp9_cx_iface.c		patch | blob | history
vpx/vpx_encoder.h		patch | blob | history