shithub: libvpx

Download patch

ref: a040eb37e4cb924b1a00cdb493a709441885c344
parent: d8ebdcd89d5d19d283a73a2a81d3909b172e7e2d
parent: fa1a9290e6e7cd0bf0afff5213e73fa5f662a9e2
author: Yunqing Wang <yunqingwang@google.com>
date: Mon Feb 6 08:58:11 EST 2012

Merge "Allow to skip highest-resolution encoding in multi-resolution encoder"

--- a/vp8/encoder/pickinter.c
+++ b/vp8/encoder/pickinter.c
@@ -413,12 +413,11 @@
          * such as 2, 4, 8. Will revisit it if needed.
          * Should also try using a look-up table to see if it helps
          * performance. */
-        int round = cpi->oxcf.mr_down_sampling_factor.num/2;
         int parent_mb_row, parent_mb_col;
 
-        parent_mb_row = (mb_row*cpi->oxcf.mr_down_sampling_factor.den+round)
+        parent_mb_row = mb_row*cpi->oxcf.mr_down_sampling_factor.den
                     /cpi->oxcf.mr_down_sampling_factor.num;
-        parent_mb_col = (mb_col*cpi->oxcf.mr_down_sampling_factor.den+round)
+        parent_mb_col = mb_col*cpi->oxcf.mr_down_sampling_factor.den
                     /cpi->oxcf.mr_down_sampling_factor.num;
         parent_mb_index = parent_mb_row*cpi->mr_low_res_mb_cols + parent_mb_col;
     }
--- a/vp8_multi_resolution_encoder.c
+++ b/vp8_multi_resolution_encoder.c
@@ -212,7 +212,10 @@
     double               psnr_totals[NUM_ENCODERS][4] = {{0,0}};
     int                  psnr_count[NUM_ENCODERS] = {0};
 
-    /* Set the required target bitrates for each resolution level. */
+    /* Set the required target bitrates for each resolution level.
+     * If target bitrate for highest-resolution level is set to 0,
+     * (i.e. target_bitrate[0]=0), we skip encoding at that level.
+     */
     unsigned int         target_bitrate[NUM_ENCODERS]={1400, 500, 100};
     /* Enter the frame rate of the input video */
     int                  framerate = 30;
@@ -221,6 +224,9 @@
        dsf[1] controls down sampling from level 1 to level 2;
        dsf[2] is not used. */
     vpx_rational_t dsf[NUM_ENCODERS] = {{2, 1}, {2, 1}, {1, 1}};
+    /* Encode starting from which resolution level. Normally it is 0 that
+     * means the original(highest) resolution. */
+    int                  s_lvl = 0;
 
     if(argc!= (5+NUM_ENCODERS))
         die("Usage: %s <width> <height> <infile> <outfile(s)> <output psnr?>\n",
@@ -234,6 +240,21 @@
     if(width < 16 || width%2 || height <16 || height%2)
         die("Invalid resolution: %ldx%ld", width, height);
 
+    /* Check to see if we need to encode all resolution levels */
+    for (i=0; i<NUM_ENCODERS; i++)
+    {
+        if (target_bitrate[i])
+            break;
+        else
+            s_lvl += 1;
+    }
+
+    if (s_lvl >= NUM_ENCODERS)
+    {
+        printf("No encoding: total number of encoders is 0!");
+        return 0;
+    }
+
     /* Open input video file for encoding */
     if(!(infile = fopen(argv[3], "rb")))
         die("Failed to open %s for reading", argv[3]);
@@ -321,17 +342,15 @@
     else
         read_frame_p = read_frame_by_row;
 
-    for (i=0; i< NUM_ENCODERS; i++)
-        write_ivf_file_header(outfile[i], &cfg[i], 0);
-
     /* Initialize multi-encoder */
-    if(vpx_codec_enc_init_multi(&codec[0], interface, &cfg[0], NUM_ENCODERS,
-                                (show_psnr ? VPX_CODEC_USE_PSNR : 0), &dsf[0]))
-        die_codec(&codec[0], "Failed to initialize encoder");
+    if(vpx_codec_enc_init_multi(&codec[s_lvl], interface, &cfg[s_lvl], s_lvl,
+                             NUM_ENCODERS,
+                             (show_psnr ? VPX_CODEC_USE_PSNR : 0), &dsf[s_lvl]))
+        die_codec(&codec[s_lvl], "Failed to initialize encoder");
 
     /* The extra encoding configuration parameters can be set as follows. */
     /* Set encoding speed */
-    for ( i=0; i<NUM_ENCODERS; i++)
+    for ( i=s_lvl; i<NUM_ENCODERS; i++)
     {
         int speed = -6;
         if(vpx_codec_control(&codec[i], VP8E_SET_CPUUSED, speed))
@@ -341,14 +360,16 @@
      * better performance. */
     {
         unsigned int static_thresh = 1000;
-        if(vpx_codec_control(&codec[0], VP8E_SET_STATIC_THRESHOLD, static_thresh))
-            die_codec(&codec[0], "Failed to set static threshold");
+        if(vpx_codec_control(&codec[s_lvl], VP8E_SET_STATIC_THRESHOLD,
+                             static_thresh))
+            die_codec(&codec[s_lvl], "Failed to set static threshold");
     }
     /* Set static thresh = 0 for other encoders for better quality */
-    for ( i=1; i<NUM_ENCODERS; i++)
+    for ( i=s_lvl+1; i<NUM_ENCODERS; i++)
     {
         unsigned int static_thresh = 0;
-        if(vpx_codec_control(&codec[i], VP8E_SET_STATIC_THRESHOLD, static_thresh))
+        if(vpx_codec_control(&codec[i], VP8E_SET_STATIC_THRESHOLD,
+                             static_thresh))
             die_codec(&codec[i], "Failed to set static threshold");
     }
 
@@ -355,6 +376,9 @@
     frame_avail = 1;
     got_data = 0;
 
+    for (i=s_lvl ; i< NUM_ENCODERS; i++)
+        write_ivf_file_header(outfile[i], &cfg[i], 0);
+
     while(frame_avail || got_data)
     {
         vpx_codec_iter_t iter[NUM_ENCODERS]={NULL};
@@ -381,11 +405,11 @@
         }
 
         /* Encode each frame at multi-levels */
-        if(vpx_codec_encode(&codec[0], frame_avail? &raw[0] : NULL,
+        if(vpx_codec_encode(&codec[s_lvl], frame_avail? &raw[s_lvl] : NULL,
             frame_cnt, 1, flags, arg_deadline))
-            die_codec(&codec[0], "Failed to encode frame");
+            die_codec(&codec[s_lvl], "Failed to encode frame");
 
-        for (i=NUM_ENCODERS-1; i>=0 ; i--)
+        for (i=NUM_ENCODERS-1; i>=s_lvl ; i--)
         {
             got_data = 0;
 
@@ -428,7 +452,7 @@
 
     fclose(infile);
 
-    for (i=0; i< NUM_ENCODERS; i++)
+    for (i=s_lvl; i< NUM_ENCODERS; i++)
     {
         printf("Processed %ld frames.\n",(long int)frame_cnt-1);
 
@@ -454,8 +478,11 @@
         /* Try to rewrite the file header with the actual frame count */
         if(!fseek(outfile[i], 0, SEEK_SET))
             write_ivf_file_header(outfile[i], &cfg[i], frame_cnt-1);
-        fclose(outfile[i]);
+    }
 
+    for (i=0; i< NUM_ENCODERS; i++)
+    {
+        fclose(outfile[i]);
         vpx_img_free(&raw[i]);
     }
 
--- a/vpx/src/vpx_encoder.c
+++ b/vpx/src/vpx_encoder.c
@@ -69,6 +69,7 @@
 vpx_codec_err_t vpx_codec_enc_init_multi_ver(vpx_codec_ctx_t      *ctx,
                                              vpx_codec_iface_t    *iface,
                                              vpx_codec_enc_cfg_t  *cfg,
+                                             int                   s_lvl,
                                              int                   num_enc,
                                              vpx_codec_flags_t     flags,
                                              vpx_rational_t       *dsf,
@@ -99,7 +100,7 @@
 
         if(!(res = iface->enc.mr_get_mem_loc(cfg, &mem_loc)))
         {
-            for (i = 0; i < num_enc; i++)
+            for (i = s_lvl; i < num_enc; i++)
             {
                 vpx_codec_priv_enc_mr_cfg_t mr_cfg;
 
@@ -112,7 +113,7 @@
                 }
 
                 mr_cfg.mr_low_res_mode_info = mem_loc;
-                mr_cfg.mr_total_resolutions = num_enc;
+                mr_cfg.mr_total_resolutions = num_enc - s_lvl;
                 mr_cfg.mr_encoder_id = num_enc-1-i;
                 mr_cfg.mr_down_sampling_factor.num = dsf->num;
                 mr_cfg.mr_down_sampling_factor.den = dsf->den;
--- a/vpx/vpx_encoder.h
+++ b/vpx/vpx_encoder.h
@@ -688,6 +688,7 @@
      * \param[in]    ctx     Pointer to this instance's context.
      * \param[in]    iface   Pointer to the algorithm interface to use.
      * \param[in]    cfg     Configuration to use, if known. May be NULL.
+     * \param[in]    s_lvl   Starting encoder id. Normally it is 0.
      * \param[in]    num_enc Total number of encoders.
      * \param[in]    flags   Bitfield of VPX_CODEC_USE_* flags
      * \param[in]    dsf     Pointer to down-sampling factors.
@@ -701,6 +702,7 @@
     vpx_codec_err_t vpx_codec_enc_init_multi_ver(vpx_codec_ctx_t      *ctx,
                                                  vpx_codec_iface_t    *iface,
                                                  vpx_codec_enc_cfg_t  *cfg,
+                                                 int                   s_lvl,
                                                  int                   num_enc,
                                                  vpx_codec_flags_t     flags,
                                                  vpx_rational_t       *dsf,
@@ -711,8 +713,8 @@
      *
      * Ensures the ABI version parameter is properly set.
      */
-#define vpx_codec_enc_init_multi(ctx, iface, cfg, num_enc, flags, dsf) \
-    vpx_codec_enc_init_multi_ver(ctx, iface, cfg, num_enc, flags, dsf, \
+#define vpx_codec_enc_init_multi(ctx, iface, cfg, s_lvl, num_enc, flags, dsf) \
+    vpx_codec_enc_init_multi_ver(ctx, iface, cfg, s_lvl, num_enc, flags, dsf, \
                                  VPX_ENCODER_ABI_VERSION)