twopass_encoder.c 8.14 KB
Newer Older
John Koleszar's avatar
John Koleszar committed
1
/*
2
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
John Koleszar's avatar
John Koleszar committed
3
 *
4
 *  Use of this source code is governed by a BSD-style license
5 6
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
7
 *  in the file PATENTS.  All contributing project authors may
8
 *  be found in the AUTHORS file in the root of the source tree.
John Koleszar's avatar
John Koleszar committed
9 10
 */

11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30
// Two Pass Encoder
// ================
//
// This is an example of a two pass encoder loop. It takes an input file in
// I420 format, passes it through the encoder twice, and writes the compressed
// frames to disk in IVF format. It builds upon the simple_encoder example.
//
// Twopass Variables
// -----------------
// Twopass mode needs to track the current pass number and the buffer of
// statistics packets.
//
// Updating The Configuration
// ---------------------------------
// In two pass mode, the configuration has to be updated on each pass. The
// statistics buffer is passed on the last pass.
//
// Encoding A Frame
// ----------------
// Encoding a frame in two pass mode is identical to the simple encoder
31 32
// example. To increase the quality while sacrificing encoding speed,
// VPX_DL_BEST_QUALITY can be used in place of VPX_DL_GOOD_QUALITY.
33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
//
// Processing Statistics Packets
// -----------------------------
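// In the first pass, each packet of type `VPX_CODEC_STATS_PKT` is appended to
// the statistics buffer. In the last pass, each packet of type
// `VPX_CODEC_CX_FRAME_PKT` contains the encoded data for this frame. We write
// an IVF frame header, followed by the raw data.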
//
//
// Pass Progress Reporting
// -----------------------------
// It's sometimes helpful to see when each pass completes.
//
//
// Clean-up
// -----------------------------
// Destruction of the encoder instance must be done on each pass. The
// raw image should be destroyed at the end as usual.
John Koleszar's avatar
John Koleszar committed
49 50 51 52

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
53 54

#include "vpx/vpx_encoder.h"
John Koleszar's avatar
John Koleszar committed
55

56 57
#include "../tools_common.h"
#include "../video_writer.h"
John Koleszar's avatar
John Koleszar committed
58

59
static const char *exec_name;
60

61
void usage_exit(void) {
62 63
  fprintf(stderr, "Usage: %s <codec> <width> <height> <infile> <outfile>\n",
          exec_name);
64
  exit(EXIT_FAILURE);
65
}
John Koleszar's avatar
John Koleszar committed
66

67 68 69 70 71 72 73 74
// Submits one frame to the encoder and appends every statistics packet it
// produces to the growing buffer in *stats.
//
//   ctx       Encoder context to drive.
//   img       Frame to analyse; callers in this file pass NULL to flush.
//   pts       Presentation timestamp handed to vpx_codec_encode().
//   duration  Frame duration handed to vpx_codec_encode().
//   flags     Per-frame encoder flags.
//   deadline  Encoding deadline (e.g. VPX_DL_GOOD_QUALITY).
//   stats     In/out buffer; stats->buf is grown with realloc() and stats->sz
//             is advanced by the size of each appended packet. The caller
//             owns the buffer and must free() it.
//
// Returns 1 if the encoder emitted at least one packet of any kind, otherwise
// 0. Terminates via die_codec()/die() on an encode or allocation failure.
static int get_frame_stats(vpx_codec_ctx_t *ctx,
                           const vpx_image_t *img,
                           vpx_codec_pts_t pts,
                           unsigned int duration,
                           vpx_enc_frame_flags_t flags,
                           unsigned int deadline,
                           vpx_fixed_buf_t *stats) {
  int got_pkts = 0;
  vpx_codec_iter_t iter = NULL;
  const vpx_codec_cx_pkt_t *pkt = NULL;
  const vpx_codec_err_t res = vpx_codec_encode(ctx, img, pts, duration, flags,
                                               deadline);
  if (res != VPX_CODEC_OK)
    die_codec(ctx, "Failed to get frame stats.");

  while ((pkt = vpx_codec_get_cx_data(ctx, &iter)) != NULL) {
    got_pkts = 1;

    if (pkt->kind == VPX_CODEC_STATS_PKT) {
      const uint8_t *const pkt_buf = pkt->data.twopass_stats.buf;
      const size_t pkt_size = pkt->data.twopass_stats.sz;
      void *grown = NULL;

      // Nothing to append; this also avoids realloc(ptr, 0), whose result
      // may legitimately be NULL.
      if (pkt_size == 0)
        continue;

      // Grow through a temporary so the existing buffer is not lost (and no
      // NULL pointer is handed to memcpy) when the allocation fails.
      grown = realloc(stats->buf, stats->sz + pkt_size);
      if (!grown)
        die("Failed to allocate frame stats buffer.");

      stats->buf = grown;
      memcpy((uint8_t *)stats->buf + stats->sz, pkt_buf, pkt_size);
      stats->sz += pkt_size;
    }
  }

  return got_pkts;
}

97 98 99 100 101 102 103 104
// Submits one frame to the encoder and writes every compressed-frame packet
// it produces to the video writer. A progress character is printed to stdout
// for each frame written: "K" for a keyframe, "." otherwise.
//
//   ctx       Encoder context to drive.
//   img       Frame to encode; callers in this file pass NULL to flush.
//   pts       Presentation timestamp handed to vpx_codec_encode().
//   duration  Frame duration handed to vpx_codec_encode().
//   flags     Per-frame encoder flags.
//   deadline  Encoding deadline (e.g. VPX_DL_GOOD_QUALITY).
//   writer    Destination for the compressed frames.
//
// Returns 1 if the encoder emitted at least one packet of any kind, otherwise
// 0. Calls die_codec() if encoding or writing fails.
static int encode_frame(vpx_codec_ctx_t *ctx,
                        const vpx_image_t *img,
                        vpx_codec_pts_t pts,
                        unsigned int duration,
                        vpx_enc_frame_flags_t flags,
                        unsigned int deadline,
                        VpxVideoWriter *writer) {
  const vpx_codec_cx_pkt_t *packet = NULL;
  vpx_codec_iter_t cursor = NULL;
  int produced_output = 0;

  if (vpx_codec_encode(ctx, img, pts, duration, flags, deadline) !=
      VPX_CODEC_OK)
    die_codec(ctx, "Failed to encode frame.");

  for (packet = vpx_codec_get_cx_data(ctx, &cursor); packet != NULL;
       packet = vpx_codec_get_cx_data(ctx, &cursor)) {
    produced_output = 1;

    // Only compressed frame packets are written out; others are ignored.
    if (packet->kind != VPX_CODEC_CX_FRAME_PKT)
      continue;

    if (!vpx_video_writer_write_frame(writer, packet->data.frame.buf,
                                      packet->data.frame.sz,
                                      packet->data.frame.pts))
      die_codec(ctx, "Failed to write compressed frame.");

    if ((packet->data.frame.flags & VPX_FRAME_IS_KEY) != 0)
      printf("K");
    else
      printf(".");
    fflush(stdout);
  }

  return produced_output;
}

129 130 131
static vpx_fixed_buf_t pass0(vpx_image_t *raw,
                             FILE *infile,
                             const VpxInterface *encoder,
132
                             const vpx_codec_enc_cfg_t *cfg) {
133 134 135 136 137 138 139
  vpx_codec_ctx_t codec;
  int frame_count = 0;
  vpx_fixed_buf_t stats = {NULL, 0};

  if (vpx_codec_enc_init(&codec, encoder->codec_interface(), cfg, 0))
    die_codec(&codec, "Failed to initialize encoder");

140
  // Calculate frame statistics.
141 142
  while (vpx_img_read(raw, infile)) {
    ++frame_count;
143
    get_frame_stats(&codec, raw, frame_count, 1, 0, VPX_DL_GOOD_QUALITY,
144 145 146
                    &stats);
  }

147 148
  // Flush encoder.
  while (get_frame_stats(&codec, NULL, frame_count, 1, 0,
149
                         VPX_DL_GOOD_QUALITY, &stats)) {}
150 151 152 153 154 155 156 157 158 159 160 161

  printf("Pass 0 complete. Processed %d frames.\n", frame_count);
  if (vpx_codec_destroy(&codec))
    die_codec(&codec, "Failed to destroy codec.");

  return stats;
}

static void pass1(vpx_image_t *raw,
                  FILE *infile,
                  const char *outfile_name,
                  const VpxInterface *encoder,
162
                  const vpx_codec_enc_cfg_t *cfg) {
163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179
  VpxVideoInfo info = {
    encoder->fourcc,
    cfg->g_w,
    cfg->g_h,
    {cfg->g_timebase.num, cfg->g_timebase.den}
  };
  VpxVideoWriter *writer = NULL;
  vpx_codec_ctx_t codec;
  int frame_count = 0;

  writer = vpx_video_writer_open(outfile_name, kContainerIVF, &info);
  if (!writer)
    die("Failed to open %s for writing", outfile_name);

  if (vpx_codec_enc_init(&codec, encoder->codec_interface(), cfg, 0))
    die_codec(&codec, "Failed to initialize encoder");

180
  // Encode frames.
181 182
  while (vpx_img_read(raw, infile)) {
    ++frame_count;
183
    encode_frame(&codec, raw, frame_count, 1, 0, VPX_DL_GOOD_QUALITY, writer);
184 185
  }

186
  // Flush encoder.
187
  while (encode_frame(&codec, NULL, -1, 1, 0, VPX_DL_GOOD_QUALITY, writer)) {}
188

189 190 191 192 193 194 195 196 197 198
  printf("\n");

  if (vpx_codec_destroy(&codec))
    die_codec(&codec, "Failed to destroy codec.");

  vpx_video_writer_close(writer);

  printf("Pass 1 complete. Processed %d frames.\n", frame_count);
}

199 200
int main(int argc, char **argv) {
  FILE *infile = NULL;
201
  int w, h;
202 203 204 205
  vpx_codec_ctx_t codec;
  vpx_codec_enc_cfg_t cfg;
  vpx_image_t raw;
  vpx_codec_err_t res;
206 207
  vpx_fixed_buf_t stats;

208
  const VpxInterface *encoder = NULL;
209 210
  const int fps = 30;        // TODO(dkovalev) add command line argument
  const int bitrate = 200;   // kbit/s TODO(dkovalev) add command line argument
211 212 213 214 215 216 217 218
  const char *const codec_arg = argv[1];
  const char *const width_arg = argv[2];
  const char *const height_arg = argv[3];
  const char *const infile_arg = argv[4];
  const char *const outfile_arg = argv[5];
  exec_name = argv[0];

  if (argc != 6)
219 220
    die("Invalid number of arguments.");

221 222 223 224
  encoder = get_vpx_encoder_by_name(codec_arg);
  if (!encoder)
    die("Unsupported codec.");

225 226
  w = strtol(width_arg, NULL, 0);
  h = strtol(height_arg, NULL, 0);
227

228 229
  if (w  <= 0 || h <= 0 || (w % 2) != 0 || (h  % 2) != 0)
    die("Invalid frame size: %dx%d", w, h);
230

231 232
  if (!vpx_img_alloc(&raw, VPX_IMG_FMT_I420, w, h, 1))
    die("Failed to allocate image", w, h);
233

234
  printf("Using %s\n", vpx_codec_iface_name(encoder->codec_interface()));
235

236
  // Configuration
237
  res = vpx_codec_enc_config_default(encoder->codec_interface(), &cfg, 0);
238 239 240
  if (res)
    die_codec(&codec, "Failed to get default codec config.");

241 242 243 244
  cfg.g_w = w;
  cfg.g_h = h;
  cfg.g_timebase.num = 1;
  cfg.g_timebase.den = fps;
245 246
  cfg.rc_target_bitrate = bitrate;

247 248
  if (!(infile = fopen(infile_arg, "rb")))
    die("Failed to open %s for reading", infile_arg);
John Koleszar's avatar
John Koleszar committed
249

250 251 252
  // Pass 0
  cfg.g_pass = VPX_RC_FIRST_PASS;
  stats = pass0(&raw, infile, encoder, &cfg);
John Koleszar's avatar
John Koleszar committed
253

254 255 256 257 258
  // Pass 1
  rewind(infile);
  cfg.g_pass = VPX_RC_LAST_PASS;
  cfg.rc_twopass_stats_in = stats;
  pass1(&raw, infile, outfile_arg, encoder, &cfg);
259 260
  free(stats.buf);

261 262
  vpx_img_free(&raw);
  fclose(infile);
John Koleszar's avatar
John Koleszar committed
263

264
  return EXIT_SUCCESS;
John Koleszar's avatar
John Koleszar committed
265
}