WebM Codec SDK
vpxdec
1 /*
2  * Copyright (c) 2010 The WebM project authors. All Rights Reserved.
3  *
4  * Use of this source code is governed by a BSD-style license
5  * that can be found in the LICENSE file in the root of the source
6  * tree. An additional intellectual property rights grant can be found
7  * in the file PATENTS. All contributing project authors may
8  * be found in the AUTHORS file in the root of the source tree.
9  */
10 
11 #include <assert.h>
12 #include <limits.h>
13 #include <stdarg.h>
14 #include <stdio.h>
15 #include <stdlib.h>
16 #include <string.h>
17 
18 #include "./vpx_config.h"
19 
20 #if CONFIG_LIBYUV
21 #include "third_party/libyuv/include/libyuv/scale.h"
22 #endif
23 
24 #include "./args.h"
25 #include "./ivfdec.h"
26 
27 #include "vpx/vpx_decoder.h"
28 #include "vpx_ports/mem_ops.h"
29 #include "vpx_ports/vpx_timer.h"
30 
31 #if CONFIG_VP8_DECODER || CONFIG_VP9_DECODER
32 #include "vpx/vp8dx.h"
33 #endif
34 
35 #include "./md5_utils.h"
36 
37 #include "./tools_common.h"
38 #if CONFIG_WEBM_IO
39 #include "./webmdec.h"
40 #endif
41 #include "./y4menc.h"
42 
/* Program name taken from argv[0]; printed in the usage banner. */
static const char *exec_name;

/*
 * Input state handed to read_frame(): the generic input context plus the
 * WebM-specific context used when the file is a WebM container.
 */
struct VpxDecInputContext {
  /* Generic input: file handle, detected file type, fourcc, dimensions. */
  struct VpxInputContext *vpx_input_ctx;
  /* WebM demuxer state; left NULL by main_loop() without CONFIG_WEBM_IO. */
  struct WebmInputContext *webm_ctx;
};
49 
50 static const arg_def_t help =
51  ARG_DEF(NULL, "help", 0, "Show usage options and exit");
52 static const arg_def_t looparg =
53  ARG_DEF(NULL, "loops", 1, "Number of times to decode the file");
54 static const arg_def_t codecarg = ARG_DEF(NULL, "codec", 1, "Codec to use");
55 static const arg_def_t use_yv12 =
56  ARG_DEF(NULL, "yv12", 0, "Output raw YV12 frames");
57 static const arg_def_t use_i420 =
58  ARG_DEF(NULL, "i420", 0, "Output raw I420 frames");
59 static const arg_def_t flipuvarg =
60  ARG_DEF(NULL, "flipuv", 0, "Flip the chroma planes in the output");
61 static const arg_def_t rawvideo =
62  ARG_DEF(NULL, "rawvideo", 0, "Output raw YUV frames");
63 static const arg_def_t noblitarg =
64  ARG_DEF(NULL, "noblit", 0, "Don't process the decoded frames");
65 static const arg_def_t progressarg =
66  ARG_DEF(NULL, "progress", 0, "Show progress after each frame decodes");
67 static const arg_def_t limitarg =
68  ARG_DEF(NULL, "limit", 1, "Stop decoding after n frames");
69 static const arg_def_t skiparg =
70  ARG_DEF(NULL, "skip", 1, "Skip the first n input frames");
71 static const arg_def_t postprocarg =
72  ARG_DEF(NULL, "postproc", 0, "Postprocess decoded frames");
73 static const arg_def_t summaryarg =
74  ARG_DEF(NULL, "summary", 0, "Show timing summary");
75 static const arg_def_t outputfile =
76  ARG_DEF("o", "output", 1, "Output file name pattern (see below)");
77 static const arg_def_t threadsarg =
78  ARG_DEF("t", "threads", 1, "Max threads to use");
79 static const arg_def_t frameparallelarg =
80  ARG_DEF(NULL, "frame-parallel", 0, "Frame parallel decode (ignored)");
81 static const arg_def_t verbosearg =
82  ARG_DEF("v", "verbose", 0, "Show version string");
83 static const arg_def_t error_concealment =
84  ARG_DEF(NULL, "error-concealment", 0, "Enable decoder error-concealment");
85 static const arg_def_t scalearg =
86  ARG_DEF("S", "scale", 0, "Scale output frames uniformly");
87 static const arg_def_t continuearg =
88  ARG_DEF("k", "keep-going", 0, "(debug) Continue decoding after error");
89 static const arg_def_t fb_arg =
90  ARG_DEF(NULL, "frame-buffers", 1, "Number of frame buffers to use");
91 static const arg_def_t md5arg =
92  ARG_DEF(NULL, "md5", 0, "Compute the MD5 sum of the decoded frame");
93 #if CONFIG_VP9_HIGHBITDEPTH
94 static const arg_def_t outbitdeptharg =
95  ARG_DEF(NULL, "output-bit-depth", 1, "Output bit-depth for decoded frames");
96 #endif
97 static const arg_def_t svcdecodingarg = ARG_DEF(
98  NULL, "svc-decode-layer", 1, "Decode SVC stream up to given spatial layer");
99 static const arg_def_t framestatsarg =
100  ARG_DEF(NULL, "framestats", 1, "Output per-frame stats (.csv format)");
101 static const arg_def_t rowmtarg =
102  ARG_DEF(NULL, "row-mt", 1, "Enable multi-threading to run row-wise in VP9");
103 
104 static const arg_def_t *all_args[] = {
105  &help, &codecarg, &use_yv12, &use_i420,
106  &flipuvarg, &rawvideo, &noblitarg, &progressarg,
107  &limitarg, &skiparg, &postprocarg, &summaryarg,
108  &outputfile, &threadsarg, &frameparallelarg, &verbosearg,
109  &scalearg, &fb_arg, &md5arg, &error_concealment,
110  &continuearg,
111 #if CONFIG_VP9_HIGHBITDEPTH
112  &outbitdeptharg,
113 #endif
114  &svcdecodingarg, &framestatsarg, &rowmtarg, NULL
115 };
116 
#if CONFIG_VP8_DECODER
/*
 * VP8 post-processing options.  main_loop() turns each of these into a bit
 * in vp8_postproc_cfg_t.post_proc_flag (and, where a value is taken, a
 * level field) and force-enables post-processing.
 */
static const arg_def_t addnoise_level =
    ARG_DEF(NULL, "noise-level", 1, "Enable VP8 postproc add noise");
static const arg_def_t deblock =
    ARG_DEF(NULL, "deblock", 0, "Enable VP8 deblocking");
static const arg_def_t demacroblock_level = ARG_DEF(
    NULL, "demacroblock-level", 1, "Enable VP8 demacroblocking, w/ level");
static const arg_def_t mfqe =
    ARG_DEF(NULL, "mfqe", 0, "Enable multiframe quality enhancement");

/* NULL-terminated table printed under "VP8 Postprocessing Options". */
static const arg_def_t *vp8_pp_args[] = {
  &addnoise_level,
  &deblock,
  &demacroblock_level,
  &mfqe,
  NULL
};
#endif
130 
#if CONFIG_LIBYUV
/*
 * Scales |src| into |dst| with libyuv using filter |mode|.
 *
 * The source and destination sizes are the images' display dimensions
 * (d_w x d_h).  8-bit I420 goes through I420Scale(); when high bit depth is
 * compiled in, I42016 goes through I420Scale_16() with strides converted
 * from bytes to 16-bit samples.  Returns whatever the libyuv call returns.
 */
static INLINE int libyuv_scale(vpx_image_t *src, vpx_image_t *dst,
                               FilterModeEnum mode) {
  unsigned char *const src_y = src->planes[VPX_PLANE_Y];
  unsigned char *const src_u = src->planes[VPX_PLANE_U];
  unsigned char *const src_v = src->planes[VPX_PLANE_V];
  unsigned char *const dst_y = dst->planes[VPX_PLANE_Y];
  unsigned char *const dst_u = dst->planes[VPX_PLANE_U];
  unsigned char *const dst_v = dst->planes[VPX_PLANE_V];
  const int src_stride_y = src->stride[VPX_PLANE_Y];
  const int src_stride_u = src->stride[VPX_PLANE_U];
  const int src_stride_v = src->stride[VPX_PLANE_V];
  const int dst_stride_y = dst->stride[VPX_PLANE_Y];
  const int dst_stride_u = dst->stride[VPX_PLANE_U];
  const int dst_stride_v = dst->stride[VPX_PLANE_V];

#if CONFIG_VP9_HIGHBITDEPTH
  if (src->fmt == VPX_IMG_FMT_I42016) {
    assert(dst->fmt == VPX_IMG_FMT_I42016);
    /* Strides are stored in bytes; the 16-bit scaler takes sample counts. */
    return I420Scale_16((uint16_t *)src_y, src_stride_y / 2,
                        (uint16_t *)src_u, src_stride_u / 2,
                        (uint16_t *)src_v, src_stride_v / 2, src->d_w,
                        src->d_h, (uint16_t *)dst_y, dst_stride_y / 2,
                        (uint16_t *)dst_u, dst_stride_u / 2,
                        (uint16_t *)dst_v, dst_stride_v / 2, dst->d_w,
                        dst->d_h, mode);
  }
#endif
  assert(src->fmt == VPX_IMG_FMT_I420);
  assert(dst->fmt == VPX_IMG_FMT_I420);
  return I420Scale(src_y, src_stride_y, src_u, src_stride_u, src_v,
                   src_stride_v, src->d_w, src->d_h, dst_y, dst_stride_y,
                   dst_u, dst_stride_u, dst_v, dst_stride_v, dst->d_w,
                   dst->d_h, mode);
}
#endif
158 void show_help(FILE *fout, int shorthelp) {
159  int i;
160 
161  fprintf(fout, "Usage: %s <options> filename\n\n", exec_name);
162 
163  if (shorthelp) {
164  fprintf(fout, "Use --help to see the full list of options.\n");
165  return;
166  }
167 
168  fprintf(fout, "Options:\n");
169  arg_show_usage(fout, all_args);
170 #if CONFIG_VP8_DECODER
171  fprintf(fout, "\nVP8 Postprocessing Options:\n");
172  arg_show_usage(fout, vp8_pp_args);
173 #endif
174  fprintf(fout,
175  "\nOutput File Patterns:\n\n"
176  " The -o argument specifies the name of the file(s) to "
177  "write to. If the\n argument does not include any escape "
178  "characters, the output will be\n written to a single file. "
179  "Otherwise, the filename will be calculated by\n expanding "
180  "the following escape characters:\n");
181  fprintf(fout,
182  "\n\t%%w - Frame width"
183  "\n\t%%h - Frame height"
184  "\n\t%%<n> - Frame number, zero padded to <n> places (1..9)"
185  "\n\n Pattern arguments are only supported in conjunction "
186  "with the --yv12 and\n --i420 options. If the -o option is "
187  "not specified, the output will be\n directed to stdout.\n");
188  fprintf(fout, "\nIncluded decoders:\n\n");
189 
190  for (i = 0; i < get_vpx_decoder_count(); ++i) {
191  const VpxInterface *const decoder = get_vpx_decoder_by_index(i);
192  fprintf(fout, " %-6s - %s\n", decoder->name,
193  vpx_codec_iface_name(decoder->codec_interface()));
194  }
195 }
196 
/* Prints the short usage text to stderr and terminates with EXIT_FAILURE. */
void usage_exit(void) {
  const int short_help = 1;

  show_help(stderr, short_help);
  exit(EXIT_FAILURE);
}
201 
202 static int raw_read_frame(FILE *infile, uint8_t **buffer, size_t *bytes_read,
203  size_t *buffer_size) {
204  char raw_hdr[RAW_FRAME_HDR_SZ];
205  size_t frame_size = 0;
206 
207  if (fread(raw_hdr, RAW_FRAME_HDR_SZ, 1, infile) != 1) {
208  if (!feof(infile)) warn("Failed to read RAW frame size\n");
209  } else {
210  const size_t kCorruptFrameThreshold = 256 * 1024 * 1024;
211  const size_t kFrameTooSmallThreshold = 256 * 1024;
212  frame_size = mem_get_le32(raw_hdr);
213 
214  if (frame_size > kCorruptFrameThreshold) {
215  warn("Read invalid frame size (%u)\n", (unsigned int)frame_size);
216  frame_size = 0;
217  }
218 
219  if (frame_size < kFrameTooSmallThreshold) {
220  warn("Warning: Read invalid frame size (%u) - not a raw file?\n",
221  (unsigned int)frame_size);
222  }
223 
224  if (frame_size > *buffer_size) {
225  uint8_t *new_buf = realloc(*buffer, 2 * frame_size);
226  if (new_buf) {
227  *buffer = new_buf;
228  *buffer_size = 2 * frame_size;
229  } else {
230  warn("Failed to allocate compressed data buffer\n");
231  frame_size = 0;
232  }
233  }
234  }
235 
236  if (!feof(infile)) {
237  if (fread(*buffer, 1, frame_size, infile) != frame_size) {
238  warn("Failed to read full frame\n");
239  return 1;
240  }
241  *bytes_read = frame_size;
242  return 0;
243  }
244 
245  return 1;
246 }
247 
248 static int read_frame(struct VpxDecInputContext *input, uint8_t **buf,
249  size_t *bytes_in_buffer, size_t *buffer_size) {
250  switch (input->vpx_input_ctx->file_type) {
251 #if CONFIG_WEBM_IO
252  case FILE_TYPE_WEBM:
253  return webm_read_frame(input->webm_ctx, buf, bytes_in_buffer);
254 #endif
255  case FILE_TYPE_RAW:
256  return raw_read_frame(input->vpx_input_ctx->file, buf, bytes_in_buffer,
257  buffer_size);
258  case FILE_TYPE_IVF:
259  return ivf_read_frame(input->vpx_input_ctx->file, buf, bytes_in_buffer,
260  buffer_size);
261  default: return 1;
262  }
263 }
264 
265 static void update_image_md5(const vpx_image_t *img, const int planes[3],
266  MD5Context *md5) {
267  int i, y;
268 
269  for (i = 0; i < 3; ++i) {
270  const int plane = planes[i];
271  const unsigned char *buf = img->planes[plane];
272  const int stride = img->stride[plane];
273  const int w = vpx_img_plane_width(img, plane) *
274  ((img->fmt & VPX_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
275  const int h = vpx_img_plane_height(img, plane);
276 
277  for (y = 0; y < h; ++y) {
278  MD5Update(md5, buf, w);
279  buf += stride;
280  }
281  }
282 }
283 
284 static void write_image_file(const vpx_image_t *img, const int planes[3],
285  FILE *file) {
286  int i, y;
287 #if CONFIG_VP9_HIGHBITDEPTH
288  const int bytes_per_sample = ((img->fmt & VPX_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
289 #else
290  const int bytes_per_sample = 1;
291 #endif
292 
293  for (i = 0; i < 3; ++i) {
294  const int plane = planes[i];
295  const unsigned char *buf = img->planes[plane];
296  const int stride = img->stride[plane];
297  const int w = vpx_img_plane_width(img, plane);
298  const int h = vpx_img_plane_height(img, plane);
299 
300  for (y = 0; y < h; ++y) {
301  fwrite(buf, bytes_per_sample, w, file);
302  buf += stride;
303  }
304  }
305 }
306 
307 static int file_is_raw(struct VpxInputContext *input) {
308  uint8_t buf[32];
309  int is_raw = 0;
311 
312  si.sz = sizeof(si);
313 
314  if (fread(buf, 1, 32, input->file) == 32) {
315  int i;
316 
317  if (mem_get_le32(buf) < 256 * 1024 * 1024) {
318  for (i = 0; i < get_vpx_decoder_count(); ++i) {
319  const VpxInterface *const decoder = get_vpx_decoder_by_index(i);
320  if (!vpx_codec_peek_stream_info(decoder->codec_interface(), buf + 4,
321  32 - 4, &si)) {
322  is_raw = 1;
323  input->fourcc = decoder->fourcc;
324  input->width = si.w;
325  input->height = si.h;
326  input->framerate.numerator = 30;
327  input->framerate.denominator = 1;
328  break;
329  }
330  }
331  }
332  }
333 
334  rewind(input->file);
335  return is_raw;
336 }
337 
/*
 * Prints a one-line progress report to stderr, ending in a carriage return
 * so that the next report overwrites it.
 *
 * |frame_in| is the number of frames decoded, |frame_out| the number shown,
 * and |dx_time| the accumulated decode time in microseconds.  |dx_time| is
 * unsigned, so it is printed with PRIu64 rather than PRId64.
 */
static void show_progress(int frame_in, int frame_out, uint64_t dx_time) {
  fprintf(stderr,
          "%d decoded frames/%d showed frames in %" PRIu64 " us (%.2f fps)\r",
          frame_in, frame_out, dx_time,
          (double)frame_out * 1000000.0 / (double)dx_time);
}
344 
/* One application-owned frame buffer lent to the decoder. */
struct ExternalFrameBuffer {
  uint8_t *data; /* Heap storage; NULL until the first request is served. */
  size_t size;   /* Number of bytes allocated at |data|. */
  int in_use;    /* Non-zero while the decoder holds the buffer. */
};

/* Fixed-size pool of external frame buffers, passed as callback data. */
struct ExternalFrameBufferList {
  int num_external_frame_buffers;     /* Number of entries in |ext_fb|. */
  struct ExternalFrameBuffer *ext_fb; /* Array of pool entries. */
};
355 
356 // Callback used by libvpx to request an external frame buffer. |cb_priv|
357 // Application private data passed into the set function. |min_size| is the
358 // minimum size in bytes needed to decode the next frame. |fb| pointer to the
359 // frame buffer.
360 static int get_vp9_frame_buffer(void *cb_priv, size_t min_size,
362  int i;
363  struct ExternalFrameBufferList *const ext_fb_list =
364  (struct ExternalFrameBufferList *)cb_priv;
365  if (ext_fb_list == NULL) return -1;
366 
367  // Find a free frame buffer.
368  for (i = 0; i < ext_fb_list->num_external_frame_buffers; ++i) {
369  if (!ext_fb_list->ext_fb[i].in_use) break;
370  }
371 
372  if (i == ext_fb_list->num_external_frame_buffers) return -1;
373 
374  if (ext_fb_list->ext_fb[i].size < min_size) {
375  free(ext_fb_list->ext_fb[i].data);
376  ext_fb_list->ext_fb[i].data = (uint8_t *)calloc(min_size, sizeof(uint8_t));
377  if (!ext_fb_list->ext_fb[i].data) return -1;
378 
379  ext_fb_list->ext_fb[i].size = min_size;
380  }
381 
382  fb->data = ext_fb_list->ext_fb[i].data;
383  fb->size = ext_fb_list->ext_fb[i].size;
384  ext_fb_list->ext_fb[i].in_use = 1;
385 
386  // Set the frame buffer's private data to point at the external frame buffer.
387  fb->priv = &ext_fb_list->ext_fb[i];
388  return 0;
389 }
390 
391 // Callback used by libvpx when there are no references to the frame buffer.
392 // |cb_priv| user private data passed into the set function. |fb| pointer
393 // to the frame buffer.
394 static int release_vp9_frame_buffer(void *cb_priv,
396  struct ExternalFrameBuffer *const ext_fb =
397  (struct ExternalFrameBuffer *)fb->priv;
398  (void)cb_priv;
399  ext_fb->in_use = 0;
400  return 0;
401 }
402 
/*
 * Expands an output file name pattern into |out|.
 *
 * |pattern| is copied literally except for two-character escapes:
 *   %w      -> |d_w|
 *   %h      -> |d_h|
 *   %1..%9  -> |frame_in|, zero padded to that many digits
 * Any other character after '%' is reported through die().
 *
 * |q_len| is the capacity of |out| in bytes.  A result that does not fit,
 * including an expansion that snprintf() had to truncate, is reported
 * through die() with "Output filename too long." rather than silently cut.
 *
 * The values are unsigned and are formatted with %u.
 */
static void generate_filename(const char *pattern, char *out, size_t q_len,
                              unsigned int d_w, unsigned int d_h,
                              unsigned int frame_in) {
  const char *p = pattern;
  char *q = out;

  do {
    const char *next_pat = strchr(p, '%');

    if (p == next_pat) {
      const char spec = p[1];
      int written;
      size_t pat_len;

      /* parse the pattern */
      q[q_len - 1] = '\0';
      if (spec == 'w') {
        written = snprintf(q, q_len - 1, "%u", d_w);
      } else if (spec == 'h') {
        written = snprintf(q, q_len - 1, "%u", d_h);
      } else if (spec >= '1' && spec <= '9') {
        /* The digit is the minimum field width, padded with zeros. */
        written = snprintf(q, q_len - 1, "%0*u", spec - '0', frame_in);
      } else {
        die("Unrecognized pattern %%%c\n", spec);
        /* die() is expected not to return; bail out safely if it does. */
        *q = '\0';
        return;
      }

      /* snprintf() returns the untruncated length, so this catches both an
       * encoding error and an expansion that did not fit. */
      if (written < 0 || (size_t)written >= q_len - 1) {
        die("Output filename too long.\n");
      }

      pat_len = strlen(q);
      q += pat_len;
      p += 2;
      q_len -= pat_len;
    } else {
      size_t copy_len;

      /* copy the next segment */
      if (!next_pat)
        copy_len = strlen(p);
      else
        copy_len = (size_t)(next_pat - p);

      if (copy_len >= q_len - 1) die("Output filename too long.\n");

      memcpy(q, p, copy_len);
      q[copy_len] = '\0';
      q += copy_len;
      p += copy_len;
      q_len -= copy_len;
    }
  } while (*p);
}
456 
/*
 * Reports whether |outfile_pattern| names a single output file.
 *
 * Returns 0 if any '%' is directly followed by a digit 1..9, which is the
 * frame-number escape and therefore yields a new name per frame.  Returns 1
 * otherwise.
 */
static int is_single_file(const char *outfile_pattern) {
  const char *cursor = strchr(outfile_pattern, '%');

  while (cursor != NULL) {
    const char spec = cursor[1];
    if (spec >= '1' && spec <= '9') {
      return 0; /* pattern contains sequence number, so it's not unique */
    }
    cursor = strchr(cursor + 1, '%');
  }

  return 1;
}
469 
/*
 * Prints the 16-byte |digest| to stdout as lowercase hex, followed by
 * |filename| and a newline.
 */
static void print_md5(unsigned char digest[16], const char *filename) {
  const unsigned char *byte = digest;
  const unsigned char *const end = digest + 16;

  while (byte != end) {
    printf("%02x", *byte);
    ++byte;
  }
  printf(" %s\n", filename);
}
476 
/*
 * Opens the output stream called |name|.
 *
 * "-" selects stdout, which is first passed to set_binary_mode().  Any other
 * name is opened for binary writing; a failed open is reported through
 * fatal().
 */
static FILE *open_outfile(const char *name) {
  FILE *file;

  if (strcmp("-", name) == 0) {
    set_binary_mode(stdout);
    return stdout;
  }

  file = fopen(name, "wb");
  if (file == NULL) fatal("Failed to open output file '%s'", name);
  return file;
}
487 
#if CONFIG_VP9_HIGHBITDEPTH
/*
 * Returns non-zero when the cached |shifted| image cannot be reused for
 * |img|: the display width, display height, or required format differs.
 */
static int img_shifted_realloc_required(const vpx_image_t *img,
                                        const vpx_image_t *shifted,
                                        vpx_img_fmt_t required_fmt) {
  if (img->d_w != shifted->d_w) return 1;
  if (img->d_h != shifted->d_h) return 1;
  return required_fmt != shifted->fmt;
}
#endif
496 
497 static int main_loop(int argc, const char **argv_) {
498  vpx_codec_ctx_t decoder;
499  char *fn = NULL;
500  int i;
501  int ret = EXIT_FAILURE;
502  uint8_t *buf = NULL;
503  size_t bytes_in_buffer = 0, buffer_size = 0;
504  FILE *infile;
505  int frame_in = 0, frame_out = 0, flipuv = 0, noblit = 0;
506  int do_md5 = 0, progress = 0;
507  int stop_after = 0, postproc = 0, summary = 0, quiet = 1;
508  int arg_skip = 0;
509  int ec_enabled = 0;
510  int keep_going = 0;
511  int enable_row_mt = 0;
512  const VpxInterface *interface = NULL;
513  const VpxInterface *fourcc_interface = NULL;
514  uint64_t dx_time = 0;
515  struct arg arg;
516  char **argv, **argi, **argj;
517 
518  int single_file;
519  int use_y4m = 1;
520  int opt_yv12 = 0;
521  int opt_i420 = 0;
522  vpx_codec_dec_cfg_t cfg = { 0, 0, 0 };
523 #if CONFIG_VP9_HIGHBITDEPTH
524  unsigned int output_bit_depth = 0;
525 #endif
526  int svc_decoding = 0;
527  int svc_spatial_layer = 0;
528 #if CONFIG_VP8_DECODER
529  vp8_postproc_cfg_t vp8_pp_cfg = { 0, 0, 0 };
530 #endif
531  int frames_corrupted = 0;
532  int dec_flags = 0;
533  int do_scale = 0;
534  vpx_image_t *scaled_img = NULL;
535 #if CONFIG_VP9_HIGHBITDEPTH
536  vpx_image_t *img_shifted = NULL;
537 #endif
538  int frame_avail, got_data, flush_decoder = 0;
539  int num_external_frame_buffers = 0;
540  struct ExternalFrameBufferList ext_fb_list = { 0, NULL };
541 
542  const char *outfile_pattern = NULL;
543  char outfile_name[PATH_MAX] = { 0 };
544  FILE *outfile = NULL;
545 
546  FILE *framestats_file = NULL;
547 
548  MD5Context md5_ctx;
549  unsigned char md5_digest[16];
550 
551  struct VpxDecInputContext input = { NULL, NULL };
552  struct VpxInputContext vpx_input_ctx;
553 #if CONFIG_WEBM_IO
554  struct WebmInputContext webm_ctx;
555  memset(&(webm_ctx), 0, sizeof(webm_ctx));
556  input.webm_ctx = &webm_ctx;
557 #endif
558  input.vpx_input_ctx = &vpx_input_ctx;
559 
560  /* Parse command line */
561  exec_name = argv_[0];
562  argv = argv_dup(argc - 1, argv_ + 1);
563 
564  for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
565  memset(&arg, 0, sizeof(arg));
566  arg.argv_step = 1;
567 
568  if (arg_match(&arg, &help, argi)) {
569  show_help(stdout, 0);
570  exit(EXIT_SUCCESS);
571  } else if (arg_match(&arg, &codecarg, argi)) {
572  interface = get_vpx_decoder_by_name(arg.val);
573  if (!interface)
574  die("Error: Unrecognized argument (%s) to --codec\n", arg.val);
575  } else if (arg_match(&arg, &looparg, argi)) {
576  // no-op
577  } else if (arg_match(&arg, &outputfile, argi))
578  outfile_pattern = arg.val;
579  else if (arg_match(&arg, &use_yv12, argi)) {
580  use_y4m = 0;
581  flipuv = 1;
582  opt_yv12 = 1;
583  } else if (arg_match(&arg, &use_i420, argi)) {
584  use_y4m = 0;
585  flipuv = 0;
586  opt_i420 = 1;
587  } else if (arg_match(&arg, &rawvideo, argi)) {
588  use_y4m = 0;
589  } else if (arg_match(&arg, &flipuvarg, argi))
590  flipuv = 1;
591  else if (arg_match(&arg, &noblitarg, argi))
592  noblit = 1;
593  else if (arg_match(&arg, &progressarg, argi))
594  progress = 1;
595  else if (arg_match(&arg, &limitarg, argi))
596  stop_after = arg_parse_uint(&arg);
597  else if (arg_match(&arg, &skiparg, argi))
598  arg_skip = arg_parse_uint(&arg);
599  else if (arg_match(&arg, &postprocarg, argi))
600  postproc = 1;
601  else if (arg_match(&arg, &md5arg, argi))
602  do_md5 = 1;
603  else if (arg_match(&arg, &summaryarg, argi))
604  summary = 1;
605  else if (arg_match(&arg, &threadsarg, argi))
606  cfg.threads = arg_parse_uint(&arg);
607 #if CONFIG_VP9_DECODER
608  else if (arg_match(&arg, &frameparallelarg, argi)) {
609  /* ignored for compatibility */
610  }
611 #endif
612  else if (arg_match(&arg, &verbosearg, argi))
613  quiet = 0;
614  else if (arg_match(&arg, &scalearg, argi))
615  do_scale = 1;
616  else if (arg_match(&arg, &fb_arg, argi))
617  num_external_frame_buffers = arg_parse_uint(&arg);
618  else if (arg_match(&arg, &continuearg, argi))
619  keep_going = 1;
620 #if CONFIG_VP9_HIGHBITDEPTH
621  else if (arg_match(&arg, &outbitdeptharg, argi)) {
622  output_bit_depth = arg_parse_uint(&arg);
623  }
624 #endif
625  else if (arg_match(&arg, &svcdecodingarg, argi)) {
626  svc_decoding = 1;
627  svc_spatial_layer = arg_parse_uint(&arg);
628  } else if (arg_match(&arg, &framestatsarg, argi)) {
629  framestats_file = fopen(arg.val, "w");
630  if (!framestats_file) {
631  die("Error: Could not open --framestats file (%s) for writing.\n",
632  arg.val);
633  }
634  } else if (arg_match(&arg, &rowmtarg, argi)) {
635  enable_row_mt = arg_parse_uint(&arg);
636  }
637 #if CONFIG_VP8_DECODER
638  else if (arg_match(&arg, &addnoise_level, argi)) {
639  postproc = 1;
640  vp8_pp_cfg.post_proc_flag |= VP8_ADDNOISE;
641  vp8_pp_cfg.noise_level = arg_parse_uint(&arg);
642  } else if (arg_match(&arg, &demacroblock_level, argi)) {
643  postproc = 1;
644  vp8_pp_cfg.post_proc_flag |= VP8_DEMACROBLOCK;
645  vp8_pp_cfg.deblocking_level = arg_parse_uint(&arg);
646  } else if (arg_match(&arg, &deblock, argi)) {
647  postproc = 1;
648  vp8_pp_cfg.post_proc_flag |= VP8_DEBLOCK;
649  } else if (arg_match(&arg, &mfqe, argi)) {
650  postproc = 1;
651  vp8_pp_cfg.post_proc_flag |= VP8_MFQE;
652  } else if (arg_match(&arg, &error_concealment, argi)) {
653  ec_enabled = 1;
654  }
655 #endif // CONFIG_VP8_DECODER
656  else
657  argj++;
658  }
659 
660  /* Check for unrecognized options */
661  for (argi = argv; *argi; argi++)
662  if (argi[0][0] == '-' && strlen(argi[0]) > 1)
663  die("Error: Unrecognized option %s\n", *argi);
664 
665  /* Handle non-option arguments */
666  fn = argv[0];
667 
668  if (!fn) {
669  free(argv);
670  fprintf(stderr, "No input file specified!\n");
671  usage_exit();
672  }
673  /* Open file */
674  infile = strcmp(fn, "-") ? fopen(fn, "rb") : set_binary_mode(stdin);
675 
676  if (!infile) {
677  fatal("Failed to open input file '%s'", strcmp(fn, "-") ? fn : "stdin");
678  }
679 #if CONFIG_OS_SUPPORT
680  /* Make sure we don't dump to the terminal, unless forced to with -o - */
681  if (!outfile_pattern && isatty(fileno(stdout)) && !do_md5 && !noblit) {
682  fprintf(stderr,
683  "Not dumping raw video to your terminal. Use '-o -' to "
684  "override.\n");
685  return EXIT_FAILURE;
686  }
687 #endif
688  input.vpx_input_ctx->file = infile;
689  if (file_is_ivf(input.vpx_input_ctx))
690  input.vpx_input_ctx->file_type = FILE_TYPE_IVF;
691 #if CONFIG_WEBM_IO
692  else if (file_is_webm(input.webm_ctx, input.vpx_input_ctx))
693  input.vpx_input_ctx->file_type = FILE_TYPE_WEBM;
694 #endif
695  else if (file_is_raw(input.vpx_input_ctx))
696  input.vpx_input_ctx->file_type = FILE_TYPE_RAW;
697  else {
698  fprintf(stderr, "Unrecognized input file type.\n");
699 #if !CONFIG_WEBM_IO
700  fprintf(stderr, "vpxdec was built without WebM container support.\n");
701 #endif
702  return EXIT_FAILURE;
703  }
704 
705  outfile_pattern = outfile_pattern ? outfile_pattern : "-";
706  single_file = is_single_file(outfile_pattern);
707 
708  if (!noblit && single_file) {
709  generate_filename(outfile_pattern, outfile_name, PATH_MAX,
710  vpx_input_ctx.width, vpx_input_ctx.height, 0);
711  if (do_md5)
712  MD5Init(&md5_ctx);
713  else
714  outfile = open_outfile(outfile_name);
715  }
716 
717  if (use_y4m && !noblit) {
718  if (!single_file) {
719  fprintf(stderr,
720  "YUV4MPEG2 not supported with output patterns,"
721  " try --i420 or --yv12 or --rawvideo.\n");
722  return EXIT_FAILURE;
723  }
724 
725 #if CONFIG_WEBM_IO
726  if (vpx_input_ctx.file_type == FILE_TYPE_WEBM) {
727  if (webm_guess_framerate(input.webm_ctx, input.vpx_input_ctx)) {
728  fprintf(stderr,
729  "Failed to guess framerate -- error parsing "
730  "webm file?\n");
731  return EXIT_FAILURE;
732  }
733  }
734 #endif
735  }
736 
737  fourcc_interface = get_vpx_decoder_by_fourcc(vpx_input_ctx.fourcc);
738  if (interface && fourcc_interface && interface != fourcc_interface)
739  warn("Header indicates codec: %s\n", fourcc_interface->name);
740  else
741  interface = fourcc_interface;
742 
743  if (!interface) interface = get_vpx_decoder_by_index(0);
744 
745  dec_flags = (postproc ? VPX_CODEC_USE_POSTPROC : 0) |
746  (ec_enabled ? VPX_CODEC_USE_ERROR_CONCEALMENT : 0);
747  if (vpx_codec_dec_init(&decoder, interface->codec_interface(), &cfg,
748  dec_flags)) {
749  fprintf(stderr, "Failed to initialize decoder: %s\n",
750  vpx_codec_error(&decoder));
751  goto fail2;
752  }
753  if (svc_decoding) {
755  svc_spatial_layer)) {
756  fprintf(stderr, "Failed to set spatial layer for svc decode: %s\n",
757  vpx_codec_error(&decoder));
758  goto fail;
759  }
760  }
761  if (interface->fourcc == VP9_FOURCC &&
762  vpx_codec_control(&decoder, VP9D_SET_ROW_MT, enable_row_mt)) {
763  fprintf(stderr, "Failed to set decoder in row multi-thread mode: %s\n",
764  vpx_codec_error(&decoder));
765  goto fail;
766  }
767  if (!quiet) fprintf(stderr, "%s\n", decoder.name);
768 
769 #if CONFIG_VP8_DECODER
770  if (vp8_pp_cfg.post_proc_flag &&
771  vpx_codec_control(&decoder, VP8_SET_POSTPROC, &vp8_pp_cfg)) {
772  fprintf(stderr, "Failed to configure postproc: %s\n",
773  vpx_codec_error(&decoder));
774  goto fail;
775  }
776 #endif
777 
778  if (arg_skip) fprintf(stderr, "Skipping first %d frames.\n", arg_skip);
779  while (arg_skip) {
780  if (read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) break;
781  arg_skip--;
782  }
783 
784  if (num_external_frame_buffers > 0) {
785  ext_fb_list.num_external_frame_buffers = num_external_frame_buffers;
786  ext_fb_list.ext_fb = (struct ExternalFrameBuffer *)calloc(
787  num_external_frame_buffers, sizeof(*ext_fb_list.ext_fb));
788  if (vpx_codec_set_frame_buffer_functions(&decoder, get_vp9_frame_buffer,
789  release_vp9_frame_buffer,
790  &ext_fb_list)) {
791  fprintf(stderr, "Failed to configure external frame buffers: %s\n",
792  vpx_codec_error(&decoder));
793  goto fail;
794  }
795  }
796 
797  frame_avail = 1;
798  got_data = 0;
799 
800  if (framestats_file) fprintf(framestats_file, "bytes,qp\n");
801 
802  /* Decode file */
803  while (frame_avail || got_data) {
804  vpx_codec_iter_t iter = NULL;
805  vpx_image_t *img;
806  struct vpx_usec_timer timer;
807  int corrupted = 0;
808 
809  frame_avail = 0;
810  if (!stop_after || frame_in < stop_after) {
811  if (!read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) {
812  frame_avail = 1;
813  frame_in++;
814 
815  vpx_usec_timer_start(&timer);
816 
817  if (vpx_codec_decode(&decoder, buf, (unsigned int)bytes_in_buffer, NULL,
818  0)) {
819  const char *detail = vpx_codec_error_detail(&decoder);
820  warn("Failed to decode frame %d: %s", frame_in,
821  vpx_codec_error(&decoder));
822  if (detail) warn("Additional information: %s", detail);
823  corrupted = 1;
824  if (!keep_going) goto fail;
825  }
826 
827  if (framestats_file) {
828  int qp;
829  if (vpx_codec_control(&decoder, VPXD_GET_LAST_QUANTIZER, &qp)) {
830  warn("Failed VPXD_GET_LAST_QUANTIZER: %s",
831  vpx_codec_error(&decoder));
832  if (!keep_going) goto fail;
833  }
834  fprintf(framestats_file, "%d,%d\n", (int)bytes_in_buffer, qp);
835  }
836 
837  vpx_usec_timer_mark(&timer);
838  dx_time += vpx_usec_timer_elapsed(&timer);
839  } else {
840  flush_decoder = 1;
841  }
842  } else {
843  flush_decoder = 1;
844  }
845 
846  vpx_usec_timer_start(&timer);
847 
848  if (flush_decoder) {
849  // Flush the decoder in frame parallel decode.
850  if (vpx_codec_decode(&decoder, NULL, 0, NULL, 0)) {
851  warn("Failed to flush decoder: %s", vpx_codec_error(&decoder));
852  corrupted = 1;
853  if (!keep_going) goto fail;
854  }
855  }
856 
857  got_data = 0;
858  if ((img = vpx_codec_get_frame(&decoder, &iter))) {
859  ++frame_out;
860  got_data = 1;
861  }
862 
863  vpx_usec_timer_mark(&timer);
864  dx_time += (unsigned int)vpx_usec_timer_elapsed(&timer);
865 
866  if (!corrupted &&
867  vpx_codec_control(&decoder, VP8D_GET_FRAME_CORRUPTED, &corrupted)) {
868  warn("Failed VP8_GET_FRAME_CORRUPTED: %s", vpx_codec_error(&decoder));
869  if (!keep_going) goto fail;
870  }
871  frames_corrupted += corrupted;
872 
873  if (progress) show_progress(frame_in, frame_out, dx_time);
874 
875  if (!noblit && img) {
876  const int PLANES_YUV[] = { VPX_PLANE_Y, VPX_PLANE_U, VPX_PLANE_V };
877  const int PLANES_YVU[] = { VPX_PLANE_Y, VPX_PLANE_V, VPX_PLANE_U };
878  const int *planes = flipuv ? PLANES_YVU : PLANES_YUV;
879 
880  if (do_scale) {
881  if (frame_out == 1) {
882  // If the output frames are to be scaled to a fixed display size then
883  // use the width and height specified in the container. If either of
884  // these is set to 0, use the display size set in the first frame
885  // header. If that is unavailable, use the raw decoded size of the
886  // first decoded frame.
887  int render_width = vpx_input_ctx.width;
888  int render_height = vpx_input_ctx.height;
889  if (!render_width || !render_height) {
890  int render_size[2];
892  render_size)) {
893  // As last resort use size of first frame as display size.
894  render_width = img->d_w;
895  render_height = img->d_h;
896  } else {
897  render_width = render_size[0];
898  render_height = render_size[1];
899  }
900  }
901  scaled_img =
902  vpx_img_alloc(NULL, img->fmt, render_width, render_height, 16);
903  scaled_img->bit_depth = img->bit_depth;
904  }
905 
906  if (img->d_w != scaled_img->d_w || img->d_h != scaled_img->d_h) {
907 #if CONFIG_LIBYUV
908  libyuv_scale(img, scaled_img, kFilterBox);
909  img = scaled_img;
910 #else
911  fprintf(stderr,
912  "Failed to scale output frame: %s.\n"
913  "Scaling is disabled in this configuration. "
914  "To enable scaling, configure with --enable-libyuv\n",
915  vpx_codec_error(&decoder));
916  goto fail;
917 #endif
918  }
919  }
920 #if CONFIG_VP9_HIGHBITDEPTH
921  // Default to codec bit depth if output bit depth not set
922  if (!output_bit_depth && single_file && !do_md5) {
923  output_bit_depth = img->bit_depth;
924  }
925  // Shift up or down if necessary
926  if (output_bit_depth != 0 && output_bit_depth != img->bit_depth) {
927  const vpx_img_fmt_t shifted_fmt =
928  output_bit_depth == 8
929  ? img->fmt ^ (img->fmt & VPX_IMG_FMT_HIGHBITDEPTH)
930  : img->fmt | VPX_IMG_FMT_HIGHBITDEPTH;
931  if (img_shifted &&
932  img_shifted_realloc_required(img, img_shifted, shifted_fmt)) {
933  vpx_img_free(img_shifted);
934  img_shifted = NULL;
935  }
936  if (!img_shifted) {
937  img_shifted =
938  vpx_img_alloc(NULL, shifted_fmt, img->d_w, img->d_h, 16);
939  img_shifted->bit_depth = output_bit_depth;
940  }
941  if (output_bit_depth > img->bit_depth) {
942  vpx_img_upshift(img_shifted, img, output_bit_depth - img->bit_depth);
943  } else {
944  vpx_img_downshift(img_shifted, img,
945  img->bit_depth - output_bit_depth);
946  }
947  img = img_shifted;
948  }
949 #endif
950 
951  if (single_file) {
952  if (use_y4m) {
953  char buf[Y4M_BUFFER_SIZE] = { 0 };
954  size_t len = 0;
955  if (img->fmt == VPX_IMG_FMT_I440 || img->fmt == VPX_IMG_FMT_I44016) {
956  fprintf(stderr, "Cannot produce y4m output for 440 sampling.\n");
957  goto fail;
958  }
959  if (frame_out == 1) {
960  // Y4M file header
961  len = y4m_write_file_header(
962  buf, sizeof(buf), vpx_input_ctx.width, vpx_input_ctx.height,
963  &vpx_input_ctx.framerate, img->fmt, img->bit_depth);
964  if (do_md5) {
965  MD5Update(&md5_ctx, (md5byte *)buf, (unsigned int)len);
966  } else {
967  fputs(buf, outfile);
968  }
969  }
970 
971  // Y4M frame header
972  len = y4m_write_frame_header(buf, sizeof(buf));
973  if (do_md5) {
974  MD5Update(&md5_ctx, (md5byte *)buf, (unsigned int)len);
975  } else {
976  fputs(buf, outfile);
977  }
978  } else {
979  if (frame_out == 1) {
980  // Check if --yv12 or --i420 options are consistent with the
981  // bit-stream decoded
982  if (opt_i420) {
983  if (img->fmt != VPX_IMG_FMT_I420 &&
984  img->fmt != VPX_IMG_FMT_I42016) {
985  fprintf(stderr, "Cannot produce i420 output for bit-stream.\n");
986  goto fail;
987  }
988  }
989  if (opt_yv12) {
990  if ((img->fmt != VPX_IMG_FMT_I420 &&
991  img->fmt != VPX_IMG_FMT_YV12) ||
992  img->bit_depth != 8) {
993  fprintf(stderr, "Cannot produce yv12 output for bit-stream.\n");
994  goto fail;
995  }
996  }
997  }
998  }
999 
1000  if (do_md5) {
1001  update_image_md5(img, planes, &md5_ctx);
1002  } else {
1003  if (!corrupted) write_image_file(img, planes, outfile);
1004  }
1005  } else {
1006  generate_filename(outfile_pattern, outfile_name, PATH_MAX, img->d_w,
1007  img->d_h, frame_in);
1008  if (do_md5) {
1009  MD5Init(&md5_ctx);
1010  update_image_md5(img, planes, &md5_ctx);
1011  MD5Final(md5_digest, &md5_ctx);
1012  print_md5(md5_digest, outfile_name);
1013  } else {
1014  outfile = open_outfile(outfile_name);
1015  write_image_file(img, planes, outfile);
1016  fclose(outfile);
1017  }
1018  }
1019  }
1020  }
1021 
1022  if (summary || progress) {
1023  show_progress(frame_in, frame_out, dx_time);
1024  fprintf(stderr, "\n");
1025  }
1026 
1027  if (frames_corrupted) {
1028  fprintf(stderr, "WARNING: %d frames corrupted.\n", frames_corrupted);
1029  } else {
1030  ret = EXIT_SUCCESS;
1031  }
1032 
1033 fail:
1034 
1035  if (vpx_codec_destroy(&decoder)) {
1036  fprintf(stderr, "Failed to destroy decoder: %s\n",
1037  vpx_codec_error(&decoder));
1038  }
1039 
1040 fail2:
1041 
1042  if (!noblit && single_file) {
1043  if (do_md5) {
1044  MD5Final(md5_digest, &md5_ctx);
1045  print_md5(md5_digest, outfile_name);
1046  } else {
1047  fclose(outfile);
1048  }
1049  }
1050 
1051 #if CONFIG_WEBM_IO
1052  if (input.vpx_input_ctx->file_type == FILE_TYPE_WEBM)
1053  webm_free(input.webm_ctx);
1054 #endif
1055 
1056  if (input.vpx_input_ctx->file_type != FILE_TYPE_WEBM) free(buf);
1057 
1058  if (scaled_img) vpx_img_free(scaled_img);
1059 #if CONFIG_VP9_HIGHBITDEPTH
1060  if (img_shifted) vpx_img_free(img_shifted);
1061 #endif
1062 
1063  for (i = 0; i < ext_fb_list.num_external_frame_buffers; ++i) {
1064  free(ext_fb_list.ext_fb[i].data);
1065  }
1066  free(ext_fb_list.ext_fb);
1067 
1068  fclose(infile);
1069  if (framestats_file) fclose(framestats_file);
1070 
1071  free(argv);
1072 
1073  return ret;
1074 }
1075 
1076 int main(int argc, const char **argv_) {
1077  unsigned int loops = 1, i;
1078  char **argv, **argi, **argj;
1079  struct arg arg;
1080  int error = 0;
1081 
1082  argv = argv_dup(argc - 1, argv_ + 1);
1083  for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
1084  memset(&arg, 0, sizeof(arg));
1085  arg.argv_step = 1;
1086 
1087  if (arg_match(&arg, &looparg, argi)) {
1088  loops = arg_parse_uint(&arg);
1089  break;
1090  }
1091  }
1092  free(argv);
1093  for (i = 0; !error && i < loops; i++) error = main_loop(argc, argv_);
1094  return error;
1095 }
Definition: vpx_image.h:49
Image Descriptor.
Definition: vpx_image.h:71
Describes the decoder algorithm interface to applications.
const char * vpx_codec_iface_name(vpx_codec_iface_t *iface)
Return the name for a given interface.
Definition: vpx_image.h:40
unsigned int threads
Definition: vpx_decoder.h:108
unsigned int sz
Definition: vpx_decoder.h:90
Stream properties.
Definition: vpx_decoder.h:89
Definition: vp8dx.h:85
int noise_level
Definition: vp8.h:93
unsigned int bit_depth
Definition: vpx_image.h:79
Provides definitions for using VP8 or VP9 within the vpx Decoder interface.
vpx_codec_err_t vpx_codec_peek_stream_info(vpx_codec_iface_t *iface, const uint8_t *data, unsigned int data_sz, vpx_codec_stream_info_t *si)
Parse stream info from a buffer.
#define VPX_PLANE_Y
Definition: vpx_image.h:95
uint8_t * data
Definition: vpx_frame_buffer.h:40
const char * name
Definition: vpx_codec.h:198
#define VPX_PLANE_V
Definition: vpx_image.h:97
Codec control function to get last decoded frame quantizer.
Definition: vp8dx.h:125
#define VPX_IMG_FMT_HIGHBITDEPTH
Definition: vpx_image.h:35
Definition: vp8dx.h:117
vpx_image_t * vpx_img_alloc(vpx_image_t *img, vpx_img_fmt_t fmt, unsigned int d_w, unsigned int d_h, unsigned int align)
Open a descriptor, allocating storage for the underlying image.
Definition: vpx_image.h:42
unsigned int d_w
Definition: vpx_image.h:82
#define vpx_codec_dec_init(ctx, iface, cfg, flags)
Convenience macro for vpx_codec_dec_init_ver()
Definition: vpx_decoder.h:144
vpx_codec_err_t vpx_codec_decode(vpx_codec_ctx_t *ctx, const uint8_t *data, unsigned int data_sz, void *user_priv, long deadline)
Decode data.
enum vpx_img_fmt vpx_img_fmt_t
List of supported image formats.
size_t size
Definition: vpx_frame_buffer.h:41
int stride[4]
Definition: vpx_image.h:100
void vpx_img_free(vpx_image_t *img)
Close an image descriptor.
vpx_img_fmt_t fmt
Definition: vpx_image.h:72
unsigned char * planes[4]
Definition: vpx_image.h:99
Definition: vp8.h:49
#define VPX_CODEC_USE_POSTPROC
Definition: vpx_decoder.h:74
Definition: vp8dx.h:63
Codec control function to set row level multi-threading.
Definition: vp8dx.h:133
const char * vpx_codec_error_detail(vpx_codec_ctx_t *ctx)
Retrieve detailed error information for codec context.
void * priv
Definition: vpx_frame_buffer.h:42
#define VPX_PLANE_U
Definition: vpx_image.h:96
int deblocking_level
Definition: vp8.h:92
unsigned int w
Definition: vpx_decoder.h:91
External frame buffer.
Definition: vpx_frame_buffer.h:39
#define vpx_codec_control(ctx, id, data)
vpx_codec_control wrapper macro
Definition: vpx_codec.h:404
vpx_codec_err_t vpx_codec_destroy(vpx_codec_ctx_t *ctx)
Destroy a codec instance.
unsigned int d_h
Definition: vpx_image.h:83
post process flags
Definition: vp8.h:88
vpx_codec_err_t vpx_codec_set_frame_buffer_functions(vpx_codec_ctx_t *ctx, vpx_get_frame_buffer_cb_fn_t cb_get, vpx_release_frame_buffer_cb_fn_t cb_release, void *cb_priv)
Pass in external frame buffers for the decoder to use.
unsigned int h
Definition: vpx_decoder.h:92
const char * vpx_codec_error(vpx_codec_ctx_t *ctx)
Retrieve error synopsis for codec context.
Initialization Configurations.
Definition: vpx_decoder.h:107
Definition: vpx_image.h:45
const void * vpx_codec_iter_t
Iterator.
Definition: vpx_codec.h:187
vpx_image_t * vpx_codec_get_frame(vpx_codec_ctx_t *ctx, vpx_codec_iter_t *iter)
Decoded frames iterator.
int post_proc_flag
the types of post processing to be done, should be combination of "vp8_postproc_level" ...
Definition: vp8.h:91
Codec context structure.
Definition: vpx_codec.h:197