/*
 * Repository viewer header (not part of the program):
 *   Add ssse3 aom_smooth_v_predictor_16,32,64xh
 *   [aom.git] / aomdec.c
 *   blob 54cbecb49186b8a19ae0d0f41bf929b55a01e5d6
 */
/*
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */
#include <assert.h>
#include <inttypes.h>
#include <limits.h>
#include <stdarg.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#include "./aom_config.h"

#if CONFIG_OS_SUPPORT
#if HAVE_UNISTD_H
#include <unistd.h>  // NOLINT
#elif !defined(STDOUT_FILENO)
#define STDOUT_FILENO 1
#endif
#endif

#if CONFIG_LIBYUV
#include "third_party/libyuv/include/libyuv/scale.h"
#endif

#include "./args.h"
#include "./ivfdec.h"

#include "aom/aom_decoder.h"
#include "aom_ports/mem_ops.h"
#include "aom_ports/aom_timer.h"

#if CONFIG_AV1_DECODER
#include "aom/aomdx.h"
#endif

#include "./md5_utils.h"

#if CONFIG_OBU_NO_IVF
#include "./obudec.h"
#endif

#include "./tools_common.h"
#if CONFIG_WEBM_IO
#include "./webmdec.h"
#endif

#include "./y4menc.h"
/* Program name as invoked; set from argv_[0] in main_loop() and printed in
 * the usage banner by show_help(). */
static const char *exec_name;
/* Pairs the generic input context with the WebM-specific one so that
 * read_frame() can dispatch on the file type through a single pointer. */
struct AvxDecInputContext {
  struct AvxInputContext *aom_input_ctx;
  struct WebmInputContext *webm_ctx;
};
64 static const arg_def_t help =
65 ARG_DEF(NULL, "help", 0, "Show usage options and exit");
66 static const arg_def_t looparg =
67 ARG_DEF(NULL, "loops", 1, "Number of times to decode the file");
68 static const arg_def_t codecarg = ARG_DEF(NULL, "codec", 1, "Codec to use");
69 static const arg_def_t use_yv12 =
70 ARG_DEF(NULL, "yv12", 0, "Output raw YV12 frames");
71 static const arg_def_t use_i420 =
72 ARG_DEF(NULL, "i420", 0, "Output raw I420 frames");
73 static const arg_def_t flipuvarg =
74 ARG_DEF(NULL, "flipuv", 0, "Flip the chroma planes in the output");
75 static const arg_def_t rawvideo =
76 ARG_DEF(NULL, "rawvideo", 0, "Output raw YUV frames");
77 static const arg_def_t noblitarg =
78 ARG_DEF(NULL, "noblit", 0, "Don't process the decoded frames");
79 static const arg_def_t progressarg =
80 ARG_DEF(NULL, "progress", 0, "Show progress after each frame decodes");
81 static const arg_def_t limitarg =
82 ARG_DEF(NULL, "limit", 1, "Stop decoding after n frames");
83 static const arg_def_t skiparg =
84 ARG_DEF(NULL, "skip", 1, "Skip the first n input frames");
85 static const arg_def_t postprocarg =
86 ARG_DEF(NULL, "postproc", 0, "Postprocess decoded frames");
87 static const arg_def_t summaryarg =
88 ARG_DEF(NULL, "summary", 0, "Show timing summary");
89 static const arg_def_t outputfile =
90 ARG_DEF("o", "output", 1, "Output file name pattern (see below)");
91 static const arg_def_t threadsarg =
92 ARG_DEF("t", "threads", 1, "Max threads to use");
93 static const arg_def_t verbosearg =
94 ARG_DEF("v", "verbose", 0, "Show version string");
95 static const arg_def_t scalearg =
96 ARG_DEF("S", "scale", 0, "Scale output frames uniformly");
97 static const arg_def_t continuearg =
98 ARG_DEF("k", "keep-going", 0, "(debug) Continue decoding after error");
99 static const arg_def_t fb_arg =
100 ARG_DEF(NULL, "frame-buffers", 1, "Number of frame buffers to use");
101 static const arg_def_t md5arg =
102 ARG_DEF(NULL, "md5", 0, "Compute the MD5 sum of the decoded frame");
103 static const arg_def_t framestatsarg =
104 ARG_DEF(NULL, "framestats", 1, "Output per-frame stats (.csv format)");
105 static const arg_def_t outbitdeptharg =
106 ARG_DEF(NULL, "output-bit-depth", 1, "Output bit-depth for decoded frames");
107 static const arg_def_t tilem = ARG_DEF(NULL, "tile-mode", 1,
108 "Tile coding mode "
109 "(0 for normal tile coding mode)");
110 static const arg_def_t tiler = ARG_DEF(NULL, "tile-row", 1,
111 "Row index of tile to decode "
112 "(-1 for all rows)");
113 static const arg_def_t tilec = ARG_DEF(NULL, "tile-column", 1,
114 "Column index of tile to decode "
115 "(-1 for all columns)");
117 static const arg_def_t *all_args[] = {
118 &help, &codecarg, &use_yv12, &use_i420, &flipuvarg,
119 &rawvideo, &noblitarg, &progressarg, &limitarg, &skiparg,
120 &postprocarg, &summaryarg, &outputfile, &threadsarg, &verbosearg,
121 &scalearg, &fb_arg, &md5arg, &framestatsarg, &continuearg,
122 &outbitdeptharg, &tilem, &tiler, &tilec, NULL
#if CONFIG_LIBYUV
/* Scales |src| into |dst| with libyuv using filter |mode| and returns the
 * libyuv result. Only I420 (8-bit) and I42016 (16-bit) are handled; |src| and
 * |dst| must share the same format (asserted). */
static INLINE int libyuv_scale(aom_image_t *src, aom_image_t *dst,
                               FilterModeEnum mode) {
  if (src->fmt == AOM_IMG_FMT_I42016) {
    assert(dst->fmt == AOM_IMG_FMT_I42016);
    /* Strides are halved for the uint16_t entry point -- presumably because
     * aom_image_t strides are in bytes; confirm against aom_image.h. */
    return I420Scale_16(
        (uint16_t *)src->planes[AOM_PLANE_Y], src->stride[AOM_PLANE_Y] / 2,
        (uint16_t *)src->planes[AOM_PLANE_U], src->stride[AOM_PLANE_U] / 2,
        (uint16_t *)src->planes[AOM_PLANE_V], src->stride[AOM_PLANE_V] / 2,
        src->d_w, src->d_h, (uint16_t *)dst->planes[AOM_PLANE_Y],
        dst->stride[AOM_PLANE_Y] / 2, (uint16_t *)dst->planes[AOM_PLANE_U],
        dst->stride[AOM_PLANE_U] / 2, (uint16_t *)dst->planes[AOM_PLANE_V],
        dst->stride[AOM_PLANE_V] / 2, dst->d_w, dst->d_h, mode);
  }
  assert(src->fmt == AOM_IMG_FMT_I420);
  assert(dst->fmt == AOM_IMG_FMT_I420);
  return I420Scale(src->planes[AOM_PLANE_Y], src->stride[AOM_PLANE_Y],
                   src->planes[AOM_PLANE_U], src->stride[AOM_PLANE_U],
                   src->planes[AOM_PLANE_V], src->stride[AOM_PLANE_V], src->d_w,
                   src->d_h, dst->planes[AOM_PLANE_Y], dst->stride[AOM_PLANE_Y],
                   dst->planes[AOM_PLANE_U], dst->stride[AOM_PLANE_U],
                   dst->planes[AOM_PLANE_V], dst->stride[AOM_PLANE_V], dst->d_w,
                   dst->d_h, mode);
}
#endif
151 void show_help(FILE *fout, int shorthelp) {
152 fprintf(fout, "Usage: %s <options> filename\n\n", exec_name);
154 if (shorthelp) {
155 fprintf(fout, "Use --help to see the full list of options.\n");
156 return;
159 fprintf(fout, "Options:\n");
160 arg_show_usage(fout, all_args);
161 fprintf(fout,
162 "\nOutput File Patterns:\n\n"
163 " The -o argument specifies the name of the file(s) to "
164 "write to. If the\n argument does not include any escape "
165 "characters, the output will be\n written to a single file. "
166 "Otherwise, the filename will be calculated by\n expanding "
167 "the following escape characters:\n");
168 fprintf(fout,
169 "\n\t%%w - Frame width"
170 "\n\t%%h - Frame height"
171 "\n\t%%<n> - Frame number, zero padded to <n> places (1..9)"
172 "\n\n Pattern arguments are only supported in conjunction "
173 "with the --yv12 and\n --i420 options. If the -o option is "
174 "not specified, the output will be\n directed to stdout.\n");
175 fprintf(fout, "\nIncluded decoders:\n\n");
177 for (int i = 0; i < get_aom_decoder_count(); ++i) {
178 const AvxInterface *const decoder = get_aom_decoder_by_index(i);
179 fprintf(fout, " %-6s - %s\n", decoder->name,
180 aom_codec_iface_name(decoder->codec_interface()));
/* Prints the short usage message to stderr and terminates the process with
 * EXIT_FAILURE. */
void usage_exit(void) {
  show_help(stderr, 1);
  exit(EXIT_FAILURE);
}
189 static int raw_read_frame(FILE *infile, uint8_t **buffer, size_t *bytes_read,
190 size_t *buffer_size) {
191 char raw_hdr[RAW_FRAME_HDR_SZ];
192 size_t frame_size = 0;
194 if (fread(raw_hdr, RAW_FRAME_HDR_SZ, 1, infile) != 1) {
195 if (!feof(infile)) warn("Failed to read RAW frame size\n");
196 } else {
197 const size_t kCorruptFrameThreshold = 256 * 1024 * 1024;
198 const size_t kFrameTooSmallThreshold = 256 * 1024;
199 frame_size = mem_get_le32(raw_hdr);
201 if (frame_size > kCorruptFrameThreshold) {
202 warn("Read invalid frame size (%u)\n", (unsigned int)frame_size);
203 frame_size = 0;
206 if (frame_size < kFrameTooSmallThreshold) {
207 warn("Warning: Read invalid frame size (%u) - not a raw file?\n",
208 (unsigned int)frame_size);
211 if (frame_size > *buffer_size) {
212 uint8_t *new_buf = realloc(*buffer, 2 * frame_size);
213 if (new_buf) {
214 *buffer = new_buf;
215 *buffer_size = 2 * frame_size;
216 } else {
217 warn("Failed to allocate compressed data buffer\n");
218 frame_size = 0;
223 if (!feof(infile)) {
224 if (fread(*buffer, 1, frame_size, infile) != frame_size) {
225 warn("Failed to read full frame\n");
226 return 1;
228 *bytes_read = frame_size;
231 return 0;
234 static int read_frame(struct AvxDecInputContext *input, uint8_t **buf,
235 size_t *bytes_in_buffer, size_t *buffer_size) {
236 switch (input->aom_input_ctx->file_type) {
237 #if CONFIG_WEBM_IO
238 case FILE_TYPE_WEBM:
239 return webm_read_frame(input->webm_ctx, buf, bytes_in_buffer);
240 #endif
241 case FILE_TYPE_RAW:
242 return raw_read_frame(input->aom_input_ctx->file, buf, bytes_in_buffer,
243 buffer_size);
244 case FILE_TYPE_IVF:
245 return ivf_read_frame(input->aom_input_ctx->file, buf, bytes_in_buffer,
246 buffer_size);
247 #if CONFIG_OBU_NO_IVF
248 case FILE_TYPE_OBU:
249 return obu_read_temporal_unit(input->aom_input_ctx->file, buf,
250 #if CONFIG_SCALABILITY
251 bytes_in_buffer, buffer_size, 0);
252 #else
253 bytes_in_buffer, buffer_size);
254 #endif
255 #endif
256 default: return 1;
260 static void update_image_md5(const aom_image_t *img, const int planes[3],
261 MD5Context *md5) {
262 int i, y;
264 for (i = 0; i < 3; ++i) {
265 const int plane = planes[i];
266 const unsigned char *buf = img->planes[plane];
267 const int stride = img->stride[plane];
268 const int w = aom_img_plane_width(img, plane) *
269 ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
270 const int h = aom_img_plane_height(img, plane);
272 for (y = 0; y < h; ++y) {
273 MD5Update(md5, buf, w);
274 buf += stride;
279 static void write_image_file(const aom_image_t *img, const int *planes,
280 const int num_planes, FILE *file) {
281 int i, y;
282 const int bytes_per_sample = ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
284 for (i = 0; i < num_planes; ++i) {
285 const int plane = planes[i];
286 const unsigned char *buf = img->planes[plane];
287 const int stride = img->stride[plane];
288 const int w = aom_img_plane_width(img, plane);
289 const int h = aom_img_plane_height(img, plane);
291 for (y = 0; y < h; ++y) {
292 fwrite(buf, bytes_per_sample, w, file);
293 buf += stride;
298 static int file_is_raw(struct AvxInputContext *input) {
299 uint8_t buf[32];
300 int is_raw = 0;
301 aom_codec_stream_info_t si;
303 if (fread(buf, 1, 32, input->file) == 32) {
304 int i;
306 if (mem_get_le32(buf) < 256 * 1024 * 1024) {
307 for (i = 0; i < get_aom_decoder_count(); ++i) {
308 const AvxInterface *const decoder = get_aom_decoder_by_index(i);
309 if (!aom_codec_peek_stream_info(decoder->codec_interface(), buf + 4,
310 32 - 4, &si)) {
311 is_raw = 1;
312 input->fourcc = decoder->fourcc;
313 input->width = si.w;
314 input->height = si.h;
315 input->framerate.numerator = 30;
316 input->framerate.denominator = 1;
317 break;
323 rewind(input->file);
324 return is_raw;
/* Prints a one-line progress report to stderr, terminated by '\r' so that
 * successive reports overwrite each other. |dx_time| is the accumulated
 * decode time in microseconds; the frame rate is reported as 0 when no time
 * has been accumulated yet. */
static void show_progress(int frame_in, int frame_out, uint64_t dx_time) {
  const double fps =
      dx_time ? (double)frame_out * 1000000.0 / (double)dx_time : 0.0;

  /* dx_time is unsigned, so it is printed with PRIu64. */
  fprintf(stderr,
          "%d decoded frames/%d showed frames in %" PRIu64 " us (%.2f fps)\r",
          frame_in, frame_out, dx_time, fps);
}
/* One application-owned frame buffer handed to the decoder. */
struct ExternalFrameBuffer {
  uint8_t *data; /* heap allocation, or NULL when not yet allocated */
  size_t size;   /* size of |data| in bytes */
  int in_use;    /* non-zero while the decoder holds the buffer */
};
/* Fixed-size pool of external frame buffers; passed to the frame buffer
 * callbacks as their private data. */
struct ExternalFrameBufferList {
  int num_external_frame_buffers;     /* number of entries in |ext_fb| */
  struct ExternalFrameBuffer *ext_fb; /* array of buffers */
};
345 // Callback used by libaom to request an external frame buffer. |cb_priv|
346 // Application private data passed into the set function. |min_size| is the
347 // minimum size in bytes needed to decode the next frame. |fb| pointer to the
348 // frame buffer.
349 static int get_av1_frame_buffer(void *cb_priv, size_t min_size,
350 aom_codec_frame_buffer_t *fb) {
351 int i;
352 struct ExternalFrameBufferList *const ext_fb_list =
353 (struct ExternalFrameBufferList *)cb_priv;
354 if (ext_fb_list == NULL) return -1;
356 // Find a free frame buffer.
357 for (i = 0; i < ext_fb_list->num_external_frame_buffers; ++i) {
358 if (!ext_fb_list->ext_fb[i].in_use) break;
361 if (i == ext_fb_list->num_external_frame_buffers) return -1;
363 if (ext_fb_list->ext_fb[i].size < min_size) {
364 free(ext_fb_list->ext_fb[i].data);
365 ext_fb_list->ext_fb[i].data = (uint8_t *)calloc(min_size, sizeof(uint8_t));
366 if (!ext_fb_list->ext_fb[i].data) return -1;
368 ext_fb_list->ext_fb[i].size = min_size;
371 fb->data = ext_fb_list->ext_fb[i].data;
372 fb->size = ext_fb_list->ext_fb[i].size;
373 ext_fb_list->ext_fb[i].in_use = 1;
375 // Set the frame buffer's private data to point at the external frame buffer.
376 fb->priv = &ext_fb_list->ext_fb[i];
377 return 0;
380 // Callback used by libaom when there are no references to the frame buffer.
381 // |cb_priv| user private data passed into the set function. |fb| pointer
382 // to the frame buffer.
383 static int release_av1_frame_buffer(void *cb_priv,
384 aom_codec_frame_buffer_t *fb) {
385 struct ExternalFrameBuffer *const ext_fb =
386 (struct ExternalFrameBuffer *)fb->priv;
387 (void)cb_priv;
388 ext_fb->in_use = 0;
389 return 0;
/* Expands the output file name |pattern| into |out| (capacity |q_len| bytes).
 *
 * Recognized escapes: %w (frame width |d_w|), %h (frame height |d_h|) and
 * %1..%9 (frame number |frame_in|, zero padded to that many digits). Any
 * other character after '%' is reported through die(), as is a result that
 * does not fit in |out|. All other text is copied verbatim. */
static void generate_filename(const char *pattern, char *out, size_t q_len,
                              unsigned int d_w, unsigned int d_h,
                              unsigned int frame_in) {
  const char *p = pattern;
  char *q = out;

  do {
    const char *next_pat = strchr(p, '%');

    if (p == next_pat) {
      int written = 0;
      size_t pat_len;

      /* parse the pattern */
      switch (p[1]) {
        case 'w': written = snprintf(q, q_len, "%u", d_w); break;
        case 'h': written = snprintf(q, q_len, "%u", d_h); break;
        case '1':
        case '2':
        case '3':
        case '4':
        case '5':
        case '6':
        case '7':
        case '8':
        case '9':
          /* The digit is the minimum field width, zero padded. */
          written = snprintf(q, q_len, "%0*u", p[1] - '0', frame_in);
          break;
        default: die("Unrecognized pattern %%%c\n", p[1]); break;
      }

      /* snprintf() reports the untruncated length, so this catches output
       * that would not fit; checking strlen() of the truncated result
       * cannot. */
      if (written < 0 || (size_t)written >= q_len - 1)
        die("Output filename too long.\n");
      pat_len = (size_t)written;
      q += pat_len;
      p += 2;
      q_len -= pat_len;
    } else {
      size_t copy_len;

      /* copy the next segment */
      if (!next_pat)
        copy_len = strlen(p);
      else
        copy_len = (size_t)(next_pat - p);

      if (copy_len >= q_len - 1) die("Output filename too long.\n");

      memcpy(q, p, copy_len);
      q[copy_len] = '\0';
      q += copy_len;
      p += copy_len;
      q_len -= copy_len;
    }
  } while (*p);
}
/* Returns 0 when |outfile_pattern| contains a frame-number escape (%1..%9),
 * meaning every frame gets its own file, and 1 otherwise. */
static int is_single_file(const char *outfile_pattern) {
  const char *p;

  for (p = strchr(outfile_pattern, '%'); p; p = strchr(p + 1, '%')) {
    if (p[1] >= '1' && p[1] <= '9')
      return 0;  // pattern contains sequence number, so it's not unique
  }

  return 1;
}
/* Prints the 16-byte |digest| as lowercase hex to stdout, followed by
 * |filename| and a newline. */
static void print_md5(unsigned char digest[16], const char *filename) {
  int i;

  for (i = 0; i < 16; ++i) printf("%02x", digest[i]);
  printf(" %s\n", filename);
}
/* Opens the output destination |name|. "-" selects stdout (switched to
 * binary mode); anything else is opened for binary writing, and a failure to
 * open is reported through fatal(). */
static FILE *open_outfile(const char *name) {
  if (strcmp("-", name) == 0) {
    set_binary_mode(stdout);
    return stdout;
  } else {
    FILE *file = fopen(name, "wb");
    if (!file) fatal("Failed to open output file '%s'", name);
    return file;
  }
}
477 static int img_shifted_realloc_required(const aom_image_t *img,
478 const aom_image_t *shifted,
479 aom_img_fmt_t required_fmt) {
480 return img->d_w != shifted->d_w || img->d_h != shifted->d_h ||
481 required_fmt != shifted->fmt;
484 static int main_loop(int argc, const char **argv_) {
485 aom_codec_ctx_t decoder;
486 char *fn = NULL;
487 int i;
488 int ret = EXIT_FAILURE;
489 uint8_t *buf = NULL;
490 size_t bytes_in_buffer = 0, buffer_size = 0;
491 FILE *infile;
492 int frame_in = 0, frame_out = 0, flipuv = 0, noblit = 0;
493 int do_md5 = 0, progress = 0;
494 int stop_after = 0, postproc = 0, summary = 0, quiet = 1;
495 int arg_skip = 0;
496 int keep_going = 0;
497 const AvxInterface *interface = NULL;
498 const AvxInterface *fourcc_interface = NULL;
499 uint64_t dx_time = 0;
500 struct arg arg;
501 char **argv, **argi, **argj;
503 int single_file;
504 int use_y4m = 1;
505 int opt_yv12 = 0;
506 int opt_i420 = 0;
507 int opt_raw = 0;
508 aom_codec_dec_cfg_t cfg = { 0, 0, 0, CONFIG_LOWBITDEPTH, { 1 } };
509 unsigned int output_bit_depth = 0;
510 unsigned int tile_mode = 0;
511 int tile_row = -1;
512 int tile_col = -1;
513 int frames_corrupted = 0;
514 int dec_flags = 0;
515 int do_scale = 0;
516 aom_image_t *scaled_img = NULL;
517 aom_image_t *img_shifted = NULL;
518 int frame_avail, got_data, flush_decoder = 0;
519 int num_external_frame_buffers = 0;
520 struct ExternalFrameBufferList ext_fb_list = { 0, NULL };
522 const char *outfile_pattern = NULL;
523 char outfile_name[PATH_MAX] = { 0 };
524 FILE *outfile = NULL;
526 FILE *framestats_file = NULL;
528 MD5Context md5_ctx;
529 unsigned char md5_digest[16];
531 struct AvxDecInputContext input = { NULL, NULL };
532 struct AvxInputContext aom_input_ctx;
533 #if CONFIG_WEBM_IO
534 struct WebmInputContext webm_ctx;
535 memset(&(webm_ctx), 0, sizeof(webm_ctx));
536 input.webm_ctx = &webm_ctx;
537 #endif
538 input.aom_input_ctx = &aom_input_ctx;
540 /* Parse command line */
541 exec_name = argv_[0];
542 argv = argv_dup(argc - 1, argv_ + 1);
544 for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
545 memset(&arg, 0, sizeof(arg));
546 arg.argv_step = 1;
548 if (arg_match(&arg, &help, argi)) {
549 show_help(stdout, 0);
550 exit(EXIT_SUCCESS);
551 } else if (arg_match(&arg, &codecarg, argi)) {
552 interface = get_aom_decoder_by_name(arg.val);
553 if (!interface)
554 die("Error: Unrecognized argument (%s) to --codec\n", arg.val);
555 } else if (arg_match(&arg, &looparg, argi)) {
556 // no-op
557 } else if (arg_match(&arg, &outputfile, argi)) {
558 outfile_pattern = arg.val;
559 } else if (arg_match(&arg, &use_yv12, argi)) {
560 use_y4m = 0;
561 flipuv = 1;
562 opt_yv12 = 1;
563 opt_i420 = 0;
564 opt_raw = 0;
565 } else if (arg_match(&arg, &use_i420, argi)) {
566 use_y4m = 0;
567 flipuv = 0;
568 opt_yv12 = 0;
569 opt_i420 = 1;
570 opt_raw = 0;
571 } else if (arg_match(&arg, &rawvideo, argi)) {
572 use_y4m = 0;
573 opt_yv12 = 0;
574 opt_i420 = 0;
575 opt_raw = 1;
576 } else if (arg_match(&arg, &flipuvarg, argi)) {
577 flipuv = 1;
578 } else if (arg_match(&arg, &noblitarg, argi)) {
579 noblit = 1;
580 } else if (arg_match(&arg, &progressarg, argi)) {
581 progress = 1;
582 } else if (arg_match(&arg, &limitarg, argi)) {
583 stop_after = arg_parse_uint(&arg);
584 } else if (arg_match(&arg, &skiparg, argi)) {
585 arg_skip = arg_parse_uint(&arg);
586 } else if (arg_match(&arg, &postprocarg, argi)) {
587 postproc = 1;
588 } else if (arg_match(&arg, &md5arg, argi)) {
589 do_md5 = 1;
590 } else if (arg_match(&arg, &framestatsarg, argi)) {
591 framestats_file = fopen(arg.val, "w");
592 if (!framestats_file) {
593 die("Error: Could not open --framestats file (%s) for writing.\n",
594 arg.val);
596 } else if (arg_match(&arg, &summaryarg, argi)) {
597 summary = 1;
598 } else if (arg_match(&arg, &threadsarg, argi)) {
599 cfg.threads = arg_parse_uint(&arg);
600 } else if (arg_match(&arg, &verbosearg, argi)) {
601 quiet = 0;
602 } else if (arg_match(&arg, &scalearg, argi)) {
603 do_scale = 1;
604 } else if (arg_match(&arg, &fb_arg, argi)) {
605 num_external_frame_buffers = arg_parse_uint(&arg);
606 } else if (arg_match(&arg, &continuearg, argi)) {
607 keep_going = 1;
608 } else if (arg_match(&arg, &outbitdeptharg, argi)) {
609 output_bit_depth = arg_parse_uint(&arg);
610 } else if (arg_match(&arg, &tilem, argi)) {
611 tile_mode = arg_parse_int(&arg);
612 } else if (arg_match(&arg, &tiler, argi)) {
613 tile_row = arg_parse_int(&arg);
614 } else if (arg_match(&arg, &tilec, argi)) {
615 tile_col = arg_parse_int(&arg);
616 } else {
617 argj++;
621 /* Check for unrecognized options */
622 for (argi = argv; *argi; argi++)
623 if (argi[0][0] == '-' && strlen(argi[0]) > 1)
624 die("Error: Unrecognized option %s\n", *argi);
626 /* Handle non-option arguments */
627 fn = argv[0];
629 if (!fn) {
630 free(argv);
631 fprintf(stderr, "No input file specified!\n");
632 usage_exit();
634 /* Open file */
635 infile = strcmp(fn, "-") ? fopen(fn, "rb") : set_binary_mode(stdin);
637 if (!infile) {
638 fatal("Failed to open input file '%s'", strcmp(fn, "-") ? fn : "stdin");
640 #if CONFIG_OS_SUPPORT
641 /* Make sure we don't dump to the terminal, unless forced to with -o - */
642 if (!outfile_pattern && isatty(STDOUT_FILENO) && !do_md5 && !noblit) {
643 fprintf(stderr,
644 "Not dumping raw video to your terminal. Use '-o -' to "
645 "override.\n");
646 return EXIT_FAILURE;
648 #endif
649 input.aom_input_ctx->filename = fn;
650 input.aom_input_ctx->file = infile;
651 if (file_is_ivf(input.aom_input_ctx))
652 input.aom_input_ctx->file_type = FILE_TYPE_IVF;
653 #if CONFIG_WEBM_IO
654 else if (file_is_webm(input.webm_ctx, input.aom_input_ctx))
655 input.aom_input_ctx->file_type = FILE_TYPE_WEBM;
656 #endif
657 #if CONFIG_OBU_NO_IVF
658 else if (file_is_obu(input.aom_input_ctx))
659 input.aom_input_ctx->file_type = FILE_TYPE_OBU;
660 #endif
661 else if (file_is_raw(input.aom_input_ctx))
662 input.aom_input_ctx->file_type = FILE_TYPE_RAW;
663 else {
664 fprintf(stderr, "Unrecognized input file type.\n");
665 #if !CONFIG_WEBM_IO
666 fprintf(stderr, "aomdec was built without WebM container support.\n");
667 #endif
668 return EXIT_FAILURE;
671 outfile_pattern = outfile_pattern ? outfile_pattern : "-";
672 single_file = is_single_file(outfile_pattern);
674 if (!noblit && single_file) {
675 generate_filename(outfile_pattern, outfile_name, PATH_MAX,
676 aom_input_ctx.width, aom_input_ctx.height, 0);
677 if (do_md5)
678 MD5Init(&md5_ctx);
679 else
680 outfile = open_outfile(outfile_name);
683 if (use_y4m && !noblit) {
684 if (!single_file) {
685 fprintf(stderr,
686 "YUV4MPEG2 not supported with output patterns,"
687 " try --i420 or --yv12 or --rawvideo.\n");
688 return EXIT_FAILURE;
691 #if CONFIG_WEBM_IO
692 if (aom_input_ctx.file_type == FILE_TYPE_WEBM) {
693 if (webm_guess_framerate(input.webm_ctx, input.aom_input_ctx)) {
694 fprintf(stderr,
695 "Failed to guess framerate -- error parsing "
696 "webm file?\n");
697 return EXIT_FAILURE;
700 #endif
703 fourcc_interface = get_aom_decoder_by_fourcc(aom_input_ctx.fourcc);
704 if (interface && fourcc_interface && interface != fourcc_interface)
705 warn("Header indicates codec: %s\n", fourcc_interface->name);
706 else
707 interface = fourcc_interface;
709 if (!interface) interface = get_aom_decoder_by_index(0);
711 dec_flags = (postproc ? AOM_CODEC_USE_POSTPROC : 0);
712 if (aom_codec_dec_init(&decoder, interface->codec_interface(), &cfg,
713 dec_flags)) {
714 fprintf(stderr, "Failed to initialize decoder: %s\n",
715 aom_codec_error(&decoder));
716 goto fail2;
719 if (!quiet) fprintf(stderr, "%s\n", decoder.name);
721 #if CONFIG_AV1_DECODER
722 if (aom_codec_control(&decoder, AV1_SET_TILE_MODE, tile_mode)) {
723 fprintf(stderr, "Failed to set decode_tile_mode: %s\n",
724 aom_codec_error(&decoder));
725 goto fail;
728 if (aom_codec_control(&decoder, AV1_SET_DECODE_TILE_ROW, tile_row)) {
729 fprintf(stderr, "Failed to set decode_tile_row: %s\n",
730 aom_codec_error(&decoder));
731 goto fail;
734 if (aom_codec_control(&decoder, AV1_SET_DECODE_TILE_COL, tile_col)) {
735 fprintf(stderr, "Failed to set decode_tile_col: %s\n",
736 aom_codec_error(&decoder));
737 goto fail;
739 #endif
741 if (arg_skip) fprintf(stderr, "Skipping first %d frames.\n", arg_skip);
742 while (arg_skip) {
743 if (read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) break;
744 arg_skip--;
747 if (num_external_frame_buffers > 0) {
748 ext_fb_list.num_external_frame_buffers = num_external_frame_buffers;
749 ext_fb_list.ext_fb = (struct ExternalFrameBuffer *)calloc(
750 num_external_frame_buffers, sizeof(*ext_fb_list.ext_fb));
751 if (aom_codec_set_frame_buffer_functions(&decoder, get_av1_frame_buffer,
752 release_av1_frame_buffer,
753 &ext_fb_list)) {
754 fprintf(stderr, "Failed to configure external frame buffers: %s\n",
755 aom_codec_error(&decoder));
756 goto fail;
760 frame_avail = 1;
761 got_data = 0;
763 if (framestats_file) fprintf(framestats_file, "bytes,qp\r\n");
765 /* Decode file */
766 while (frame_avail || got_data) {
767 aom_codec_iter_t iter = NULL;
768 aom_image_t *img;
769 struct aom_usec_timer timer;
770 int corrupted = 0;
772 frame_avail = 0;
773 if (!stop_after || frame_in < stop_after) {
774 if (!read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) {
775 frame_avail = 1;
776 frame_in++;
778 aom_usec_timer_start(&timer);
780 if (aom_codec_decode(&decoder, buf, (unsigned int)bytes_in_buffer,
781 NULL)) {
782 const char *detail = aom_codec_error_detail(&decoder);
783 warn("Failed to decode frame %d: %s", frame_in,
784 aom_codec_error(&decoder));
786 if (detail) warn("Additional information: %s", detail);
787 if (!keep_going) goto fail;
790 if (framestats_file) {
791 int qp;
792 if (aom_codec_control(&decoder, AOMD_GET_LAST_QUANTIZER, &qp)) {
793 warn("Failed AOMD_GET_LAST_QUANTIZER: %s",
794 aom_codec_error(&decoder));
795 if (!keep_going) goto fail;
797 fprintf(framestats_file, "%d,%d\r\n", (int)bytes_in_buffer, qp);
800 aom_usec_timer_mark(&timer);
801 dx_time += aom_usec_timer_elapsed(&timer);
802 } else {
803 flush_decoder = 1;
805 } else {
806 flush_decoder = 1;
809 aom_usec_timer_start(&timer);
811 if (flush_decoder) {
812 // Flush the decoder in frame parallel decode.
813 if (aom_codec_decode(&decoder, NULL, 0, NULL)) {
814 warn("Failed to flush decoder: %s", aom_codec_error(&decoder));
818 got_data = 0;
819 if ((img = aom_codec_get_frame(&decoder, &iter))) {
820 ++frame_out;
821 got_data = 1;
824 aom_usec_timer_mark(&timer);
825 dx_time += (unsigned int)aom_usec_timer_elapsed(&timer);
827 if (aom_codec_control(&decoder, AOMD_GET_FRAME_CORRUPTED, &corrupted)) {
828 warn("Failed AOM_GET_FRAME_CORRUPTED: %s", aom_codec_error(&decoder));
829 if (!keep_going) goto fail;
831 frames_corrupted += corrupted;
833 if (progress) show_progress(frame_in, frame_out, dx_time);
835 if (!noblit && img) {
836 const int PLANES_YUV[] = { AOM_PLANE_Y, AOM_PLANE_U, AOM_PLANE_V };
837 const int PLANES_YVU[] = { AOM_PLANE_Y, AOM_PLANE_V, AOM_PLANE_U };
838 const int *planes = flipuv ? PLANES_YVU : PLANES_YUV;
840 if (do_scale) {
841 if (frame_out == 1) {
842 // If the output frames are to be scaled to a fixed display size then
843 // use the width and height specified in the container. If either of
844 // these is set to 0, use the display size set in the first frame
845 // header. If that is unavailable, use the raw decoded size of the
846 // first decoded frame.
847 int render_width = aom_input_ctx.width;
848 int render_height = aom_input_ctx.height;
849 if (!render_width || !render_height) {
850 int render_size[2];
851 if (aom_codec_control(&decoder, AV1D_GET_DISPLAY_SIZE,
852 render_size)) {
853 // As last resort use size of first frame as display size.
854 render_width = img->d_w;
855 render_height = img->d_h;
856 } else {
857 render_width = render_size[0];
858 render_height = render_size[1];
861 scaled_img =
862 aom_img_alloc(NULL, img->fmt, render_width, render_height, 16);
863 scaled_img->bit_depth = img->bit_depth;
866 if (img->d_w != scaled_img->d_w || img->d_h != scaled_img->d_h) {
867 #if CONFIG_LIBYUV
868 libyuv_scale(img, scaled_img, kFilterBox);
869 img = scaled_img;
870 #else
871 fprintf(stderr,
872 "Failed to scale output frame: %s.\n"
873 "libyuv is required for scaling but is currently disabled.\n"
874 "Be sure to specify -DCONFIG_LIBYUV=1 when running cmake.\n",
875 aom_codec_error(&decoder));
876 goto fail;
877 #endif
880 // Default to codec bit depth if output bit depth not set
881 if (!output_bit_depth && single_file && !do_md5) {
882 output_bit_depth = img->bit_depth;
884 // Shift up or down if necessary
885 if (output_bit_depth != 0) {
886 const aom_img_fmt_t shifted_fmt =
887 output_bit_depth == 8
888 ? img->fmt ^ (img->fmt & AOM_IMG_FMT_HIGHBITDEPTH)
889 : img->fmt | AOM_IMG_FMT_HIGHBITDEPTH;
891 if (shifted_fmt != img->fmt || output_bit_depth != img->bit_depth) {
892 if (img_shifted &&
893 img_shifted_realloc_required(img, img_shifted, shifted_fmt)) {
894 aom_img_free(img_shifted);
895 img_shifted = NULL;
897 if (!img_shifted) {
898 img_shifted =
899 aom_img_alloc(NULL, shifted_fmt, img->d_w, img->d_h, 16);
900 img_shifted->bit_depth = output_bit_depth;
902 if (output_bit_depth > img->bit_depth) {
903 aom_img_upshift(img_shifted, img,
904 output_bit_depth - img->bit_depth);
905 } else {
906 aom_img_downshift(img_shifted, img,
907 img->bit_depth - output_bit_depth);
909 img = img_shifted;
913 aom_input_ctx.width = img->d_w;
914 aom_input_ctx.height = img->d_h;
916 #if CONFIG_MONO_VIDEO
917 int num_planes = (!use_y4m && opt_raw && img->monochrome) ? 1 : 3;
918 #else
919 int num_planes = 3;
920 (void)opt_raw;
921 #endif
923 if (single_file) {
924 if (use_y4m) {
925 char y4m_buf[Y4M_BUFFER_SIZE] = { 0 };
926 size_t len = 0;
927 if (img->fmt == AOM_IMG_FMT_I440 || img->fmt == AOM_IMG_FMT_I44016) {
928 fprintf(stderr, "Cannot produce y4m output for 440 sampling.\n");
929 goto fail;
931 if (frame_out == 1) {
932 // Y4M file header
933 len = y4m_write_file_header(
934 y4m_buf, sizeof(y4m_buf), aom_input_ctx.width,
935 aom_input_ctx.height, &aom_input_ctx.framerate, img->fmt,
936 img->bit_depth);
937 if (do_md5) {
938 MD5Update(&md5_ctx, (md5byte *)y4m_buf, (unsigned int)len);
939 } else {
940 fputs(y4m_buf, outfile);
944 // Y4M frame header
945 len = y4m_write_frame_header(y4m_buf, sizeof(y4m_buf));
946 if (do_md5) {
947 MD5Update(&md5_ctx, (md5byte *)y4m_buf, (unsigned int)len);
948 } else {
949 fputs(y4m_buf, outfile);
951 } else {
952 if (frame_out == 1) {
953 // Check if --yv12 or --i420 options are consistent with the
954 // bit-stream decoded
955 if (opt_i420) {
956 if (img->fmt != AOM_IMG_FMT_I420 &&
957 img->fmt != AOM_IMG_FMT_I42016) {
958 fprintf(stderr, "Cannot produce i420 output for bit-stream.\n");
959 goto fail;
962 if (opt_yv12) {
963 if ((img->fmt != AOM_IMG_FMT_I420 &&
964 img->fmt != AOM_IMG_FMT_YV12) ||
965 img->bit_depth != 8) {
966 fprintf(stderr, "Cannot produce yv12 output for bit-stream.\n");
967 goto fail;
973 if (do_md5) {
974 update_image_md5(img, planes, &md5_ctx);
975 } else {
976 write_image_file(img, planes, num_planes, outfile);
978 } else {
979 generate_filename(outfile_pattern, outfile_name, PATH_MAX, img->d_w,
980 img->d_h, frame_in);
981 if (do_md5) {
982 MD5Init(&md5_ctx);
983 update_image_md5(img, planes, &md5_ctx);
984 MD5Final(md5_digest, &md5_ctx);
985 print_md5(md5_digest, outfile_name);
986 } else {
987 outfile = open_outfile(outfile_name);
988 write_image_file(img, planes, num_planes, outfile);
989 fclose(outfile);
995 if (summary || progress) {
996 show_progress(frame_in, frame_out, dx_time);
997 fprintf(stderr, "\n");
1000 if (frames_corrupted) {
1001 fprintf(stderr, "WARNING: %d frames corrupted.\n", frames_corrupted);
1002 } else {
1003 ret = EXIT_SUCCESS;
1006 fail:
1008 if (aom_codec_destroy(&decoder)) {
1009 fprintf(stderr, "Failed to destroy decoder: %s\n",
1010 aom_codec_error(&decoder));
1013 fail2:
1015 if (!noblit && single_file) {
1016 if (do_md5) {
1017 MD5Final(md5_digest, &md5_ctx);
1018 print_md5(md5_digest, outfile_name);
1019 } else {
1020 fclose(outfile);
1024 #if CONFIG_WEBM_IO
1025 if (input.aom_input_ctx->file_type == FILE_TYPE_WEBM)
1026 webm_free(input.webm_ctx);
1027 #endif
1029 if (input.aom_input_ctx->file_type != FILE_TYPE_WEBM) free(buf);
1031 if (scaled_img) aom_img_free(scaled_img);
1032 if (img_shifted) aom_img_free(img_shifted);
1034 for (i = 0; i < ext_fb_list.num_external_frame_buffers; ++i) {
1035 free(ext_fb_list.ext_fb[i].data);
1037 free(ext_fb_list.ext_fb);
1039 fclose(infile);
1040 if (framestats_file) fclose(framestats_file);
1042 free(argv);
1044 return ret;
1047 int main(int argc, const char **argv_) {
1048 unsigned int loops = 1, i;
1049 char **argv, **argi, **argj;
1050 struct arg arg;
1051 int error = 0;
1053 argv = argv_dup(argc - 1, argv_ + 1);
1054 for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
1055 memset(&arg, 0, sizeof(arg));
1056 arg.argv_step = 1;
1058 if (arg_match(&arg, &looparg, argi)) {
1059 loops = arg_parse_uint(&arg);
1060 break;
1063 free(argv);
1064 for (i = 0; !error && i < loops; i++) error = main_loop(argc, argv_);
1065 return error;