AOMedia AV1 Codec
inspect
1/*
2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12// Inspect Decoder
13// ================
14//
15// This is a simple decoder loop that writes JSON stats to stdout. This tool
16// can also be compiled with Emscripten and used as a library.
17
18#include <stdio.h>
19#include <stdlib.h>
20#include <string.h>
21
22#ifdef __EMSCRIPTEN__
23#include <emscripten.h>
24#else
25#define EMSCRIPTEN_KEEPALIVE
26#endif
27
28#include "config/aom_config.h"
29
30#include "aom/aom_decoder.h"
31#include "aom/aomdx.h"
32#include "av1/common/av1_common_int.h"
33
34#if CONFIG_ACCOUNTING
35#include "av1/decoder/accounting.h"
36#endif
37
38#include "av1/decoder/inspection.h"
39#include "common/args.h"
40#include "common/tools_common.h"
41#include "common/video_common.h"
42#include "common/video_reader.h"
43
44// Max JSON buffer size.
45const int MAX_BUFFER = 1024 * 1024 * 256;
46
47typedef enum {
48 ACCOUNTING_LAYER = 1,
49 BLOCK_SIZE_LAYER = 1 << 1,
50 TRANSFORM_SIZE_LAYER = 1 << 2,
51 TRANSFORM_TYPE_LAYER = 1 << 3,
52 MODE_LAYER = 1 << 4,
53 SKIP_LAYER = 1 << 5,
54 FILTER_LAYER = 1 << 6,
55 CDEF_LAYER = 1 << 7,
56 REFERENCE_FRAME_LAYER = 1 << 8,
57 MOTION_VECTORS_LAYER = 1 << 9,
58 UV_MODE_LAYER = 1 << 10,
59 CFL_LAYER = 1 << 11,
60 DUAL_FILTER_LAYER = 1 << 12,
61 Q_INDEX_LAYER = 1 << 13,
62 SEGMENT_ID_LAYER = 1 << 14,
63 MOTION_MODE_LAYER = 1 << 15,
64 COMPOUND_TYPE_LAYER = 1 << 16,
65 INTRABC_LAYER = 1 << 17,
66 PALETTE_LAYER = 1 << 18,
67 UV_PALETTE_LAYER = 1 << 19,
68 ALL_LAYERS = (1 << 20) - 1
69} LayerType;
70
71static LayerType layers = 0;
72
73static int stop_after = 0;
74static int compress = 0;
75
76static const arg_def_t limit_arg =
77 ARG_DEF(NULL, "limit", 1, "Stop decoding after n frames");
78static const arg_def_t dump_all_arg = ARG_DEF("A", "all", 0, "Dump All");
79static const arg_def_t compress_arg =
80 ARG_DEF("x", "compress", 0, "Compress JSON using RLE");
81static const arg_def_t dump_accounting_arg =
82 ARG_DEF("a", "accounting", 0, "Dump Accounting");
83static const arg_def_t dump_block_size_arg =
84 ARG_DEF("bs", "blockSize", 0, "Dump Block Size");
85static const arg_def_t dump_motion_vectors_arg =
86 ARG_DEF("mv", "motionVectors", 0, "Dump Motion Vectors");
87static const arg_def_t dump_transform_size_arg =
88 ARG_DEF("ts", "transformSize", 0, "Dump Transform Size");
89static const arg_def_t dump_transform_type_arg =
90 ARG_DEF("tt", "transformType", 0, "Dump Transform Type");
91static const arg_def_t dump_mode_arg = ARG_DEF("m", "mode", 0, "Dump Mode");
92static const arg_def_t dump_motion_mode_arg =
93 ARG_DEF("mm", "motion_mode", 0, "Dump Motion Modes");
94static const arg_def_t dump_compound_type_arg =
95 ARG_DEF("ct", "compound_type", 0, "Dump Compound Types");
96static const arg_def_t dump_uv_mode_arg =
97 ARG_DEF("uvm", "uv_mode", 0, "Dump UV Intra Prediction Modes");
98static const arg_def_t dump_skip_arg = ARG_DEF("s", "skip", 0, "Dump Skip");
99static const arg_def_t dump_filter_arg =
100 ARG_DEF("f", "filter", 0, "Dump Filter");
101static const arg_def_t dump_cdef_arg = ARG_DEF("c", "cdef", 0, "Dump CDEF");
102static const arg_def_t dump_cfl_arg =
103 ARG_DEF("cfl", "chroma_from_luma", 0, "Dump Chroma from Luma Alphas");
104static const arg_def_t dump_dual_filter_type_arg =
105 ARG_DEF("df", "dualFilterType", 0, "Dump Dual Filter Type");
106static const arg_def_t dump_reference_frame_arg =
107 ARG_DEF("r", "referenceFrame", 0, "Dump Reference Frame");
108static const arg_def_t dump_delta_q_arg =
109 ARG_DEF("dq", "delta_q", 0, "Dump QIndex");
110static const arg_def_t dump_seg_id_arg =
111 ARG_DEF("si", "seg_id", 0, "Dump Segment ID");
112static const arg_def_t dump_intrabc_arg =
113 ARG_DEF("ibc", "intrabc", 0, "Dump If IntraBC Is Used");
114static const arg_def_t dump_palette_arg =
115 ARG_DEF("plt", "palette", 0, "Dump Palette Size");
116static const arg_def_t dump_uv_palette_arg =
117 ARG_DEF("uvp", "uv_palette", 0, "Dump UV Palette Size");
118static const arg_def_t usage_arg = ARG_DEF("h", "help", 0, "Help");
119static const arg_def_t skip_non_transform_arg = ARG_DEF(
120 "snt", "skip_non_transform", 1, "Skip is counted as a non transform.");
121static const arg_def_t combined_arg =
122 ARG_DEF("comb", "combined", 1, "combinining parameters into one output.");
123
124int combined_parm_list[15];
125int combined_parm_count = 0;
126
127static const arg_def_t *main_args[] = { &limit_arg,
128 &dump_all_arg,
129 &compress_arg,
130#if CONFIG_ACCOUNTING
131 &dump_accounting_arg,
132#endif
133 &dump_block_size_arg,
134 &dump_transform_size_arg,
135 &dump_transform_type_arg,
136 &dump_mode_arg,
137 &dump_uv_mode_arg,
138 &dump_motion_mode_arg,
139 &dump_compound_type_arg,
140 &dump_skip_arg,
141 &dump_filter_arg,
142 &dump_cdef_arg,
143 &dump_dual_filter_type_arg,
144 &dump_cfl_arg,
145 &dump_reference_frame_arg,
146 &dump_motion_vectors_arg,
147 &dump_delta_q_arg,
148 &dump_seg_id_arg,
149 &dump_intrabc_arg,
150 &dump_palette_arg,
151 &dump_uv_palette_arg,
152 &usage_arg,
153 &skip_non_transform_arg,
154 &combined_arg,
155 NULL };
156#define ENUM(name) \
157 { #name, name }
158#define LAST_ENUM \
159 { NULL, 0 }
160typedef struct map_entry {
161 const char *name;
162 int value;
163} map_entry;
164
165const map_entry refs_map[] = {
166 ENUM(INTRA_FRAME), ENUM(LAST_FRAME), ENUM(LAST2_FRAME),
167 ENUM(LAST3_FRAME), ENUM(GOLDEN_FRAME), ENUM(BWDREF_FRAME),
168 ENUM(ALTREF2_FRAME), ENUM(ALTREF_FRAME), LAST_ENUM
169};
170
171const map_entry block_size_map[] = {
172 ENUM(BLOCK_4X4), ENUM(BLOCK_4X8), ENUM(BLOCK_8X4),
173 ENUM(BLOCK_8X8), ENUM(BLOCK_8X16), ENUM(BLOCK_16X8),
174 ENUM(BLOCK_16X16), ENUM(BLOCK_16X32), ENUM(BLOCK_32X16),
175 ENUM(BLOCK_32X32), ENUM(BLOCK_32X64), ENUM(BLOCK_64X32),
176 ENUM(BLOCK_64X64), ENUM(BLOCK_64X128), ENUM(BLOCK_128X64),
177 ENUM(BLOCK_128X128), ENUM(BLOCK_4X16), ENUM(BLOCK_16X4),
178 ENUM(BLOCK_8X32), ENUM(BLOCK_32X8), ENUM(BLOCK_16X64),
179 ENUM(BLOCK_64X16), LAST_ENUM
180};
181
182#define TX_SKIP -1
183
184const map_entry tx_size_map[] = {
185 ENUM(TX_4X4), ENUM(TX_8X8), ENUM(TX_16X16), ENUM(TX_32X32),
186 ENUM(TX_64X64), ENUM(TX_4X8), ENUM(TX_8X4), ENUM(TX_8X16),
187 ENUM(TX_16X8), ENUM(TX_16X32), ENUM(TX_32X16), ENUM(TX_32X64),
188 ENUM(TX_64X32), ENUM(TX_4X16), ENUM(TX_16X4), ENUM(TX_8X32),
189 ENUM(TX_32X8), ENUM(TX_16X64), ENUM(TX_64X16), LAST_ENUM
190};
191
192const map_entry tx_type_map[] = { ENUM(DCT_DCT),
193 ENUM(ADST_DCT),
194 ENUM(DCT_ADST),
195 ENUM(ADST_ADST),
196 ENUM(FLIPADST_DCT),
197 ENUM(DCT_FLIPADST),
198 ENUM(FLIPADST_FLIPADST),
199 ENUM(ADST_FLIPADST),
200 ENUM(FLIPADST_ADST),
201 ENUM(IDTX),
202 ENUM(V_DCT),
203 ENUM(H_DCT),
204 ENUM(V_ADST),
205 ENUM(H_ADST),
206 ENUM(V_FLIPADST),
207 ENUM(H_FLIPADST),
208 LAST_ENUM };
209const map_entry dual_filter_map[] = { ENUM(REG_REG), ENUM(REG_SMOOTH),
210 ENUM(REG_SHARP), ENUM(SMOOTH_REG),
211 ENUM(SMOOTH_SMOOTH), ENUM(SMOOTH_SHARP),
212 ENUM(SHARP_REG), ENUM(SHARP_SMOOTH),
213 ENUM(SHARP_SHARP), LAST_ENUM };
214
215const map_entry prediction_mode_map[] = {
216 ENUM(DC_PRED), ENUM(V_PRED), ENUM(H_PRED),
217 ENUM(D45_PRED), ENUM(D135_PRED), ENUM(D113_PRED),
218 ENUM(D157_PRED), ENUM(D203_PRED), ENUM(D67_PRED),
219 ENUM(SMOOTH_PRED), ENUM(SMOOTH_V_PRED), ENUM(SMOOTH_H_PRED),
220 ENUM(PAETH_PRED), ENUM(NEARESTMV), ENUM(NEARMV),
221 ENUM(GLOBALMV), ENUM(NEWMV), ENUM(NEAREST_NEARESTMV),
222 ENUM(NEAR_NEARMV), ENUM(NEAREST_NEWMV), ENUM(NEW_NEARESTMV),
223 ENUM(NEAR_NEWMV), ENUM(NEW_NEARMV), ENUM(GLOBAL_GLOBALMV),
224 ENUM(NEW_NEWMV), ENUM(INTRA_INVALID), LAST_ENUM
225};
226
227const map_entry motion_mode_map[] = { ENUM(SIMPLE_TRANSLATION),
228 ENUM(OBMC_CAUSAL), // 2-sided OBMC
229 ENUM(WARPED_CAUSAL), // 2-sided WARPED
230 LAST_ENUM };
231
232const map_entry compound_type_map[] = { ENUM(COMPOUND_AVERAGE),
233 ENUM(COMPOUND_WEDGE),
234 ENUM(COMPOUND_DIFFWTD), LAST_ENUM };
235
236const map_entry uv_prediction_mode_map[] = {
237 ENUM(UV_DC_PRED), ENUM(UV_V_PRED),
238 ENUM(UV_H_PRED), ENUM(UV_D45_PRED),
239 ENUM(UV_D135_PRED), ENUM(UV_D113_PRED),
240 ENUM(UV_D157_PRED), ENUM(UV_D203_PRED),
241 ENUM(UV_D67_PRED), ENUM(UV_SMOOTH_PRED),
242 ENUM(UV_SMOOTH_V_PRED), ENUM(UV_SMOOTH_H_PRED),
243 ENUM(UV_PAETH_PRED), ENUM(UV_CFL_PRED),
244 ENUM(UV_MODE_INVALID), LAST_ENUM
245};
246#define NO_SKIP 0
247#define SKIP 1
248
249const map_entry skip_map[] = { ENUM(SKIP), ENUM(NO_SKIP), LAST_ENUM };
250
251const map_entry intrabc_map[] = { { "INTRABC", 1 },
252 { "NO_INTRABC", 0 },
253 LAST_ENUM };
254
255const map_entry palette_map[] = {
256 { "ZERO_COLORS", 0 }, { "TWO_COLORS", 2 }, { "THREE_COLORS", 3 },
257 { "FOUR_COLORS", 4 }, { "FIVE_COLORS", 5 }, { "SIX_COLORS", 6 },
258 { "SEVEN_COLORS", 7 }, { "EIGHT_COLORS", 8 }, LAST_ENUM
259};
260
261const map_entry config_map[] = { ENUM(MI_SIZE), LAST_ENUM };
262
263static const char *exec_name;
264
265struct parm_offset {
266 char parm[60];
267 char offset;
268};
269struct parm_offset parm_offsets[] = {
270 { "blockSize", offsetof(insp_mi_data, bsize) },
271 { "transformSize", offsetof(insp_mi_data, tx_size) },
272 { "transformType", offsetof(insp_mi_data, tx_type) },
273 { "dualFilterType", offsetof(insp_mi_data, dual_filter_type) },
274 { "mode", offsetof(insp_mi_data, mode) },
275 { "uv_mode", offsetof(insp_mi_data, uv_mode) },
276 { "motion_mode", offsetof(insp_mi_data, motion_mode) },
277 { "compound_type", offsetof(insp_mi_data, compound_type) },
278 { "referenceFrame", offsetof(insp_mi_data, ref_frame) },
279 { "skip", offsetof(insp_mi_data, skip) },
280};
281int parm_count = sizeof(parm_offsets) / sizeof(parm_offsets[0]);
282
283int convert_to_indices(char *str, int *indices, int maxCount, int *count) {
284 *count = 0;
285 do {
286 char *comma = strchr(str, ',');
287 int length = (comma ? (int)(comma - str) : (int)strlen(str));
288 int i;
289 for (i = 0; i < parm_count; ++i) {
290 if (!strncmp(str, parm_offsets[i].parm, length)) {
291 break;
292 }
293 }
294 if (i == parm_count) return 0;
295 indices[(*count)++] = i;
296 if (*count > maxCount) return 0;
297 str += length + 1;
298 } while (strlen(str) > 0);
299 return 1;
300}
301
302insp_frame_data frame_data;
303int frame_count = 0;
304int decoded_frame_count = 0;
305aom_codec_ctx_t codec;
306AvxVideoReader *reader = NULL;
307const AvxVideoInfo *info = NULL;
308aom_image_t *img = NULL;
309
310void on_frame_decoded_dump(char *json) {
311#ifdef __EMSCRIPTEN__
312 EM_ASM_({ Module.on_frame_decoded_json($0); }, json);
313#else
314 printf("%s", json);
315#endif
316}
317
318// Writing out the JSON buffer using snprintf is very slow, especially when
319// compiled with emscripten, these functions speed things up quite a bit.
320int put_str(char *buffer, const char *str) {
321 int i;
322 for (i = 0; str[i] != '\0'; i++) {
323 buffer[i] = str[i];
324 }
325 return i;
326}
327
328int put_str_with_escape(char *buffer, const char *str) {
329 int i;
330 int j = 0;
331 for (i = 0; str[i] != '\0'; i++) {
332 if (str[i] < ' ') {
333 continue;
334 } else if (str[i] == '"' || str[i] == '\\') {
335 buffer[j++] = '\\';
336 }
337 buffer[j++] = str[i];
338 }
339 return j;
340}
341
342int put_num(char *buffer, char prefix, int num, char suffix) {
343 int i = 0;
344 char *buf = buffer;
345 int is_neg = 0;
346 if (prefix) {
347 buf[i++] = prefix;
348 }
349 if (num == 0) {
350 buf[i++] = '0';
351 } else {
352 if (num < 0) {
353 num = -num;
354 is_neg = 1;
355 }
356 int s = i;
357 while (num != 0) {
358 buf[i++] = '0' + (num % 10);
359 num = num / 10;
360 }
361 if (is_neg) {
362 buf[i++] = '-';
363 }
364 int e = i - 1;
365 while (s < e) {
366 int t = buf[s];
367 buf[s] = buf[e];
368 buf[e] = t;
369 s++;
370 e--;
371 }
372 }
373 if (suffix) {
374 buf[i++] = suffix;
375 }
376 return i;
377}
378
379int put_map(char *buffer, const map_entry *map) {
380 char *buf = buffer;
381 const map_entry *entry = map;
382 while (entry->name != NULL) {
383 *(buf++) = '"';
384 buf += put_str(buf, entry->name);
385 *(buf++) = '"';
386 buf += put_num(buf, ':', entry->value, 0);
387 entry++;
388 if (entry->name != NULL) {
389 *(buf++) = ',';
390 }
391 }
392 return (int)(buf - buffer);
393}
394
395int put_reference_frame(char *buffer) {
396 const int mi_rows = frame_data.mi_rows;
397 const int mi_cols = frame_data.mi_cols;
398 char *buf = buffer;
399 int r, c, t;
400 buf += put_str(buf, " \"referenceFrameMap\": {");
401 buf += put_map(buf, refs_map);
402 buf += put_str(buf, "},\n");
403 buf += put_str(buf, " \"referenceFrame\": [");
404 for (r = 0; r < mi_rows; ++r) {
405 *(buf++) = '[';
406 for (c = 0; c < mi_cols; ++c) {
407 insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
408 buf += put_num(buf, '[', mi->ref_frame[0], 0);
409 buf += put_num(buf, ',', mi->ref_frame[1], ']');
410 if (compress) { // RLE
411 for (t = c + 1; t < mi_cols; ++t) {
412 insp_mi_data *next_mi = &frame_data.mi_grid[r * mi_cols + t];
413 if (mi->ref_frame[0] != next_mi->ref_frame[0] ||
414 mi->ref_frame[1] != next_mi->ref_frame[1]) {
415 break;
416 }
417 }
418 if (t - c > 1) {
419 *(buf++) = ',';
420 buf += put_num(buf, '[', t - c - 1, ']');
421 c = t - 1;
422 }
423 }
424 if (c < mi_cols - 1) *(buf++) = ',';
425 }
426 *(buf++) = ']';
427 if (r < mi_rows - 1) *(buf++) = ',';
428 }
429 buf += put_str(buf, "],\n");
430 return (int)(buf - buffer);
431}
432
433int put_motion_vectors(char *buffer) {
434 const int mi_rows = frame_data.mi_rows;
435 const int mi_cols = frame_data.mi_cols;
436 char *buf = buffer;
437 int r, c, t;
438 buf += put_str(buf, " \"motionVectors\": [");
439 for (r = 0; r < mi_rows; ++r) {
440 *(buf++) = '[';
441 for (c = 0; c < mi_cols; ++c) {
442 insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
443 buf += put_num(buf, '[', mi->mv[0].col, 0);
444 buf += put_num(buf, ',', mi->mv[0].row, 0);
445 buf += put_num(buf, ',', mi->mv[1].col, 0);
446 buf += put_num(buf, ',', mi->mv[1].row, ']');
447 if (compress) { // RLE
448 for (t = c + 1; t < mi_cols; ++t) {
449 insp_mi_data *next_mi = &frame_data.mi_grid[r * mi_cols + t];
450 if (mi->mv[0].col != next_mi->mv[0].col ||
451 mi->mv[0].row != next_mi->mv[0].row ||
452 mi->mv[1].col != next_mi->mv[1].col ||
453 mi->mv[1].row != next_mi->mv[1].row) {
454 break;
455 }
456 }
457 if (t - c > 1) {
458 *(buf++) = ',';
459 buf += put_num(buf, '[', t - c - 1, ']');
460 c = t - 1;
461 }
462 }
463 if (c < mi_cols - 1) *(buf++) = ',';
464 }
465 *(buf++) = ']';
466 if (r < mi_rows - 1) *(buf++) = ',';
467 }
468 buf += put_str(buf, "],\n");
469 return (int)(buf - buffer);
470}
471
472int put_combined(char *buffer) {
473 const int mi_rows = frame_data.mi_rows;
474 const int mi_cols = frame_data.mi_cols;
475 char *buf = buffer;
476 int r, c, p;
477 buf += put_str(buf, " \"");
478 for (p = 0; p < combined_parm_count; ++p) {
479 if (p) buf += put_str(buf, "&");
480 buf += put_str(buf, parm_offsets[combined_parm_list[p]].parm);
481 }
482 buf += put_str(buf, "\": [");
483 for (r = 0; r < mi_rows; ++r) {
484 *(buf++) = '[';
485 for (c = 0; c < mi_cols; ++c) {
486 insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
487 *(buf++) = '[';
488 for (p = 0; p < combined_parm_count; ++p) {
489 if (p) *(buf++) = ',';
490 int16_t *v = (int16_t *)(((int8_t *)mi) +
491 parm_offsets[combined_parm_list[p]].offset);
492 buf += put_num(buf, 0, v[0], 0);
493 }
494 *(buf++) = ']';
495 if (c < mi_cols - 1) *(buf++) = ',';
496 }
497 *(buf++) = ']';
498 if (r < mi_rows - 1) *(buf++) = ',';
499 }
500 buf += put_str(buf, "],\n");
501 return (int)(buf - buffer);
502}
503
504int put_block_info(char *buffer, const map_entry *map, const char *name,
505 size_t offset, int len) {
506 const int mi_rows = frame_data.mi_rows;
507 const int mi_cols = frame_data.mi_cols;
508 char *buf = buffer;
509 int r, c, t, i;
510 if (compress && len == 1) {
511 die("Can't encode scalars as arrays when RLE compression is enabled.");
512 }
513 if (map) {
514 buf += snprintf(buf, MAX_BUFFER, " \"%sMap\": {", name);
515 buf += put_map(buf, map);
516 buf += put_str(buf, "},\n");
517 }
518 buf += snprintf(buf, MAX_BUFFER, " \"%s\": [", name);
519 for (r = 0; r < mi_rows; ++r) {
520 *(buf++) = '[';
521 for (c = 0; c < mi_cols; ++c) {
522 insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
523 int16_t *v = (int16_t *)(((int8_t *)mi) + offset);
524 if (len == 0) {
525 buf += put_num(buf, 0, v[0], 0);
526 } else {
527 buf += put_str(buf, "[");
528 for (i = 0; i < len; i++) {
529 buf += put_num(buf, 0, v[i], 0);
530 if (i < len - 1) {
531 buf += put_str(buf, ",");
532 }
533 }
534 buf += put_str(buf, "]");
535 }
536 if (compress) { // RLE
537 for (t = c + 1; t < mi_cols; ++t) {
538 insp_mi_data *next_mi = &frame_data.mi_grid[r * mi_cols + t];
539 int16_t *nv = (int16_t *)(((int8_t *)next_mi) + offset);
540 int same = 0;
541 if (len == 0) {
542 same = v[0] == nv[0];
543 } else {
544 for (i = 0; i < len; i++) {
545 same = v[i] == nv[i];
546 if (!same) {
547 break;
548 }
549 }
550 }
551 if (!same) {
552 break;
553 }
554 }
555 if (t - c > 1) {
556 *(buf++) = ',';
557 buf += put_num(buf, '[', t - c - 1, ']');
558 c = t - 1;
559 }
560 }
561 if (c < mi_cols - 1) *(buf++) = ',';
562 }
563 *(buf++) = ']';
564 if (r < mi_rows - 1) *(buf++) = ',';
565 }
566 buf += put_str(buf, "],\n");
567 return (int)(buf - buffer);
568}
569
570#if CONFIG_ACCOUNTING
571int put_accounting(char *buffer) {
572 char *buf = buffer;
573 int i;
574 const Accounting *accounting = frame_data.accounting;
575 if (accounting == NULL) {
576 printf("XXX\n");
577 return 0;
578 }
579 const int num_syms = accounting->syms.num_syms;
580 const int num_strs = accounting->syms.dictionary.num_strs;
581 buf += put_str(buf, " \"symbolsMap\": [");
582 for (i = 0; i < num_strs; i++) {
583 buf += snprintf(buf, MAX_BUFFER, "\"%s\"",
584 accounting->syms.dictionary.strs[i]);
585 if (i < num_strs - 1) *(buf++) = ',';
586 }
587 buf += put_str(buf, "],\n");
588 buf += put_str(buf, " \"symbols\": [\n ");
589 AccountingSymbolContext context;
590 context.x = -2;
591 context.y = -2;
592 AccountingSymbol *sym;
593 for (i = 0; i < num_syms; i++) {
594 sym = &accounting->syms.syms[i];
595 if (memcmp(&context, &sym->context, sizeof(AccountingSymbolContext)) != 0) {
596 buf += put_num(buf, '[', sym->context.x, 0);
597 buf += put_num(buf, ',', sym->context.y, ']');
598 } else {
599 buf += put_num(buf, '[', sym->id, 0);
600 buf += put_num(buf, ',', sym->bits, 0);
601 buf += put_num(buf, ',', sym->samples, ']');
602 }
603 context = sym->context;
604 if (i < num_syms - 1) *(buf++) = ',';
605 }
606 buf += put_str(buf, "],\n");
607 return (int)(buf - buffer);
608}
609#endif
610
611int skip_non_transform = 0;
612
613void inspect(void *pbi, void *data) {
614 /* Fetch frame data. */
615 ifd_inspect(&frame_data, pbi, skip_non_transform);
616
617 // Show existing frames just show a reference buffer we've already decoded.
618 // There's no information to show.
619 if (frame_data.show_existing_frame) return;
620
621 (void)data;
622 // We allocate enough space and hope we don't write out of bounds. Totally
623 // unsafe but this speeds things up, especially when compiled to Javascript.
624 char *buffer = aom_malloc(MAX_BUFFER);
625 if (!buffer) {
626 fprintf(stderr, "Error allocating inspect info buffer\n");
627 abort();
628 }
629 char *buf = buffer;
630 buf += put_str(buf, "{\n");
631 if (layers & BLOCK_SIZE_LAYER) {
632 buf += put_block_info(buf, block_size_map, "blockSize",
633 offsetof(insp_mi_data, bsize), 0);
634 }
635 if (layers & TRANSFORM_SIZE_LAYER) {
636 buf += put_block_info(buf, tx_size_map, "transformSize",
637 offsetof(insp_mi_data, tx_size), 0);
638 }
639 if (layers & TRANSFORM_TYPE_LAYER) {
640 buf += put_block_info(buf, tx_type_map, "transformType",
641 offsetof(insp_mi_data, tx_type), 0);
642 }
643 if (layers & DUAL_FILTER_LAYER) {
644 buf += put_block_info(buf, dual_filter_map, "dualFilterType",
645 offsetof(insp_mi_data, dual_filter_type), 0);
646 }
647 if (layers & MODE_LAYER) {
648 buf += put_block_info(buf, prediction_mode_map, "mode",
649 offsetof(insp_mi_data, mode), 0);
650 }
651 if (layers & UV_MODE_LAYER) {
652 buf += put_block_info(buf, uv_prediction_mode_map, "uv_mode",
653 offsetof(insp_mi_data, uv_mode), 0);
654 }
655 if (layers & MOTION_MODE_LAYER) {
656 buf += put_block_info(buf, motion_mode_map, "motion_mode",
657 offsetof(insp_mi_data, motion_mode), 0);
658 }
659 if (layers & COMPOUND_TYPE_LAYER) {
660 buf += put_block_info(buf, compound_type_map, "compound_type",
661 offsetof(insp_mi_data, compound_type), 0);
662 }
663 if (layers & SKIP_LAYER) {
664 buf +=
665 put_block_info(buf, skip_map, "skip", offsetof(insp_mi_data, skip), 0);
666 }
667 if (layers & FILTER_LAYER) {
668 buf +=
669 put_block_info(buf, NULL, "filter", offsetof(insp_mi_data, filter), 2);
670 }
671 if (layers & CDEF_LAYER) {
672 buf += put_block_info(buf, NULL, "cdef_level",
673 offsetof(insp_mi_data, cdef_level), 0);
674 buf += put_block_info(buf, NULL, "cdef_strength",
675 offsetof(insp_mi_data, cdef_strength), 0);
676 }
677 if (layers & CFL_LAYER) {
678 buf += put_block_info(buf, NULL, "cfl_alpha_idx",
679 offsetof(insp_mi_data, cfl_alpha_idx), 0);
680 buf += put_block_info(buf, NULL, "cfl_alpha_sign",
681 offsetof(insp_mi_data, cfl_alpha_sign), 0);
682 }
683 if (layers & Q_INDEX_LAYER) {
684 buf += put_block_info(buf, NULL, "delta_q",
685 offsetof(insp_mi_data, current_qindex), 0);
686 }
687 if (layers & SEGMENT_ID_LAYER) {
688 buf += put_block_info(buf, NULL, "seg_id",
689 offsetof(insp_mi_data, segment_id), 0);
690 }
691 if (layers & MOTION_VECTORS_LAYER) {
692 buf += put_motion_vectors(buf);
693 }
694 if (layers & INTRABC_LAYER) {
695 buf += put_block_info(buf, intrabc_map, "intrabc",
696 offsetof(insp_mi_data, intrabc), 0);
697 }
698 if (layers & PALETTE_LAYER) {
699 buf += put_block_info(buf, palette_map, "palette",
700 offsetof(insp_mi_data, palette), 0);
701 }
702 if (layers & UV_PALETTE_LAYER) {
703 buf += put_block_info(buf, palette_map, "uv_palette",
704 offsetof(insp_mi_data, uv_palette), 0);
705 }
706 if (combined_parm_count > 0) buf += put_combined(buf);
707 if (layers & REFERENCE_FRAME_LAYER) {
708 buf += put_block_info(buf, refs_map, "referenceFrame",
709 offsetof(insp_mi_data, ref_frame), 2);
710 }
711#if CONFIG_ACCOUNTING
712 if (layers & ACCOUNTING_LAYER) {
713 buf += put_accounting(buf);
714 }
715#endif
716 buf +=
717 snprintf(buf, MAX_BUFFER, " \"frame\": %d,\n", frame_data.frame_number);
718 buf += snprintf(buf, MAX_BUFFER, " \"showFrame\": %d,\n",
719 frame_data.show_frame);
720 buf += snprintf(buf, MAX_BUFFER, " \"frameType\": %d,\n",
721 frame_data.frame_type);
722 buf += snprintf(buf, MAX_BUFFER, " \"baseQIndex\": %d,\n",
723 frame_data.base_qindex);
724 buf += snprintf(buf, MAX_BUFFER, " \"tileCols\": %d,\n",
725 frame_data.tile_mi_cols);
726 buf += snprintf(buf, MAX_BUFFER, " \"tileRows\": %d,\n",
727 frame_data.tile_mi_rows);
728 buf += snprintf(buf, MAX_BUFFER, " \"deltaQPresentFlag\": %d,\n",
729 frame_data.delta_q_present_flag);
730 buf += snprintf(buf, MAX_BUFFER, " \"deltaQRes\": %d,\n",
731 frame_data.delta_q_res);
732 buf += put_str(buf, " \"config\": {");
733 buf += put_map(buf, config_map);
734 buf += put_str(buf, "},\n");
735 buf += put_str(buf, " \"configString\": \"");
736 buf += put_str_with_escape(buf, aom_codec_build_config());
737 buf += put_str(buf, "\"\n");
738 decoded_frame_count++;
739 buf += put_str(buf, "},\n");
740 *(buf++) = 0;
741 on_frame_decoded_dump(buffer);
742 aom_free(buffer);
743}
744
745void ifd_init_cb(void) {
747 ii.inspect_cb = inspect;
748 ii.inspect_ctx = NULL;
750}
751
752EMSCRIPTEN_KEEPALIVE
753int open_file(char *file) {
754 if (file == NULL) {
755 // The JS analyzer puts the .ivf file at this location.
756 file = "/tmp/input.ivf";
757 }
758 reader = aom_video_reader_open(file);
759 if (!reader) die("Failed to open %s for reading.", file);
760 info = aom_video_reader_get_info(reader);
761 aom_codec_iface_t *decoder = get_aom_decoder_by_fourcc(info->codec_fourcc);
762 if (!decoder) die("Unknown input codec.");
763 fprintf(stderr, "Using %s\n", aom_codec_iface_name(decoder));
764 if (aom_codec_dec_init(&codec, decoder, NULL, 0))
765 die("Failed to initialize decoder.");
766 ifd_init(&frame_data, info->frame_width, info->frame_height);
767 ifd_init_cb();
768 return EXIT_SUCCESS;
769}
770
772int have_frame = 0;
773const unsigned char *frame;
774const unsigned char *end_frame;
775size_t frame_size = 0;
776
777EMSCRIPTEN_KEEPALIVE
778int read_frame(void) {
779 img = NULL;
780
781 // This loop skips over any frames that are show_existing_frames, as
782 // there is nothing to analyze.
783 do {
784 if (!have_frame) {
785 if (!aom_video_reader_read_frame(reader)) return EXIT_FAILURE;
786 frame = aom_video_reader_get_frame(reader, &frame_size);
787
788 have_frame = 1;
789 end_frame = frame + frame_size;
790 }
791
792 if (aom_codec_decode(&codec, frame, (unsigned int)frame_size, &adr) !=
793 AOM_CODEC_OK) {
794 die_codec(&codec, "Failed to decode frame.");
795 }
796
797 frame = adr.buf;
798 frame_size = end_frame - frame;
799 if (frame == end_frame) have_frame = 0;
800 } while (adr.show_existing);
801
802 int got_any_frames = 0;
803 aom_image_t *frame_img;
804 struct av1_ref_frame ref_dec;
805 ref_dec.idx = adr.idx;
806
807 // ref_dec.idx is the index to the reference buffer idx to AV1_GET_REFERENCE
808 // if its -1 the decoder didn't update any reference buffer and the only
809 // way to see the frame is aom_codec_get_frame.
810 if (ref_dec.idx == -1) {
811 aom_codec_iter_t iter = NULL;
812 img = frame_img = aom_codec_get_frame(&codec, &iter);
813 ++frame_count;
814 got_any_frames = 1;
815 } else if (!aom_codec_control(&codec, AV1_GET_REFERENCE, &ref_dec)) {
816 img = frame_img = &ref_dec.img;
817 ++frame_count;
818 got_any_frames = 1;
819 }
820 if (!got_any_frames) {
821 return EXIT_FAILURE;
822 }
823 return EXIT_SUCCESS;
824}
825
826EMSCRIPTEN_KEEPALIVE
827const char *get_aom_codec_build_config(void) {
828 return aom_codec_build_config();
829}
830
831EMSCRIPTEN_KEEPALIVE
832int get_bit_depth(void) { return img->bit_depth; }
833
834EMSCRIPTEN_KEEPALIVE
835int get_bits_per_sample(void) { return img->bps; }
836
837EMSCRIPTEN_KEEPALIVE
838int get_image_format(void) { return img->fmt; }
839
840EMSCRIPTEN_KEEPALIVE
841unsigned char *get_plane(int plane) { return img->planes[plane]; }
842
843EMSCRIPTEN_KEEPALIVE
844int get_plane_stride(int plane) { return img->stride[plane]; }
845
846EMSCRIPTEN_KEEPALIVE
847int get_plane_width(int plane) { return aom_img_plane_width(img, plane); }
848
849EMSCRIPTEN_KEEPALIVE
850int get_plane_height(int plane) { return aom_img_plane_height(img, plane); }
851
852EMSCRIPTEN_KEEPALIVE
853int get_frame_width(void) { return info->frame_width; }
854
855EMSCRIPTEN_KEEPALIVE
856int get_frame_height(void) { return info->frame_height; }
857
858static void parse_args(char **argv) {
859 char **argi, **argj;
860 struct arg arg;
861 (void)dump_accounting_arg;
862 (void)dump_cdef_arg;
863 for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
864 arg.argv_step = 1;
865 if (arg_match(&arg, &dump_block_size_arg, argi)) layers |= BLOCK_SIZE_LAYER;
866#if CONFIG_ACCOUNTING
867 else if (arg_match(&arg, &dump_accounting_arg, argi))
868 layers |= ACCOUNTING_LAYER;
869#endif
870 else if (arg_match(&arg, &dump_transform_size_arg, argi))
871 layers |= TRANSFORM_SIZE_LAYER;
872 else if (arg_match(&arg, &dump_transform_type_arg, argi))
873 layers |= TRANSFORM_TYPE_LAYER;
874 else if (arg_match(&arg, &dump_mode_arg, argi))
875 layers |= MODE_LAYER;
876 else if (arg_match(&arg, &dump_uv_mode_arg, argi))
877 layers |= UV_MODE_LAYER;
878 else if (arg_match(&arg, &dump_motion_mode_arg, argi))
879 layers |= MOTION_MODE_LAYER;
880 else if (arg_match(&arg, &dump_compound_type_arg, argi))
881 layers |= COMPOUND_TYPE_LAYER;
882 else if (arg_match(&arg, &dump_skip_arg, argi))
883 layers |= SKIP_LAYER;
884 else if (arg_match(&arg, &dump_filter_arg, argi))
885 layers |= FILTER_LAYER;
886 else if (arg_match(&arg, &dump_cdef_arg, argi))
887 layers |= CDEF_LAYER;
888 else if (arg_match(&arg, &dump_cfl_arg, argi))
889 layers |= CFL_LAYER;
890 else if (arg_match(&arg, &dump_reference_frame_arg, argi))
891 layers |= REFERENCE_FRAME_LAYER;
892 else if (arg_match(&arg, &dump_motion_vectors_arg, argi))
893 layers |= MOTION_VECTORS_LAYER;
894 else if (arg_match(&arg, &dump_dual_filter_type_arg, argi))
895 layers |= DUAL_FILTER_LAYER;
896 else if (arg_match(&arg, &dump_delta_q_arg, argi))
897 layers |= Q_INDEX_LAYER;
898 else if (arg_match(&arg, &dump_seg_id_arg, argi))
899 layers |= SEGMENT_ID_LAYER;
900 else if (arg_match(&arg, &dump_intrabc_arg, argi))
901 layers |= INTRABC_LAYER;
902 else if (arg_match(&arg, &dump_palette_arg, argi))
903 layers |= PALETTE_LAYER;
904 else if (arg_match(&arg, &dump_uv_palette_arg, argi))
905 layers |= UV_PALETTE_LAYER;
906 else if (arg_match(&arg, &dump_all_arg, argi))
907 layers |= ALL_LAYERS;
908 else if (arg_match(&arg, &compress_arg, argi))
909 compress = 1;
910 else if (arg_match(&arg, &usage_arg, argi))
911 usage_exit();
912 else if (arg_match(&arg, &limit_arg, argi))
913 stop_after = arg_parse_uint(&arg);
914 else if (arg_match(&arg, &skip_non_transform_arg, argi))
915 skip_non_transform = arg_parse_uint(&arg);
916 else if (arg_match(&arg, &combined_arg, argi))
917 convert_to_indices(
918 (char *)arg.val, combined_parm_list,
919 sizeof(combined_parm_list) / sizeof(combined_parm_list[0]),
920 &combined_parm_count);
921 else
922 argj++;
923 }
924}
925
926static const char *exec_name;
927
928void usage_exit(void) {
929 fprintf(stderr, "Usage: %s src_filename <options>\n", exec_name);
930 fprintf(stderr, "\nOptions:\n");
931 arg_show_usage(stderr, main_args);
932 exit(EXIT_FAILURE);
933}
934
935EMSCRIPTEN_KEEPALIVE
936int main(int argc, char **argv) {
937 exec_name = argv[0];
938 parse_args(argv);
939 if (argc >= 2) {
940 open_file(argv[1]);
941 printf("[\n");
942 while (1) {
943 if (stop_after && (decoded_frame_count >= stop_after)) break;
944 if (read_frame()) break;
945 }
946 printf("null\n");
947 printf("]");
948 } else {
949 usage_exit();
950 }
951}
952
953EMSCRIPTEN_KEEPALIVE
954void quit(void) {
955 if (aom_codec_destroy(&codec)) die_codec(&codec, "Failed to destroy codec");
956 aom_video_reader_close(reader);
957}
958
959EMSCRIPTEN_KEEPALIVE
960void set_layers(LayerType v) { layers = v; }
961
962EMSCRIPTEN_KEEPALIVE
963void set_compress(int v) { compress = v; }
Describes the decoder algorithm interface to applications.
int aom_img_plane_height(const aom_image_t *img, int plane)
Get the height of a plane.
int aom_img_plane_width(const aom_image_t *img, int plane)
Get the width of a plane.
Provides definitions for using AOM or AV1 within the aom Decoder interface.
struct Accounting Accounting
Definition aomdx.h:50
@ AV1_SET_INSPECTION_CALLBACK
Codec control function to set an aom_inspect_cb callback that is invoked each time a frame is decoded...
Definition aomdx.h:382
@ AV1_GET_REFERENCE
Codec control function to get a pointer to a reference frame.
Definition aom.h:51
const char * aom_codec_iface_name(aom_codec_iface_t *iface)
Return the name for a given interface.
aom_codec_err_t aom_codec_control(aom_codec_ctx_t *ctx, int ctrl_id,...)
Algorithm Control.
const struct aom_codec_iface aom_codec_iface_t
Codec interface structure.
Definition aom_codec.h:254
const char * aom_codec_build_config(void)
Return the build configuration.
aom_codec_err_t aom_codec_destroy(aom_codec_ctx_t *ctx)
Destroy a codec instance.
const void * aom_codec_iter_t
Iterator.
Definition aom_codec.h:288
@ AOM_CODEC_OK
Operation completed without error.
Definition aom_codec.h:157
aom_image_t * aom_codec_get_frame(aom_codec_ctx_t *ctx, aom_codec_iter_t *iter)
Decoded frames iterator.
aom_codec_err_t aom_codec_decode(aom_codec_ctx_t *ctx, const uint8_t *data, size_t data_sz, void *user_priv)
Decode data.
#define aom_codec_dec_init(ctx, iface, cfg, flags)
Convenience macro for aom_codec_dec_init_ver()
Definition aom_decoder.h:129
Structure to collect a buffer index when inspecting.
Definition aomdx.h:78
const unsigned char * buf
Definition aomdx.h:80
int show_existing
Definition aomdx.h:84
int idx
Definition aomdx.h:82
Codec context structure.
Definition aom_codec.h:298
Image Descriptor.
Definition aom_image.h:182
unsigned int bit_depth
Definition aom_image.h:194
aom_img_fmt_t fmt
Definition aom_image.h:183
int stride[3]
Definition aom_image.h:216
int bps
Definition aom_image.h:219
unsigned char * planes[3]
Definition aom_image.h:215
Structure to hold inspection callback and context.
Definition aomdx.h:64
void * inspect_ctx
Definition aomdx.h:69
aom_inspect_cb inspect_cb
Definition aomdx.h:66
AV1 specific reference frame data struct.
Definition aom.h:89
aom_image_t img
Definition aom.h:92
int idx
Definition aom.h:90