• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3  *
4  * This source code is subject to the terms of the BSD 2 Clause License and
5  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6  * was not distributed with this source code in the LICENSE file, you can
7  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8  * Media Patent License 1.0 was not distributed with this source code in the
9  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10  */
11 
12 // Inspect Decoder
13 // ================
14 //
15 // This is a simple decoder loop that writes JSON stats to stdout. This tool
16 // can also be compiled with Emscripten and used as a library.
17 
18 #include <stdio.h>
19 #include <stdlib.h>
20 #include <string.h>
21 
22 #ifdef __EMSCRIPTEN__
23 #include <emscripten.h>
24 #else
25 #define EMSCRIPTEN_KEEPALIVE
26 #endif
27 
28 #include "config/aom_config.h"
29 
30 #include "aom/aom_decoder.h"
31 #include "aom/aomdx.h"
32 #include "av1/common/av1_common_int.h"
33 
34 #if CONFIG_ACCOUNTING
35 #include "av1/decoder/accounting.h"
36 #endif
37 
38 #include "av1/decoder/inspection.h"
39 #include "common/args.h"
40 #include "common/tools_common.h"
41 #include "common/video_common.h"
42 #include "common/video_reader.h"
43 
// Size in bytes of the JSON text buffer allocated for every inspected frame.
const int MAX_BUFFER = 256 * 1024 * 1024;

// One bit per kind of per-block information that can be dumped. The bits are
// OR-ed together into `layers` and tested individually when emitting a frame.
typedef enum {
  ACCOUNTING_LAYER = 1 << 0,
  BLOCK_SIZE_LAYER = 1 << 1,
  TRANSFORM_SIZE_LAYER = 1 << 2,
  TRANSFORM_TYPE_LAYER = 1 << 3,
  MODE_LAYER = 1 << 4,
  SKIP_LAYER = 1 << 5,
  FILTER_LAYER = 1 << 6,
  CDEF_LAYER = 1 << 7,
  REFERENCE_FRAME_LAYER = 1 << 8,
  MOTION_VECTORS_LAYER = 1 << 9,
  UV_MODE_LAYER = 1 << 10,
  CFL_LAYER = 1 << 11,
  DUAL_FILTER_LAYER = 1 << 12,
  Q_INDEX_LAYER = 1 << 13,
  SEGMENT_ID_LAYER = 1 << 14,
  MOTION_MODE_LAYER = 1 << 15,
  COMPOUND_TYPE_LAYER = 1 << 16,
  INTRABC_LAYER = 1 << 17,
  PALETTE_LAYER = 1 << 18,
  UV_PALETTE_LAYER = 1 << 19,
  ALL_LAYERS = (1 << 20) - 1  // all twenty layer bits set
} LayerType;

// Bitmask of the layers selected for output.
static LayerType layers = 0;

// NOTE(review): presumably the frame limit set by --limit; the code that
// assigns it is outside this view.
static int stop_after = 0;
// Non-zero enables run-length encoding in the per-block JSON arrays.
static int compress = 0;
75 
76 static const arg_def_t limit_arg =
77     ARG_DEF(NULL, "limit", 1, "Stop decoding after n frames");
78 static const arg_def_t dump_all_arg = ARG_DEF("A", "all", 0, "Dump All");
79 static const arg_def_t compress_arg =
80     ARG_DEF("x", "compress", 0, "Compress JSON using RLE");
81 static const arg_def_t dump_accounting_arg =
82     ARG_DEF("a", "accounting", 0, "Dump Accounting");
83 static const arg_def_t dump_block_size_arg =
84     ARG_DEF("bs", "blockSize", 0, "Dump Block Size");
85 static const arg_def_t dump_motion_vectors_arg =
86     ARG_DEF("mv", "motionVectors", 0, "Dump Motion Vectors");
87 static const arg_def_t dump_transform_size_arg =
88     ARG_DEF("ts", "transformSize", 0, "Dump Transform Size");
89 static const arg_def_t dump_transform_type_arg =
90     ARG_DEF("tt", "transformType", 0, "Dump Transform Type");
91 static const arg_def_t dump_mode_arg = ARG_DEF("m", "mode", 0, "Dump Mode");
92 static const arg_def_t dump_motion_mode_arg =
93     ARG_DEF("mm", "motion_mode", 0, "Dump Motion Modes");
94 static const arg_def_t dump_compound_type_arg =
95     ARG_DEF("ct", "compound_type", 0, "Dump Compound Types");
96 static const arg_def_t dump_uv_mode_arg =
97     ARG_DEF("uvm", "uv_mode", 0, "Dump UV Intra Prediction Modes");
98 static const arg_def_t dump_skip_arg = ARG_DEF("s", "skip", 0, "Dump Skip");
99 static const arg_def_t dump_filter_arg =
100     ARG_DEF("f", "filter", 0, "Dump Filter");
101 static const arg_def_t dump_cdef_arg = ARG_DEF("c", "cdef", 0, "Dump CDEF");
102 static const arg_def_t dump_cfl_arg =
103     ARG_DEF("cfl", "chroma_from_luma", 0, "Dump Chroma from Luma Alphas");
104 static const arg_def_t dump_dual_filter_type_arg =
105     ARG_DEF("df", "dualFilterType", 0, "Dump Dual Filter Type");
106 static const arg_def_t dump_reference_frame_arg =
107     ARG_DEF("r", "referenceFrame", 0, "Dump Reference Frame");
108 static const arg_def_t dump_delta_q_arg =
109     ARG_DEF("dq", "delta_q", 0, "Dump QIndex");
110 static const arg_def_t dump_seg_id_arg =
111     ARG_DEF("si", "seg_id", 0, "Dump Segment ID");
112 static const arg_def_t dump_intrabc_arg =
113     ARG_DEF("ibc", "intrabc", 0, "Dump If IntraBC Is Used");
114 static const arg_def_t dump_palette_arg =
115     ARG_DEF("plt", "palette", 0, "Dump Palette Size");
116 static const arg_def_t dump_uv_palette_arg =
117     ARG_DEF("uvp", "uv_palette", 0, "Dump UV Palette Size");
118 static const arg_def_t usage_arg = ARG_DEF("h", "help", 0, "Help");
119 static const arg_def_t skip_non_transform_arg = ARG_DEF(
120     "snt", "skip_non_transform", 1, "Skip is counted as a non transform.");
121 static const arg_def_t combined_arg =
122     ARG_DEF("comb", "combined", 1, "combinining parameters into one output.");
123 
124 int combined_parm_list[15];
125 int combined_parm_count = 0;
126 
127 static const arg_def_t *main_args[] = { &limit_arg,
128                                         &dump_all_arg,
129                                         &compress_arg,
130 #if CONFIG_ACCOUNTING
131                                         &dump_accounting_arg,
132 #endif
133                                         &dump_block_size_arg,
134                                         &dump_transform_size_arg,
135                                         &dump_transform_type_arg,
136                                         &dump_mode_arg,
137                                         &dump_uv_mode_arg,
138                                         &dump_motion_mode_arg,
139                                         &dump_compound_type_arg,
140                                         &dump_skip_arg,
141                                         &dump_filter_arg,
142                                         &dump_cdef_arg,
143                                         &dump_dual_filter_type_arg,
144                                         &dump_cfl_arg,
145                                         &dump_reference_frame_arg,
146                                         &dump_motion_vectors_arg,
147                                         &dump_delta_q_arg,
148                                         &dump_seg_id_arg,
149                                         &dump_intrabc_arg,
150                                         &dump_palette_arg,
151                                         &dump_uv_palette_arg,
152                                         &usage_arg,
153                                         &skip_non_transform_arg,
154                                         &combined_arg,
155                                         NULL };
// A (name, value) pair used to describe an enumerator in the JSON output.
typedef struct map_entry {
  const char *name;
  int value;
} map_entry;

// Builds a map_entry initializer whose name is the spelling of the constant.
#define ENUM(name) { #name, name }
// Sentinel initializer that terminates a map_entry table (name == NULL).
#define LAST_ENUM { NULL, 0 }
164 
165 const map_entry refs_map[] = {
166   ENUM(INTRA_FRAME),   ENUM(LAST_FRAME),   ENUM(LAST2_FRAME),
167   ENUM(LAST3_FRAME),   ENUM(GOLDEN_FRAME), ENUM(BWDREF_FRAME),
168   ENUM(ALTREF2_FRAME), ENUM(ALTREF_FRAME), LAST_ENUM
169 };
170 
171 const map_entry block_size_map[] = {
172   ENUM(BLOCK_4X4),     ENUM(BLOCK_4X8),    ENUM(BLOCK_8X4),
173   ENUM(BLOCK_8X8),     ENUM(BLOCK_8X16),   ENUM(BLOCK_16X8),
174   ENUM(BLOCK_16X16),   ENUM(BLOCK_16X32),  ENUM(BLOCK_32X16),
175   ENUM(BLOCK_32X32),   ENUM(BLOCK_32X64),  ENUM(BLOCK_64X32),
176   ENUM(BLOCK_64X64),   ENUM(BLOCK_64X128), ENUM(BLOCK_128X64),
177   ENUM(BLOCK_128X128), ENUM(BLOCK_4X16),   ENUM(BLOCK_16X4),
178   ENUM(BLOCK_8X32),    ENUM(BLOCK_32X8),   ENUM(BLOCK_16X64),
179   ENUM(BLOCK_64X16),   LAST_ENUM
180 };
181 
182 #define TX_SKIP -1
183 
184 const map_entry tx_size_map[] = {
185   ENUM(TX_4X4),   ENUM(TX_8X8),   ENUM(TX_16X16), ENUM(TX_32X32),
186   ENUM(TX_64X64), ENUM(TX_4X8),   ENUM(TX_8X4),   ENUM(TX_8X16),
187   ENUM(TX_16X8),  ENUM(TX_16X32), ENUM(TX_32X16), ENUM(TX_32X64),
188   ENUM(TX_64X32), ENUM(TX_4X16),  ENUM(TX_16X4),  ENUM(TX_8X32),
189   ENUM(TX_32X8),  ENUM(TX_16X64), ENUM(TX_64X16), LAST_ENUM
190 };
191 
192 const map_entry tx_type_map[] = { ENUM(DCT_DCT),
193                                   ENUM(ADST_DCT),
194                                   ENUM(DCT_ADST),
195                                   ENUM(ADST_ADST),
196                                   ENUM(FLIPADST_DCT),
197                                   ENUM(DCT_FLIPADST),
198                                   ENUM(FLIPADST_FLIPADST),
199                                   ENUM(ADST_FLIPADST),
200                                   ENUM(FLIPADST_ADST),
201                                   ENUM(IDTX),
202                                   ENUM(V_DCT),
203                                   ENUM(H_DCT),
204                                   ENUM(V_ADST),
205                                   ENUM(H_ADST),
206                                   ENUM(V_FLIPADST),
207                                   ENUM(H_FLIPADST),
208                                   LAST_ENUM };
209 const map_entry dual_filter_map[] = { ENUM(REG_REG),       ENUM(REG_SMOOTH),
210                                       ENUM(REG_SHARP),     ENUM(SMOOTH_REG),
211                                       ENUM(SMOOTH_SMOOTH), ENUM(SMOOTH_SHARP),
212                                       ENUM(SHARP_REG),     ENUM(SHARP_SMOOTH),
213                                       ENUM(SHARP_SHARP),   LAST_ENUM };
214 
215 const map_entry prediction_mode_map[] = {
216   ENUM(DC_PRED),     ENUM(V_PRED),        ENUM(H_PRED),
217   ENUM(D45_PRED),    ENUM(D135_PRED),     ENUM(D113_PRED),
218   ENUM(D157_PRED),   ENUM(D203_PRED),     ENUM(D67_PRED),
219   ENUM(SMOOTH_PRED), ENUM(SMOOTH_V_PRED), ENUM(SMOOTH_H_PRED),
220   ENUM(PAETH_PRED),  ENUM(NEARESTMV),     ENUM(NEARMV),
221   ENUM(GLOBALMV),    ENUM(NEWMV),         ENUM(NEAREST_NEARESTMV),
222   ENUM(NEAR_NEARMV), ENUM(NEAREST_NEWMV), ENUM(NEW_NEARESTMV),
223   ENUM(NEAR_NEWMV),  ENUM(NEW_NEARMV),    ENUM(GLOBAL_GLOBALMV),
224   ENUM(NEW_NEWMV),   ENUM(INTRA_INVALID), LAST_ENUM
225 };
226 
227 const map_entry motion_mode_map[] = { ENUM(SIMPLE_TRANSLATION),
228                                       ENUM(OBMC_CAUSAL),    // 2-sided OBMC
229                                       ENUM(WARPED_CAUSAL),  // 2-sided WARPED
230                                       LAST_ENUM };
231 
232 const map_entry compound_type_map[] = { ENUM(COMPOUND_AVERAGE),
233                                         ENUM(COMPOUND_WEDGE),
234                                         ENUM(COMPOUND_DIFFWTD), LAST_ENUM };
235 
236 const map_entry uv_prediction_mode_map[] = {
237   ENUM(UV_DC_PRED),       ENUM(UV_V_PRED),
238   ENUM(UV_H_PRED),        ENUM(UV_D45_PRED),
239   ENUM(UV_D135_PRED),     ENUM(UV_D113_PRED),
240   ENUM(UV_D157_PRED),     ENUM(UV_D203_PRED),
241   ENUM(UV_D67_PRED),      ENUM(UV_SMOOTH_PRED),
242   ENUM(UV_SMOOTH_V_PRED), ENUM(UV_SMOOTH_H_PRED),
243   ENUM(UV_PAETH_PRED),    ENUM(UV_CFL_PRED),
244   ENUM(UV_MODE_INVALID),  LAST_ENUM
245 };
246 #define NO_SKIP 0
247 #define SKIP 1
248 
249 const map_entry skip_map[] = { ENUM(SKIP), ENUM(NO_SKIP), LAST_ENUM };
250 
251 const map_entry intrabc_map[] = { { "INTRABC", 1 },
252                                   { "NO_INTRABC", 0 },
253                                   LAST_ENUM };
254 
255 const map_entry palette_map[] = {
256   { "ZERO_COLORS", 0 },  { "TWO_COLORS", 2 },   { "THREE_COLORS", 3 },
257   { "FOUR_COLORS", 4 },  { "FIVE_COLORS", 5 },  { "SIX_COLORS", 6 },
258   { "SEVEN_COLORS", 7 }, { "EIGHT_COLORS", 8 }, LAST_ENUM
259 };
260 
261 const map_entry config_map[] = { ENUM(MI_SIZE), LAST_ENUM };
262 
263 static const char *exec_name;
264 
265 struct parm_offset {
266   char parm[60];
267   char offset;
268 };
269 struct parm_offset parm_offsets[] = {
270   { "blockSize", offsetof(insp_mi_data, bsize) },
271   { "transformSize", offsetof(insp_mi_data, tx_size) },
272   { "transformType", offsetof(insp_mi_data, tx_type) },
273   { "dualFilterType", offsetof(insp_mi_data, dual_filter_type) },
274   { "mode", offsetof(insp_mi_data, mode) },
275   { "uv_mode", offsetof(insp_mi_data, uv_mode) },
276   { "motion_mode", offsetof(insp_mi_data, motion_mode) },
277   { "compound_type", offsetof(insp_mi_data, compound_type) },
278   { "referenceFrame", offsetof(insp_mi_data, ref_frame) },
279   { "skip", offsetof(insp_mi_data, skip) },
280 };
281 int parm_count = sizeof(parm_offsets) / sizeof(parm_offsets[0]);
282 
convert_to_indices(char * str,int * indices,int maxCount,int * count)283 int convert_to_indices(char *str, int *indices, int maxCount, int *count) {
284   *count = 0;
285   do {
286     char *comma = strchr(str, ',');
287     int length = (comma ? (int)(comma - str) : (int)strlen(str));
288     int i;
289     for (i = 0; i < parm_count; ++i) {
290       if (!strncmp(str, parm_offsets[i].parm, length)) {
291         break;
292       }
293     }
294     if (i == parm_count) return 0;
295     indices[(*count)++] = i;
296     if (*count > maxCount) return 0;
297     str += length + 1;
298   } while (strlen(str) > 0);
299   return 1;
300 }
301 
302 insp_frame_data frame_data;
303 int frame_count = 0;
304 int decoded_frame_count = 0;
305 aom_codec_ctx_t codec;
306 AvxVideoReader *reader = NULL;
307 const AvxVideoInfo *info = NULL;
308 aom_image_t *img = NULL;
309 
on_frame_decoded_dump(char * json)310 void on_frame_decoded_dump(char *json) {
311 #ifdef __EMSCRIPTEN__
312   EM_ASM_({ Module.on_frame_decoded_json($0); }, json);
313 #else
314   printf("%s", json);
315 #endif
316 }
317 
// Formatting the JSON buffer with snprintf is very slow, particularly in
// Emscripten builds, so the put_* helpers write characters directly instead.

// Copies `str` into `buffer` without its terminating NUL and returns the
// number of characters copied. The caller must provide enough room.
int put_str(char *buffer, const char *str) {
  const char *src = str;
  char *dst = buffer;
  while (*src != '\0') {
    *dst++ = *src++;
  }
  return (int)(src - str);
}
327 
// Copies `str` into `buffer` for use inside a JSON string literal and returns
// the number of characters written (no terminating NUL is added).
//
// Control characters (codes below 0x20) are dropped, and '"' and '\\' are
// preceded by a backslash. Bytes are classified as unsigned char so that
// bytes >= 0x80 are copied unchanged whether plain char is signed or not.
int put_str_with_escape(char *buffer, const char *str) {
  int j = 0;
  for (int i = 0; str[i] != '\0'; i++) {
    const unsigned char ch = (unsigned char)str[i];
    if (ch < ' ') {
      continue;
    }
    if (ch == '"' || ch == '\\') {
      buffer[j++] = '\\';
    }
    buffer[j++] = str[i];
  }
  return j;
}
341 
// Writes `num` in decimal into `buffer`, optionally surrounded by `prefix`
// and `suffix` (either is skipped when 0), and returns the number of
// characters written. No terminating NUL is added.
//
// The magnitude is computed in unsigned arithmetic so that INT_MIN is handled
// without negating a signed value, which would overflow.
int put_num(char *buffer, char prefix, int num, char suffix) {
  int i = 0;
  if (prefix) {
    buffer[i++] = prefix;
  }
  unsigned int magnitude = (unsigned int)num;
  if (num < 0) {
    buffer[i++] = '-';
    magnitude = 0u - magnitude;
  }
  // Emit the digits least significant first, then reverse them in place.
  const int first_digit = i;
  do {
    buffer[i++] = (char)('0' + (int)(magnitude % 10u));
    magnitude /= 10u;
  } while (magnitude != 0u);
  for (int lo = first_digit, hi = i - 1; lo < hi; ++lo, --hi) {
    const char tmp = buffer[lo];
    buffer[lo] = buffer[hi];
    buffer[hi] = tmp;
  }
  if (suffix) {
    buffer[i++] = suffix;
  }
  return i;
}
378 
put_map(char * buffer,const map_entry * map)379 int put_map(char *buffer, const map_entry *map) {
380   char *buf = buffer;
381   const map_entry *entry = map;
382   while (entry->name != NULL) {
383     *(buf++) = '"';
384     buf += put_str(buf, entry->name);
385     *(buf++) = '"';
386     buf += put_num(buf, ':', entry->value, 0);
387     entry++;
388     if (entry->name != NULL) {
389       *(buf++) = ',';
390     }
391   }
392   return (int)(buf - buffer);
393 }
394 
put_reference_frame(char * buffer)395 int put_reference_frame(char *buffer) {
396   const int mi_rows = frame_data.mi_rows;
397   const int mi_cols = frame_data.mi_cols;
398   char *buf = buffer;
399   int r, c, t;
400   buf += put_str(buf, "  \"referenceFrameMap\": {");
401   buf += put_map(buf, refs_map);
402   buf += put_str(buf, "},\n");
403   buf += put_str(buf, "  \"referenceFrame\": [");
404   for (r = 0; r < mi_rows; ++r) {
405     *(buf++) = '[';
406     for (c = 0; c < mi_cols; ++c) {
407       insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
408       buf += put_num(buf, '[', mi->ref_frame[0], 0);
409       buf += put_num(buf, ',', mi->ref_frame[1], ']');
410       if (compress) {  // RLE
411         for (t = c + 1; t < mi_cols; ++t) {
412           insp_mi_data *next_mi = &frame_data.mi_grid[r * mi_cols + t];
413           if (mi->ref_frame[0] != next_mi->ref_frame[0] ||
414               mi->ref_frame[1] != next_mi->ref_frame[1]) {
415             break;
416           }
417         }
418         if (t - c > 1) {
419           *(buf++) = ',';
420           buf += put_num(buf, '[', t - c - 1, ']');
421           c = t - 1;
422         }
423       }
424       if (c < mi_cols - 1) *(buf++) = ',';
425     }
426     *(buf++) = ']';
427     if (r < mi_rows - 1) *(buf++) = ',';
428   }
429   buf += put_str(buf, "],\n");
430   return (int)(buf - buffer);
431 }
432 
put_motion_vectors(char * buffer)433 int put_motion_vectors(char *buffer) {
434   const int mi_rows = frame_data.mi_rows;
435   const int mi_cols = frame_data.mi_cols;
436   char *buf = buffer;
437   int r, c, t;
438   buf += put_str(buf, "  \"motionVectors\": [");
439   for (r = 0; r < mi_rows; ++r) {
440     *(buf++) = '[';
441     for (c = 0; c < mi_cols; ++c) {
442       insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
443       buf += put_num(buf, '[', mi->mv[0].col, 0);
444       buf += put_num(buf, ',', mi->mv[0].row, 0);
445       buf += put_num(buf, ',', mi->mv[1].col, 0);
446       buf += put_num(buf, ',', mi->mv[1].row, ']');
447       if (compress) {  // RLE
448         for (t = c + 1; t < mi_cols; ++t) {
449           insp_mi_data *next_mi = &frame_data.mi_grid[r * mi_cols + t];
450           if (mi->mv[0].col != next_mi->mv[0].col ||
451               mi->mv[0].row != next_mi->mv[0].row ||
452               mi->mv[1].col != next_mi->mv[1].col ||
453               mi->mv[1].row != next_mi->mv[1].row) {
454             break;
455           }
456         }
457         if (t - c > 1) {
458           *(buf++) = ',';
459           buf += put_num(buf, '[', t - c - 1, ']');
460           c = t - 1;
461         }
462       }
463       if (c < mi_cols - 1) *(buf++) = ',';
464     }
465     *(buf++) = ']';
466     if (r < mi_rows - 1) *(buf++) = ',';
467   }
468   buf += put_str(buf, "],\n");
469   return (int)(buf - buffer);
470 }
471 
put_combined(char * buffer)472 int put_combined(char *buffer) {
473   const int mi_rows = frame_data.mi_rows;
474   const int mi_cols = frame_data.mi_cols;
475   char *buf = buffer;
476   int r, c, p;
477   buf += put_str(buf, "  \"");
478   for (p = 0; p < combined_parm_count; ++p) {
479     if (p) buf += put_str(buf, "&");
480     buf += put_str(buf, parm_offsets[combined_parm_list[p]].parm);
481   }
482   buf += put_str(buf, "\": [");
483   for (r = 0; r < mi_rows; ++r) {
484     *(buf++) = '[';
485     for (c = 0; c < mi_cols; ++c) {
486       insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
487       *(buf++) = '[';
488       for (p = 0; p < combined_parm_count; ++p) {
489         if (p) *(buf++) = ',';
490         int16_t *v = (int16_t *)(((int8_t *)mi) +
491                                  parm_offsets[combined_parm_list[p]].offset);
492         buf += put_num(buf, 0, v[0], 0);
493       }
494       *(buf++) = ']';
495       if (c < mi_cols - 1) *(buf++) = ',';
496     }
497     *(buf++) = ']';
498     if (r < mi_rows - 1) *(buf++) = ',';
499   }
500   buf += put_str(buf, "],\n");
501   return (int)(buf - buffer);
502 }
503 
put_block_info(char * buffer,const map_entry * map,const char * name,size_t offset,int len)504 int put_block_info(char *buffer, const map_entry *map, const char *name,
505                    size_t offset, int len) {
506   const int mi_rows = frame_data.mi_rows;
507   const int mi_cols = frame_data.mi_cols;
508   char *buf = buffer;
509   int r, c, t, i;
510   if (compress && len == 1) {
511     die("Can't encode scalars as arrays when RLE compression is enabled.");
512   }
513   if (map) {
514     buf += snprintf(buf, MAX_BUFFER, "  \"%sMap\": {", name);
515     buf += put_map(buf, map);
516     buf += put_str(buf, "},\n");
517   }
518   buf += snprintf(buf, MAX_BUFFER, "  \"%s\": [", name);
519   for (r = 0; r < mi_rows; ++r) {
520     *(buf++) = '[';
521     for (c = 0; c < mi_cols; ++c) {
522       insp_mi_data *mi = &frame_data.mi_grid[r * mi_cols + c];
523       int16_t *v = (int16_t *)(((int8_t *)mi) + offset);
524       if (len == 0) {
525         buf += put_num(buf, 0, v[0], 0);
526       } else {
527         buf += put_str(buf, "[");
528         for (i = 0; i < len; i++) {
529           buf += put_num(buf, 0, v[i], 0);
530           if (i < len - 1) {
531             buf += put_str(buf, ",");
532           }
533         }
534         buf += put_str(buf, "]");
535       }
536       if (compress) {  // RLE
537         for (t = c + 1; t < mi_cols; ++t) {
538           insp_mi_data *next_mi = &frame_data.mi_grid[r * mi_cols + t];
539           int16_t *nv = (int16_t *)(((int8_t *)next_mi) + offset);
540           int same = 0;
541           if (len == 0) {
542             same = v[0] == nv[0];
543           } else {
544             for (i = 0; i < len; i++) {
545               same = v[i] == nv[i];
546               if (!same) {
547                 break;
548               }
549             }
550           }
551           if (!same) {
552             break;
553           }
554         }
555         if (t - c > 1) {
556           *(buf++) = ',';
557           buf += put_num(buf, '[', t - c - 1, ']');
558           c = t - 1;
559         }
560       }
561       if (c < mi_cols - 1) *(buf++) = ',';
562     }
563     *(buf++) = ']';
564     if (r < mi_rows - 1) *(buf++) = ',';
565   }
566   buf += put_str(buf, "],\n");
567   return (int)(buf - buffer);
568 }
569 
#if CONFIG_ACCOUNTING
// Writes the "symbolsMap" array (the accounting dictionary strings) and the
// "symbols" array. In "symbols", an entry whose context differs from the
// previous entry's is written as [x,y]; every other entry is written as
// [id,bits,samples]. Returns the number of characters written, or 0 after
// printing "XXX" when the frame carries no accounting data.
// NOTE(review): the "XXX" marker goes to stdout, the same stream as the JSON
// in native builds - confirm that this is intended.
int put_accounting(char *buffer) {
  const Accounting *acct = frame_data.accounting;
  if (acct == NULL) {
    printf("XXX\n");
    return 0;
  }

  char *out = buffer;
  const int sym_count = acct->syms.num_syms;
  const int str_count = acct->syms.dictionary.num_strs;

  out += put_str(out, "  \"symbolsMap\": [");
  for (int s = 0; s < str_count; s++) {
    if (s > 0) *out++ = ',';
    out += snprintf(out, MAX_BUFFER, "\"%s\"", acct->syms.dictionary.strs[s]);
  }
  out += put_str(out, "],\n");

  out += put_str(out, "  \"symbols\": [\n    ");
  // Start from a context that the first comparison below treats as different.
  AccountingSymbolContext previous;
  previous.x = -2;
  previous.y = -2;
  for (int k = 0; k < sym_count; k++) {
    AccountingSymbol *sym = &acct->syms.syms[k];
    const int same_context =
        memcmp(&previous, &sym->context, sizeof(AccountingSymbolContext)) == 0;
    if (same_context) {
      out += put_num(out, '[', sym->id, 0);
      out += put_num(out, ',', sym->bits, 0);
      out += put_num(out, ',', sym->samples, ']');
    } else {
      out += put_num(out, '[', sym->context.x, 0);
      out += put_num(out, ',', sym->context.y, ']');
    }
    previous = sym->context;
    if (k < sym_count - 1) *out++ = ',';
  }
  out += put_str(out, "],\n");
  return (int)(out - buffer);
}
#endif
610 
611 int skip_non_transform = 0;
612 
inspect(void * pbi,void * data)613 void inspect(void *pbi, void *data) {
614   /* Fetch frame data. */
615   ifd_inspect(&frame_data, pbi, skip_non_transform);
616 
617   // Show existing frames just show a reference buffer we've already decoded.
618   // There's no information to show.
619   if (frame_data.show_existing_frame) return;
620 
621   (void)data;
622   // We allocate enough space and hope we don't write out of bounds. Totally
623   // unsafe but this speeds things up, especially when compiled to Javascript.
624   char *buffer = aom_malloc(MAX_BUFFER);
625   if (!buffer) {
626     fprintf(stderr, "Error allocating inspect info buffer\n");
627     abort();
628   }
629   char *buf = buffer;
630   buf += put_str(buf, "{\n");
631   if (layers & BLOCK_SIZE_LAYER) {
632     buf += put_block_info(buf, block_size_map, "blockSize",
633                           offsetof(insp_mi_data, bsize), 0);
634   }
635   if (layers & TRANSFORM_SIZE_LAYER) {
636     buf += put_block_info(buf, tx_size_map, "transformSize",
637                           offsetof(insp_mi_data, tx_size), 0);
638   }
639   if (layers & TRANSFORM_TYPE_LAYER) {
640     buf += put_block_info(buf, tx_type_map, "transformType",
641                           offsetof(insp_mi_data, tx_type), 0);
642   }
643   if (layers & DUAL_FILTER_LAYER) {
644     buf += put_block_info(buf, dual_filter_map, "dualFilterType",
645                           offsetof(insp_mi_data, dual_filter_type), 0);
646   }
647   if (layers & MODE_LAYER) {
648     buf += put_block_info(buf, prediction_mode_map, "mode",
649                           offsetof(insp_mi_data, mode), 0);
650   }
651   if (layers & UV_MODE_LAYER) {
652     buf += put_block_info(buf, uv_prediction_mode_map, "uv_mode",
653                           offsetof(insp_mi_data, uv_mode), 0);
654   }
655   if (layers & MOTION_MODE_LAYER) {
656     buf += put_block_info(buf, motion_mode_map, "motion_mode",
657                           offsetof(insp_mi_data, motion_mode), 0);
658   }
659   if (layers & COMPOUND_TYPE_LAYER) {
660     buf += put_block_info(buf, compound_type_map, "compound_type",
661                           offsetof(insp_mi_data, compound_type), 0);
662   }
663   if (layers & SKIP_LAYER) {
664     buf +=
665         put_block_info(buf, skip_map, "skip", offsetof(insp_mi_data, skip), 0);
666   }
667   if (layers & FILTER_LAYER) {
668     buf +=
669         put_block_info(buf, NULL, "filter", offsetof(insp_mi_data, filter), 2);
670   }
671   if (layers & CDEF_LAYER) {
672     buf += put_block_info(buf, NULL, "cdef_level",
673                           offsetof(insp_mi_data, cdef_level), 0);
674     buf += put_block_info(buf, NULL, "cdef_strength",
675                           offsetof(insp_mi_data, cdef_strength), 0);
676   }
677   if (layers & CFL_LAYER) {
678     buf += put_block_info(buf, NULL, "cfl_alpha_idx",
679                           offsetof(insp_mi_data, cfl_alpha_idx), 0);
680     buf += put_block_info(buf, NULL, "cfl_alpha_sign",
681                           offsetof(insp_mi_data, cfl_alpha_sign), 0);
682   }
683   if (layers & Q_INDEX_LAYER) {
684     buf += put_block_info(buf, NULL, "delta_q",
685                           offsetof(insp_mi_data, current_qindex), 0);
686   }
687   if (layers & SEGMENT_ID_LAYER) {
688     buf += put_block_info(buf, NULL, "seg_id",
689                           offsetof(insp_mi_data, segment_id), 0);
690   }
691   if (layers & MOTION_VECTORS_LAYER) {
692     buf += put_motion_vectors(buf);
693   }
694   if (layers & INTRABC_LAYER) {
695     buf += put_block_info(buf, intrabc_map, "intrabc",
696                           offsetof(insp_mi_data, intrabc), 0);
697   }
698   if (layers & PALETTE_LAYER) {
699     buf += put_block_info(buf, palette_map, "palette",
700                           offsetof(insp_mi_data, palette), 0);
701   }
702   if (layers & UV_PALETTE_LAYER) {
703     buf += put_block_info(buf, palette_map, "uv_palette",
704                           offsetof(insp_mi_data, uv_palette), 0);
705   }
706   if (combined_parm_count > 0) buf += put_combined(buf);
707   if (layers & REFERENCE_FRAME_LAYER) {
708     buf += put_block_info(buf, refs_map, "referenceFrame",
709                           offsetof(insp_mi_data, ref_frame), 2);
710   }
711 #if CONFIG_ACCOUNTING
712   if (layers & ACCOUNTING_LAYER) {
713     buf += put_accounting(buf);
714   }
715 #endif
716   buf +=
717       snprintf(buf, MAX_BUFFER, "  \"frame\": %d,\n", frame_data.frame_number);
718   buf += snprintf(buf, MAX_BUFFER, "  \"showFrame\": %d,\n",
719                   frame_data.show_frame);
720   buf += snprintf(buf, MAX_BUFFER, "  \"frameType\": %d,\n",
721                   frame_data.frame_type);
722   buf += snprintf(buf, MAX_BUFFER, "  \"baseQIndex\": %d,\n",
723                   frame_data.base_qindex);
724   buf += snprintf(buf, MAX_BUFFER, "  \"tileCols\": %d,\n",
725                   frame_data.tile_mi_cols);
726   buf += snprintf(buf, MAX_BUFFER, "  \"tileRows\": %d,\n",
727                   frame_data.tile_mi_rows);
728   buf += snprintf(buf, MAX_BUFFER, "  \"deltaQPresentFlag\": %d,\n",
729                   frame_data.delta_q_present_flag);
730   buf += snprintf(buf, MAX_BUFFER, "  \"deltaQRes\": %d,\n",
731                   frame_data.delta_q_res);
732   buf += put_str(buf, "  \"config\": {");
733   buf += put_map(buf, config_map);
734   buf += put_str(buf, "},\n");
735   buf += put_str(buf, "  \"configString\": \"");
736   buf += put_str_with_escape(buf, aom_codec_build_config());
737   buf += put_str(buf, "\"\n");
738   decoded_frame_count++;
739   buf += put_str(buf, "},\n");
740   *(buf++) = 0;
741   on_frame_decoded_dump(buffer);
742   aom_free(buffer);
743 }
744 
ifd_init_cb(void)745 void ifd_init_cb(void) {
746   aom_inspect_init ii;
747   ii.inspect_cb = inspect;
748   ii.inspect_ctx = NULL;
749   aom_codec_control(&codec, AV1_SET_INSPECTION_CALLBACK, &ii);
750 }
751 
752 EMSCRIPTEN_KEEPALIVE
open_file(char * file)753 int open_file(char *file) {
754   if (file == NULL) {
755     // The JS analyzer puts the .ivf file at this location.
756     file = "/tmp/input.ivf";
757   }
758   reader = aom_video_reader_open(file);
759   if (!reader) die("Failed to open %s for reading.", file);
760   info = aom_video_reader_get_info(reader);
761   aom_codec_iface_t *decoder = get_aom_decoder_by_fourcc(info->codec_fourcc);
762   if (!decoder) die("Unknown input codec.");
763   fprintf(stderr, "Using %s\n", aom_codec_iface_name(decoder));
764   if (aom_codec_dec_init(&codec, decoder, NULL, 0))
765     die("Failed to initialize decoder.");
766   ifd_init(&frame_data, info->frame_width, info->frame_height);
767   ifd_init_cb();
768   return EXIT_SUCCESS;
769 }
770 
771 Av1DecodeReturn adr;
772 int have_frame = 0;
773 const unsigned char *frame;
774 const unsigned char *end_frame;
775 size_t frame_size = 0;
776 
777 EMSCRIPTEN_KEEPALIVE
read_frame(void)778 int read_frame(void) {
779   img = NULL;
780 
781   // This loop skips over any frames that are show_existing_frames,  as
782   // there is nothing to analyze.
783   do {
784     if (!have_frame) {
785       if (!aom_video_reader_read_frame(reader)) return EXIT_FAILURE;
786       frame = aom_video_reader_get_frame(reader, &frame_size);
787 
788       have_frame = 1;
789       end_frame = frame + frame_size;
790     }
791 
792     if (aom_codec_decode(&codec, frame, (unsigned int)frame_size, &adr) !=
793         AOM_CODEC_OK) {
794       die_codec(&codec, "Failed to decode frame.");
795     }
796 
797     frame = adr.buf;
798     frame_size = end_frame - frame;
799     if (frame == end_frame) have_frame = 0;
800   } while (adr.show_existing);
801 
802   int got_any_frames = 0;
803   aom_image_t *frame_img;
804   struct av1_ref_frame ref_dec;
805   ref_dec.idx = adr.idx;
806 
807   // ref_dec.idx is the index to the reference buffer idx to AV1_GET_REFERENCE
808   // if its -1 the decoder didn't update any reference buffer and the only
809   // way to see the frame is aom_codec_get_frame.
810   if (ref_dec.idx == -1) {
811     aom_codec_iter_t iter = NULL;
812     img = frame_img = aom_codec_get_frame(&codec, &iter);
813     ++frame_count;
814     got_any_frames = 1;
815   } else if (!aom_codec_control(&codec, AV1_GET_REFERENCE, &ref_dec)) {
816     img = frame_img = &ref_dec.img;
817     ++frame_count;
818     got_any_frames = 1;
819   }
820   if (!got_any_frames) {
821     return EXIT_FAILURE;
822   }
823   return EXIT_SUCCESS;
824 }
825 
826 EMSCRIPTEN_KEEPALIVE
get_aom_codec_build_config(void)827 const char *get_aom_codec_build_config(void) {
828   return aom_codec_build_config();
829 }
830 
831 EMSCRIPTEN_KEEPALIVE
get_bit_depth(void)832 int get_bit_depth(void) { return img->bit_depth; }
833 
834 EMSCRIPTEN_KEEPALIVE
get_bits_per_sample(void)835 int get_bits_per_sample(void) { return img->bps; }
836 
837 EMSCRIPTEN_KEEPALIVE
get_image_format(void)838 int get_image_format(void) { return img->fmt; }
839 
840 EMSCRIPTEN_KEEPALIVE
get_plane(int plane)841 unsigned char *get_plane(int plane) { return img->planes[plane]; }
842 
843 EMSCRIPTEN_KEEPALIVE
get_plane_stride(int plane)844 int get_plane_stride(int plane) { return img->stride[plane]; }
845 
846 EMSCRIPTEN_KEEPALIVE
get_plane_width(int plane)847 int get_plane_width(int plane) { return aom_img_plane_width(img, plane); }
848 
849 EMSCRIPTEN_KEEPALIVE
get_plane_height(int plane)850 int get_plane_height(int plane) { return aom_img_plane_height(img, plane); }
851 
852 EMSCRIPTEN_KEEPALIVE
get_frame_width(void)853 int get_frame_width(void) { return info->frame_width; }
854 
855 EMSCRIPTEN_KEEPALIVE
get_frame_height(void)856 int get_frame_height(void) { return info->frame_height; }
857 
parse_args(char ** argv)858 static void parse_args(char **argv) {
859   char **argi, **argj;
860   struct arg arg;
861   (void)dump_accounting_arg;
862   (void)dump_cdef_arg;
863   for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
864     arg.argv_step = 1;
865     if (arg_match(&arg, &dump_block_size_arg, argi)) layers |= BLOCK_SIZE_LAYER;
866 #if CONFIG_ACCOUNTING
867     else if (arg_match(&arg, &dump_accounting_arg, argi))
868       layers |= ACCOUNTING_LAYER;
869 #endif
870     else if (arg_match(&arg, &dump_transform_size_arg, argi))
871       layers |= TRANSFORM_SIZE_LAYER;
872     else if (arg_match(&arg, &dump_transform_type_arg, argi))
873       layers |= TRANSFORM_TYPE_LAYER;
874     else if (arg_match(&arg, &dump_mode_arg, argi))
875       layers |= MODE_LAYER;
876     else if (arg_match(&arg, &dump_uv_mode_arg, argi))
877       layers |= UV_MODE_LAYER;
878     else if (arg_match(&arg, &dump_motion_mode_arg, argi))
879       layers |= MOTION_MODE_LAYER;
880     else if (arg_match(&arg, &dump_compound_type_arg, argi))
881       layers |= COMPOUND_TYPE_LAYER;
882     else if (arg_match(&arg, &dump_skip_arg, argi))
883       layers |= SKIP_LAYER;
884     else if (arg_match(&arg, &dump_filter_arg, argi))
885       layers |= FILTER_LAYER;
886     else if (arg_match(&arg, &dump_cdef_arg, argi))
887       layers |= CDEF_LAYER;
888     else if (arg_match(&arg, &dump_cfl_arg, argi))
889       layers |= CFL_LAYER;
890     else if (arg_match(&arg, &dump_reference_frame_arg, argi))
891       layers |= REFERENCE_FRAME_LAYER;
892     else if (arg_match(&arg, &dump_motion_vectors_arg, argi))
893       layers |= MOTION_VECTORS_LAYER;
894     else if (arg_match(&arg, &dump_dual_filter_type_arg, argi))
895       layers |= DUAL_FILTER_LAYER;
896     else if (arg_match(&arg, &dump_delta_q_arg, argi))
897       layers |= Q_INDEX_LAYER;
898     else if (arg_match(&arg, &dump_seg_id_arg, argi))
899       layers |= SEGMENT_ID_LAYER;
900     else if (arg_match(&arg, &dump_intrabc_arg, argi))
901       layers |= INTRABC_LAYER;
902     else if (arg_match(&arg, &dump_palette_arg, argi))
903       layers |= PALETTE_LAYER;
904     else if (arg_match(&arg, &dump_uv_palette_arg, argi))
905       layers |= UV_PALETTE_LAYER;
906     else if (arg_match(&arg, &dump_all_arg, argi))
907       layers |= ALL_LAYERS;
908     else if (arg_match(&arg, &compress_arg, argi))
909       compress = 1;
910     else if (arg_match(&arg, &usage_arg, argi))
911       usage_exit();
912     else if (arg_match(&arg, &limit_arg, argi))
913       stop_after = arg_parse_uint(&arg);
914     else if (arg_match(&arg, &skip_non_transform_arg, argi))
915       skip_non_transform = arg_parse_uint(&arg);
916     else if (arg_match(&arg, &combined_arg, argi))
917       convert_to_indices(
918           (char *)arg.val, combined_parm_list,
919           sizeof(combined_parm_list) / sizeof(combined_parm_list[0]),
920           &combined_parm_count);
921     else
922       argj++;
923   }
924 }
925 
926 static const char *exec_name;
927 
usage_exit(void)928 void usage_exit(void) {
929   fprintf(stderr, "Usage: %s src_filename <options>\n", exec_name);
930   fprintf(stderr, "\nOptions:\n");
931   arg_show_usage(stderr, main_args);
932   exit(EXIT_FAILURE);
933 }
934 
935 EMSCRIPTEN_KEEPALIVE
main(int argc,char ** argv)936 int main(int argc, char **argv) {
937   exec_name = argv[0];
938   parse_args(argv);
939   if (argc >= 2) {
940     open_file(argv[1]);
941     printf("[\n");
942     while (1) {
943       if (stop_after && (decoded_frame_count >= stop_after)) break;
944       if (read_frame()) break;
945     }
946     printf("null\n");
947     printf("]");
948   } else {
949     usage_exit();
950   }
951 }
952 
953 EMSCRIPTEN_KEEPALIVE
quit(void)954 void quit(void) {
955   if (aom_codec_destroy(&codec)) die_codec(&codec, "Failed to destroy codec");
956   aom_video_reader_close(reader);
957 }
958 
959 EMSCRIPTEN_KEEPALIVE
set_layers(LayerType v)960 void set_layers(LayerType v) { layers = v; }
961 
962 EMSCRIPTEN_KEEPALIVE
set_compress(int v)963 void set_compress(int v) { compress = v; }
964