/*
 * Copyright (c) 2011 Stefano Sabatini
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
20 
/**
 * @file
 * filter for showing textual audio frame information
 */
25 
26 #include <inttypes.h>
27 #include <stddef.h>
28 
29 #include "libavutil/adler32.h"
30 #include "libavutil/attributes.h"
31 #include "libavutil/channel_layout.h"
32 #include "libavutil/common.h"
33 #include "libavutil/downmix_info.h"
34 #include "libavutil/intreadwrite.h"
35 #include "libavutil/mem.h"
36 #include "libavutil/replaygain.h"
37 #include "libavutil/timestamp.h"
38 #include "libavutil/samplefmt.h"
39 
40 #include "libavcodec/defs.h"
41 
42 #include "audio.h"
43 #include "avfilter.h"
44 #include "internal.h"
45 
/**
 * Private state of the ashowinfo filter.
 */
typedef struct AShowInfoContext {
    /**
     * Scratch array holding one checksum per plane of the frame currently
     * being logged. It is (re)sized in filter_frame() and released in
     * uninit().
     */
    uint32_t *plane_checksums;
} AShowInfoContext;
52 
uninit(AVFilterContext * ctx)53 static av_cold void uninit(AVFilterContext *ctx)
54 {
55     AShowInfoContext *s = ctx->priv;
56     av_freep(&s->plane_checksums);
57 }
58 
/**
 * Log the matrix encoding stored in a side data entry.
 *
 * The text is written without a trailing newline. A payload smaller than
 * enum AVMatrixEncoding is reported as "invalid data". A value that matches
 * none of the cases below is reported as "unknown" at warning level; all
 * other output uses info level.
 *
 * @param ctx filter context used as the logging context
 * @param sd  side data entry whose payload is read as enum AVMatrixEncoding
 */
static void dump_matrixenc(AVFilterContext *ctx, AVFrameSideData *sd)
{
    const char *label;
    int level = AV_LOG_INFO;

    av_log(ctx, AV_LOG_INFO, "matrix encoding: ");

    if (sd->size < sizeof(enum AVMatrixEncoding)) {
        av_log(ctx, AV_LOG_INFO, "invalid data");
        return;
    }

    switch (*(enum AVMatrixEncoding *)sd->data) {
    case AV_MATRIX_ENCODING_NONE:
        label = "none";
        break;
    case AV_MATRIX_ENCODING_DOLBY:
        label = "Dolby Surround";
        break;
    case AV_MATRIX_ENCODING_DPLII:
        label = "Dolby Pro Logic II";
        break;
    case AV_MATRIX_ENCODING_DPLIIX:
        label = "Dolby Pro Logic IIx";
        break;
    case AV_MATRIX_ENCODING_DPLIIZ:
        label = "Dolby Pro Logic IIz";
        break;
    case AV_MATRIX_ENCODING_DOLBYEX:
        label = "Dolby EX";
        break;
    case AV_MATRIX_ENCODING_DOLBYHEADPHONE:
        label = "Dolby Headphone";
        break;
    default:
        /* Unrecognised values are the only case logged as a warning. */
        label = "unknown";
        level = AV_LOG_WARNING;
        break;
    }

    av_log(ctx, level, "%s", label);
}
82 
/**
 * Log the contents of a downmix-info side data entry.
 *
 * Prints the preferred downmix type followed by the five mix level fields
 * of AVDownmixInfo, all on one line without a trailing newline. A payload
 * smaller than AVDownmixInfo is reported as "invalid data". An unrecognised
 * downmix type is printed as "unknown" at warning level.
 *
 * @param ctx filter context used as the logging context
 * @param sd  side data entry whose payload is read as AVDownmixInfo
 */
static void dump_downmix(AVFilterContext *ctx, AVFrameSideData *sd)
{
    const AVDownmixInfo *info;
    const char *type_name;
    int type_level = AV_LOG_INFO;

    av_log(ctx, AV_LOG_INFO, "downmix: ");
    if (sd->size < sizeof(AVDownmixInfo)) {
        av_log(ctx, AV_LOG_INFO, "invalid data");
        return;
    }

    info = (const AVDownmixInfo *)sd->data;

    av_log(ctx, AV_LOG_INFO, "preferred downmix type - ");
    switch (info->preferred_downmix_type) {
    case AV_DOWNMIX_TYPE_LORO:
        type_name = "Lo/Ro";
        break;
    case AV_DOWNMIX_TYPE_LTRT:
        type_name = "Lt/Rt";
        break;
    case AV_DOWNMIX_TYPE_DPLII:
        type_name = "Dolby Pro Logic II";
        break;
    default:
        type_name  = "unknown";
        type_level = AV_LOG_WARNING;
        break;
    }
    av_log(ctx, type_level, "%s", type_name);

    av_log(ctx, AV_LOG_INFO,
           " Mix levels: center %f (%f ltrt) - "
           "surround %f (%f ltrt) - lfe %f",
           info->center_mix_level,   info->center_mix_level_ltrt,
           info->surround_mix_level, info->surround_mix_level_ltrt,
           info->lfe_mix_level);
}
109 
/**
 * Log one labelled gain value followed by ", ".
 *
 * INT32_MIN is printed as "unknown"; any other value is printed as
 * gain / 100000 using single-precision arithmetic.
 *
 * @param ctx  filter context used as the logging context
 * @param str  label printed in front of the value
 * @param gain raw gain value
 */
static void print_gain(AVFilterContext *ctx, const char *str, int32_t gain)
{
    const int is_known = gain != INT32_MIN;

    av_log(ctx, AV_LOG_INFO, "%s - ", str);
    if (is_known)
        av_log(ctx, AV_LOG_INFO, "%f", gain / 100000.0f);
    else
        av_log(ctx, AV_LOG_INFO, "unknown");
    av_log(ctx, AV_LOG_INFO, ", ");
}
119 
/**
 * Log one labelled peak value followed by ", ".
 *
 * Zero is printed as "unknown"; any other value is printed as
 * peak / UINT32_MAX using single-precision arithmetic.
 *
 * @param ctx  filter context used as the logging context
 * @param str  label printed in front of the value
 * @param peak raw peak value
 */
static void print_peak(AVFilterContext *ctx, const char *str, uint32_t peak)
{
    av_log(ctx, AV_LOG_INFO, "%s - ", str);
    if (peak != 0)
        av_log(ctx, AV_LOG_INFO, "%f", (float)peak / UINT32_MAX);
    else
        av_log(ctx, AV_LOG_INFO, "unknown");
    av_log(ctx, AV_LOG_INFO, ", ");
}
129 
/**
 * Log the contents of a ReplayGain side data entry.
 *
 * Prints track gain, track peak, album gain and album peak, in that order,
 * through print_gain() and print_peak(). A payload smaller than AVReplayGain
 * is reported as "invalid data".
 *
 * @param ctx filter context used as the logging context
 * @param sd  side data entry whose payload is read as AVReplayGain
 */
static void dump_replaygain(AVFilterContext *ctx, AVFrameSideData *sd)
{
    const AVReplayGain *gain_info;

    av_log(ctx, AV_LOG_INFO, "replaygain: ");

    if (sd->size < sizeof(AVReplayGain)) {
        av_log(ctx, AV_LOG_INFO, "invalid data");
        return;
    }

    gain_info = (const AVReplayGain *)sd->data;

    print_gain(ctx, "track gain", gain_info->track_gain);
    print_peak(ctx, "track peak", gain_info->track_peak);
    print_gain(ctx, "album gain", gain_info->album_gain);
    print_peak(ctx, "album peak", gain_info->album_peak);
}
146 
/**
 * Log the audio service type stored in a side data entry.
 *
 * The text is written at info level without a trailing newline. A payload
 * smaller than enum AVAudioServiceType is reported as "invalid data"; a
 * value that matches none of the cases below is reported as "unknown".
 *
 * @param ctx filter context used as the logging context
 * @param sd  side data entry whose payload is read as enum AVAudioServiceType
 */
static void dump_audio_service_type(AVFilterContext *ctx, AVFrameSideData *sd)
{
    const char *label;

    av_log(ctx, AV_LOG_INFO, "audio service type: ");

    if (sd->size < sizeof(enum AVAudioServiceType)) {
        av_log(ctx, AV_LOG_INFO, "invalid data");
        return;
    }

    switch (*(enum AVAudioServiceType *)sd->data) {
    case AV_AUDIO_SERVICE_TYPE_MAIN:
        label = "Main Audio Service";
        break;
    case AV_AUDIO_SERVICE_TYPE_EFFECTS:
        label = "Effects";
        break;
    case AV_AUDIO_SERVICE_TYPE_VISUALLY_IMPAIRED:
        label = "Visually Impaired";
        break;
    case AV_AUDIO_SERVICE_TYPE_HEARING_IMPAIRED:
        label = "Hearing Impaired";
        break;
    case AV_AUDIO_SERVICE_TYPE_DIALOGUE:
        label = "Dialogue";
        break;
    case AV_AUDIO_SERVICE_TYPE_COMMENTARY:
        label = "Commentary";
        break;
    case AV_AUDIO_SERVICE_TYPE_EMERGENCY:
        label = "Emergency";
        break;
    case AV_AUDIO_SERVICE_TYPE_VOICE_OVER:
        label = "Voice Over";
        break;
    case AV_AUDIO_SERVICE_TYPE_KARAOKE:
        label = "Karaoke";
        break;
    default:
        label = "unknown";
        break;
    }

    av_log(ctx, AV_LOG_INFO, "%s", label);
}
170 
/**
 * Log the numeric type and payload size of a side data entry that has no
 * dedicated dump function in this file.
 *
 * @param ctx filter context used as the logging context
 * @param sd  side data entry to describe
 */
static void dump_unknown(AVFilterContext *ctx, AVFrameSideData *sd)
{
    av_log(ctx, AV_LOG_INFO,
           "unknown side data type: %d, size %"SIZE_SPECIFIER" bytes",
           sd->type, sd->size);
}
176 
/**
 * Input pad callback: log a textual description of one audio frame, then
 * pass the frame on to the first output link.
 *
 * For each frame this logs, at info level:
 *  - the frame counter, pts, position, sample format, channel count,
 *    channel layout description, sample rate and sample count;
 *  - an Adler-32 checksum chained over all planes, plus one Adler-32
 *    checksum per plane;
 *  - one line per attached side data entry.
 *
 * @param inlink input link the frame arrived on
 * @param buf    the frame; it is forwarded with ff_filter_frame() on success
 *               and freed here if the scratch allocation fails
 * @return the result of ff_filter_frame(), or AVERROR(ENOMEM) if the
 *         checksum scratch array could not be (re)allocated
 */
static int filter_frame(AVFilterLink *inlink, AVFrame *buf)
{
    AVFilterContext *ctx = inlink->dst;
    AShowInfoContext *s  = ctx->priv;
#if FF_API_OLD_CHANNEL_LAYOUT
    AVChannelLayout layout = { 0 };
#endif
    /* Start out empty so the "%s" below never reads indeterminate bytes,
     * even if describing the layout fails. */
    char chlayout_str[128] = "";
    uint32_t checksum = 0;
    int channels    = inlink->ch_layout.nb_channels;
    int planar      = av_sample_fmt_is_planar(buf->format);
    int block_align = av_get_bytes_per_sample(buf->format) * (planar ? 1 : channels);
    int data_size   = buf->nb_samples * block_align;
    int planes      = planar ? channels : 1;
    int i;
    void *tmp_ptr = av_realloc_array(s->plane_checksums, channels, sizeof(*s->plane_checksums));

    if (!tmp_ptr) {
        /* This callback owns the frame; do not leak it on the error path. */
        av_frame_free(&buf);
        return AVERROR(ENOMEM);
    }
    s->plane_checksums = tmp_ptr;

    for (i = 0; i < planes; i++) {
        uint8_t *data = buf->extended_data[i];

        /* Per-plane checksum always starts from 0; the overall checksum is
         * seeded with plane 0's value and then chained over later planes. */
        s->plane_checksums[i] = av_adler32_update(0, data, data_size);
        checksum = i ? av_adler32_update(checksum, data, data_size) :
                       s->plane_checksums[0];
    }

#if FF_API_OLD_CHANNEL_LAYOUT
FF_DISABLE_DEPRECATION_WARNINGS
    /* Fall back to the deprecated mask only when the frame carries no
     * ch_layout. av_channel_layout_from_mask() returns 0 on success. */
    if (!buf->ch_layout.nb_channels &&
        !av_channel_layout_from_mask(&layout, buf->channel_layout)) {
        av_channel_layout_describe(&layout, chlayout_str, sizeof(chlayout_str));
FF_ENABLE_DEPRECATION_WARNINGS
    } else
#endif
    av_channel_layout_describe(&buf->ch_layout, chlayout_str, sizeof(chlayout_str));

    av_log(ctx, AV_LOG_INFO,
           "n:%"PRId64" pts:%s pts_time:%s pos:%"PRId64" "
           "fmt:%s channels:%d chlayout:%s rate:%d nb_samples:%d "
           "checksum:%08"PRIX32" ",
           inlink->frame_count_out,
           av_ts2str(buf->pts), av_ts2timestr(buf->pts, &inlink->time_base),
           buf->pkt_pos,
           av_get_sample_fmt_name(buf->format), buf->ch_layout.nb_channels, chlayout_str,
           buf->sample_rate, buf->nb_samples,
           checksum);

    av_log(ctx, AV_LOG_INFO, "plane_checksums: [ ");
    for (i = 0; i < planes; i++)
        av_log(ctx, AV_LOG_INFO, "%08"PRIX32" ", s->plane_checksums[i]);
    av_log(ctx, AV_LOG_INFO, "]\n");

    for (i = 0; i < buf->nb_side_data; i++) {
        AVFrameSideData *sd = buf->side_data[i];

        av_log(ctx, AV_LOG_INFO, "  side data - ");
        switch (sd->type) {
        case AV_FRAME_DATA_MATRIXENCODING: dump_matrixenc (ctx, sd); break;
        case AV_FRAME_DATA_DOWNMIX_INFO:   dump_downmix   (ctx, sd); break;
        case AV_FRAME_DATA_REPLAYGAIN:     dump_replaygain(ctx, sd); break;
        case AV_FRAME_DATA_AUDIO_SERVICE_TYPE: dump_audio_service_type(ctx, sd); break;
        default:                           dump_unknown   (ctx, sd); break;
        }

        /* The dump helpers do not terminate their line themselves. */
        av_log(ctx, AV_LOG_INFO, "\n");
    }

    return ff_filter_frame(inlink->dst->outputs[0], buf);
}
248 
249 static const AVFilterPad inputs[] = {
250     {
251         .name         = "default",
252         .type         = AVMEDIA_TYPE_AUDIO,
253         .filter_frame = filter_frame,
254     },
255 };
256 
257 static const AVFilterPad outputs[] = {
258     {
259         .name = "default",
260         .type = AVMEDIA_TYPE_AUDIO,
261     },
262 };
263 
264 const AVFilter ff_af_ashowinfo = {
265     .name        = "ashowinfo",
266     .description = NULL_IF_CONFIG_SMALL("Show textual information for each audio frame."),
267     .priv_size   = sizeof(AShowInfoContext),
268     .uninit      = uninit,
269     .flags       = AVFILTER_FLAG_METADATA_ONLY,
270     FILTER_INPUTS(inputs),
271     FILTER_OUTPUTS(outputs),
272 };
273