• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Realmedia RTSP protocol (RDT) support.
3  * Copyright (c) 2007 Ronald S. Bultje
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 /**
23  * @file
24  * @brief Realmedia RTSP protocol (RDT) support
25  * @author Ronald S. Bultje <rbultje@ronald.bitfreak.net>
26  */
27 
28 #include "avformat.h"
29 #include "libavutil/avstring.h"
30 #include "rtpdec.h"
31 #include "rdt.h"
32 #include "libavutil/base64.h"
33 #include "libavutil/md5.h"
34 #include "rm.h"
35 #include "internal.h"
36 #include "avio_internal.h"
37 #include "libavcodec/get_bits.h"
38 
39 struct RDTDemuxContext {
40     AVFormatContext *ic; /**< the containing (RTSP) demux context */
41     /** Each RDT stream-set (represented by one RTSPStream) can contain
42      * multiple streams (of the same content, but with possibly different
43      * codecs/bitrates). Each such stream is represented by one AVStream
44      * in the AVFormatContext, and this variable points to the offset in
45      * that array such that the first is the first stream of this set. */
46     AVStream **streams;
47     int n_streams; /**< streams with identical content in this set */
48     void *dynamic_protocol_context;
49     DynamicPayloadPacketHandlerProc parse_packet;
50     uint32_t prev_timestamp;
51     int prev_set_id, prev_stream_id;
52 };
53 
54 RDTDemuxContext *
ff_rdt_parse_open(AVFormatContext * ic,int first_stream_of_set_idx,void * priv_data,const RTPDynamicProtocolHandler * handler)55 ff_rdt_parse_open(AVFormatContext *ic, int first_stream_of_set_idx,
56                   void *priv_data, const RTPDynamicProtocolHandler *handler)
57 {
58     RDTDemuxContext *s = av_mallocz(sizeof(RDTDemuxContext));
59     if (!s)
60         return NULL;
61 
62     s->ic = ic;
63     s->streams = &ic->streams[first_stream_of_set_idx];
64     do {
65         s->n_streams++;
66     } while (first_stream_of_set_idx + s->n_streams < ic->nb_streams &&
67              s->streams[s->n_streams]->id == s->streams[0]->id);
68     s->prev_set_id    = -1;
69     s->prev_stream_id = -1;
70     s->prev_timestamp = -1;
71     s->parse_packet = handler ? handler->parse_packet : NULL;
72     s->dynamic_protocol_context = priv_data;
73 
74     return s;
75 }
76 
77 void
ff_rdt_parse_close(RDTDemuxContext * s)78 ff_rdt_parse_close(RDTDemuxContext *s)
79 {
80     av_free(s);
81 }
82 
83 struct PayloadContext {
84     AVFormatContext *rmctx;
85     int nb_rmst;
86     RMStream **rmst;
87     uint8_t *mlti_data;
88     unsigned int mlti_data_size;
89     char buffer[RTP_MAX_PACKET_LENGTH + AV_INPUT_BUFFER_PADDING_SIZE];
90     int audio_pkt_cnt; /**< remaining audio packets in rmdec */
91 };
92 
93 void
ff_rdt_calc_response_and_checksum(char response[41],char chksum[9],const char * challenge)94 ff_rdt_calc_response_and_checksum(char response[41], char chksum[9],
95                                   const char *challenge)
96 {
97     int ch_len = strlen (challenge), i;
98     unsigned char zres[16],
99         buf[64] = { 0xa1, 0xe9, 0x14, 0x9d, 0x0e, 0x6b, 0x3b, 0x59 };
100 #define XOR_TABLE_SIZE 37
101     static const unsigned char xor_table[XOR_TABLE_SIZE] = {
102         0x05, 0x18, 0x74, 0xd0, 0x0d, 0x09, 0x02, 0x53,
103         0xc0, 0x01, 0x05, 0x05, 0x67, 0x03, 0x19, 0x70,
104         0x08, 0x27, 0x66, 0x10, 0x10, 0x72, 0x08, 0x09,
105         0x63, 0x11, 0x03, 0x71, 0x08, 0x08, 0x70, 0x02,
106         0x10, 0x57, 0x05, 0x18, 0x54 };
107 
108     /* some (length) checks */
109     if (ch_len == 40) /* what a hack... */
110         ch_len = 32;
111     else if (ch_len > 56)
112         ch_len = 56;
113     memcpy(buf + 8, challenge, ch_len);
114 
115     /* xor challenge bytewise with xor_table */
116     for (i = 0; i < XOR_TABLE_SIZE; i++)
117         buf[8 + i] ^= xor_table[i];
118 
119     av_md5_sum(zres, buf, 64);
120     ff_data_to_hex(response, zres, 16, 1);
121 
122     /* add tail */
123     strcpy (response + 32, "01d0a8e3");
124 
125     /* calculate checksum */
126     for (i = 0; i < 8; i++)
127         chksum[i] = response[i * 4];
128     chksum[8] = 0;
129 }
130 
131 static int
rdt_load_mdpr(PayloadContext * rdt,AVStream * st,int rule_nr)132 rdt_load_mdpr (PayloadContext *rdt, AVStream *st, int rule_nr)
133 {
134     FFIOContext pb0;
135     AVIOContext *const pb = &pb0.pub;
136     unsigned int size;
137     uint32_t tag;
138 
139     /**
140      * Layout of the MLTI chunk:
141      * 4: MLTI
142      * 2: number of streams
143      * Then for each stream ([number_of_streams] times):
144      *     2: mdpr index
145      * 2: number of mdpr chunks
146      * Then for each mdpr chunk ([number_of_mdpr_chunks] times):
147      *     4: size
148      *     [size]: data
149      * we skip MDPR chunks until we reach the one of the stream
150      * we're interested in, and forward that ([size]+[data]) to
151      * the RM demuxer to parse the stream-specific header data.
152      */
153     if (!rdt->mlti_data)
154         return -1;
155     ffio_init_context(&pb0, rdt->mlti_data, rdt->mlti_data_size, 0,
156                   NULL, NULL, NULL, NULL);
157     tag = avio_rl32(pb);
158     if (tag == MKTAG('M', 'L', 'T', 'I')) {
159         int num, chunk_nr;
160 
161         /* read index of MDPR chunk numbers */
162         num = avio_rb16(pb);
163         if (rule_nr < 0 || rule_nr >= num)
164             return -1;
165         avio_skip(pb, rule_nr * 2);
166         chunk_nr = avio_rb16(pb);
167         avio_skip(pb, (num - 1 - rule_nr) * 2);
168 
169         /* read MDPR chunks */
170         num = avio_rb16(pb);
171         if (chunk_nr >= num)
172             return -1;
173         while (chunk_nr--)
174             avio_skip(pb, avio_rb32(pb));
175         size = avio_rb32(pb);
176     } else {
177         size = rdt->mlti_data_size;
178         avio_seek(pb, 0, SEEK_SET);
179     }
180     if (ff_rm_read_mdpr_codecdata(rdt->rmctx, pb, st, rdt->rmst[st->index], size, NULL) < 0)
181         return -1;
182 
183     return 0;
184 }
185 
186 /**
187  * Actual data handling.
188  */
189 
190 int
ff_rdt_parse_header(const uint8_t * buf,int len,int * pset_id,int * pseq_no,int * pstream_id,int * pis_keyframe,uint32_t * ptimestamp)191 ff_rdt_parse_header(const uint8_t *buf, int len,
192                     int *pset_id, int *pseq_no, int *pstream_id,
193                     int *pis_keyframe, uint32_t *ptimestamp)
194 {
195     GetBitContext gb;
196     int consumed = 0, set_id, seq_no, stream_id, is_keyframe,
197         len_included, need_reliable;
198     uint32_t timestamp;
199 
200     /* skip status packets */
201     while (len >= 5 && buf[1] == 0xFF /* status packet */) {
202         int pkt_len;
203 
204         if (!(buf[0] & 0x80))
205             return -1; /* not followed by a data packet */
206 
207         pkt_len = AV_RB16(buf+3);
208         buf += pkt_len;
209         len -= pkt_len;
210         consumed += pkt_len;
211     }
212     if (len < 16)
213         return -1;
214     /**
215      * Layout of the header (in bits):
216      * 1:  len_included
217      *     Flag indicating whether this header includes a length field;
218      *     this can be used to concatenate multiple RDT packets in a
219      *     single UDP/TCP data frame and is used to precede RDT data
220      *     by stream status packets
221      * 1:  need_reliable
222      *     Flag indicating whether this header includes a "reliable
223      *     sequence number"; these are apparently sequence numbers of
224      *     data packets alone. For data packets, this flag is always
225      *     set, according to the Real documentation [1]
226      * 5:  set_id
227      *     ID of a set of streams of identical content, possibly with
228      *     different codecs or bitrates
229      * 1:  is_reliable
230      *     Flag set for certain streams deemed less tolerable for packet
231      *     loss
232      * 16: seq_no
233      *     Packet sequence number; if >=0xFF00, this is a non-data packet
234      *     containing stream status info, the second byte indicates the
235      *     type of status packet (see wireshark docs / source code [2])
236      * if (len_included) {
237      *     16: packet_len
238      * } else {
239      *     packet_len = remainder of UDP/TCP frame
240      * }
241      * 1:  is_back_to_back
242      *     Back-to-Back flag; used for timing, set for one in every 10
243      *     packets, according to the Real documentation [1]
244      * 1:  is_slow_data
245      *     Slow-data flag; currently unused, according to Real docs [1]
246      * 5:  stream_id
247      *     ID of the stream within this particular set of streams
248      * 1:  is_no_keyframe
249      *     Non-keyframe flag (unset if packet belongs to a keyframe)
250      * 32: timestamp (PTS)
251      * if (set_id == 0x1F) {
252      *     16: set_id (extended set-of-streams ID; see set_id)
253      * }
254      * if (need_reliable) {
255      *     16: reliable_seq_no
256      *         Reliable sequence number (see need_reliable)
257      * }
258      * if (stream_id == 0x3F) {
259      *     16: stream_id (extended stream ID; see stream_id)
260      * }
261      * [1] https://protocol.helixcommunity.org/files/2005/devdocs/RDT_Feature_Level_20.txt
262      * [2] http://www.wireshark.org/docs/dfref/r/rdt.html and
263      *     http://anonsvn.wireshark.org/viewvc/trunk/epan/dissectors/packet-rdt.c
264      */
265     init_get_bits(&gb, buf, len << 3);
266     len_included  = get_bits1(&gb);
267     need_reliable = get_bits1(&gb);
268     set_id        = get_bits(&gb, 5);
269     skip_bits(&gb, 1);
270     seq_no        = get_bits(&gb, 16);
271     if (len_included)
272         skip_bits(&gb, 16);
273     skip_bits(&gb, 2);
274     stream_id     = get_bits(&gb, 5);
275     is_keyframe   = !get_bits1(&gb);
276     timestamp     = get_bits_long(&gb, 32);
277     if (set_id == 0x1f)
278         set_id    = get_bits(&gb, 16);
279     if (need_reliable)
280         skip_bits(&gb, 16);
281     if (stream_id == 0x1f)
282         stream_id = get_bits(&gb, 16);
283 
284     if (pset_id)      *pset_id      = set_id;
285     if (pseq_no)      *pseq_no      = seq_no;
286     if (pstream_id)   *pstream_id   = stream_id;
287     if (pis_keyframe) *pis_keyframe = is_keyframe;
288     if (ptimestamp)   *ptimestamp   = timestamp;
289 
290     return consumed + (get_bits_count(&gb) >> 3);
291 }
292 
293 /**< return 0 on packet, no more left, 1 on packet, 1 on partial packet... */
294 static int
rdt_parse_packet(AVFormatContext * ctx,PayloadContext * rdt,AVStream * st,AVPacket * pkt,uint32_t * timestamp,const uint8_t * buf,int len,uint16_t rtp_seq,int flags)295 rdt_parse_packet (AVFormatContext *ctx, PayloadContext *rdt, AVStream *st,
296                   AVPacket *pkt, uint32_t *timestamp,
297                   const uint8_t *buf, int len, uint16_t rtp_seq, int flags)
298 {
299     int seq = 1, res;
300 
301     if (rdt->audio_pkt_cnt == 0) {
302         FFIOContext pb;
303         int pos, rmflags;
304 
305         ffio_init_context(&pb, (uint8_t *)buf, len, 0, NULL, NULL, NULL, NULL);
306         rmflags = (flags & RTP_FLAG_KEY) ? 2 : 0;
307         res = ff_rm_parse_packet(rdt->rmctx, &pb.pub, st, rdt->rmst[st->index],
308                                  len, pkt, &seq, rmflags, *timestamp);
309         pos = avio_tell(&pb.pub);
310         if (res < 0)
311             return res;
312         if (res > 0) {
313             if (st->codecpar->codec_id == AV_CODEC_ID_AAC) {
314                 memcpy (rdt->buffer, buf + pos, len - pos);
315                 rdt->rmctx->pb = avio_alloc_context (rdt->buffer, len - pos, 0,
316                                                     NULL, NULL, NULL, NULL);
317             }
318             goto get_cache;
319         }
320     } else {
321 get_cache:
322         rdt->audio_pkt_cnt =
323             ff_rm_retrieve_cache (rdt->rmctx, rdt->rmctx->pb,
324                                   st, rdt->rmst[st->index], pkt);
325         if (rdt->audio_pkt_cnt == 0 &&
326             st->codecpar->codec_id == AV_CODEC_ID_AAC)
327             avio_context_free(&rdt->rmctx->pb);
328     }
329     pkt->stream_index = st->index;
330     pkt->pts = *timestamp;
331 
332     return rdt->audio_pkt_cnt > 0;
333 }
334 
335 int
ff_rdt_parse_packet(RDTDemuxContext * s,AVPacket * pkt,uint8_t ** bufptr,int len)336 ff_rdt_parse_packet(RDTDemuxContext *s, AVPacket *pkt,
337                     uint8_t **bufptr, int len)
338 {
339     uint8_t *buf = bufptr ? *bufptr : NULL;
340     int seq_no, flags = 0, stream_id, set_id, is_keyframe;
341     uint32_t timestamp;
342     int rv= 0;
343 
344     if (!s->parse_packet)
345         return -1;
346 
347     if (!buf && s->prev_stream_id != -1) {
348         /* return the next packets, if any */
349         timestamp= 0; ///< Should not be used if buf is NULL, but should be set to the timestamp of the packet returned....
350         rv= s->parse_packet(s->ic, s->dynamic_protocol_context,
351                             s->streams[s->prev_stream_id],
352                             pkt, &timestamp, NULL, 0, 0, flags);
353         return rv;
354     }
355 
356     if (len < 12)
357         return -1;
358     rv = ff_rdt_parse_header(buf, len, &set_id, &seq_no, &stream_id, &is_keyframe, &timestamp);
359     if (rv < 0)
360         return rv;
361     if (is_keyframe &&
362         (set_id != s->prev_set_id || timestamp != s->prev_timestamp ||
363          stream_id != s->prev_stream_id)) {
364         flags |= RTP_FLAG_KEY;
365         s->prev_set_id    = set_id;
366         s->prev_timestamp = timestamp;
367     }
368     s->prev_stream_id = stream_id;
369     buf += rv;
370     len -= rv;
371 
372      if (s->prev_stream_id >= s->n_streams) {
373          s->prev_stream_id = -1;
374          return -1;
375      }
376 
377     rv = s->parse_packet(s->ic, s->dynamic_protocol_context,
378                          s->streams[s->prev_stream_id],
379                          pkt, &timestamp, buf, len, 0, flags);
380 
381     return rv;
382 }
383 
384 void
ff_rdt_subscribe_rule(char * cmd,int size,int stream_nr,int rule_nr)385 ff_rdt_subscribe_rule (char *cmd, int size,
386                        int stream_nr, int rule_nr)
387 {
388     av_strlcatf(cmd, size, "stream=%d;rule=%d,stream=%d;rule=%d",
389                 stream_nr, rule_nr * 2, stream_nr, rule_nr * 2 + 1);
390 }
391 
392 static unsigned char *
rdt_parse_b64buf(unsigned int * target_len,const char * p)393 rdt_parse_b64buf (unsigned int *target_len, const char *p)
394 {
395     unsigned char *target;
396     int len = strlen(p);
397     if (*p == '\"') {
398         p++;
399         len -= 2; /* skip embracing " at start/end */
400     }
401     *target_len = len * 3 / 4;
402     target = av_mallocz(*target_len + AV_INPUT_BUFFER_PADDING_SIZE);
403     if (!target)
404         return NULL;
405     av_base64_decode(target, p, *target_len);
406     return target;
407 }
408 
409 static int
rdt_parse_sdp_line(AVFormatContext * s,int st_index,PayloadContext * rdt,const char * line)410 rdt_parse_sdp_line (AVFormatContext *s, int st_index,
411                     PayloadContext *rdt, const char *line)
412 {
413     AVStream *stream = s->streams[st_index];
414     const char *p = line;
415 
416     if (av_strstart(p, "OpaqueData:buffer;", &p)) {
417         rdt->mlti_data = rdt_parse_b64buf(&rdt->mlti_data_size, p);
418     } else if (av_strstart(p, "StartTime:integer;", &p))
419         ffstream(stream)->first_dts = atoi(p);
420     else if (av_strstart(p, "ASMRuleBook:string;", &p)) {
421         int n, first = -1;
422 
423         for (n = 0; n < s->nb_streams; n++)
424             if (s->streams[n]->id == stream->id) {
425                 int count = s->streams[n]->index + 1, err;
426                 if (first == -1) first = n;
427                 if (rdt->nb_rmst < count) {
428                     if ((err = av_reallocp(&rdt->rmst,
429                                            count * sizeof(*rdt->rmst))) < 0) {
430                         rdt->nb_rmst = 0;
431                         return err;
432                     }
433                     memset(rdt->rmst + rdt->nb_rmst, 0,
434                            (count - rdt->nb_rmst) * sizeof(*rdt->rmst));
435                     rdt->nb_rmst = count;
436                 }
437                 rdt->rmst[s->streams[n]->index] = ff_rm_alloc_rmstream();
438                 if (!rdt->rmst[s->streams[n]->index])
439                     return AVERROR(ENOMEM);
440                 rdt_load_mdpr(rdt, s->streams[n], (n - first) * 2);
441            }
442     }
443 
444     return 0;
445 }
446 
447 static void
real_parse_asm_rule(AVStream * st,const char * p,const char * end)448 real_parse_asm_rule(AVStream *st, const char *p, const char *end)
449 {
450     do {
451         /* can be either averagebandwidth= or AverageBandwidth= */
452         if (sscanf(p, " %*1[Aa]verage%*1[Bb]andwidth=%"SCNd64, &st->codecpar->bit_rate) == 1)
453             break;
454         if (!(p = strchr(p, ',')) || p > end)
455             p = end;
456         p++;
457     } while (p < end);
458 }
459 
460 static AVStream *
add_dstream(AVFormatContext * s,AVStream * orig_st)461 add_dstream(AVFormatContext *s, AVStream *orig_st)
462 {
463     AVStream *st;
464 
465     if (!(st = avformat_new_stream(s, NULL)))
466         return NULL;
467     st->id = orig_st->id;
468     st->codecpar->codec_type = orig_st->codecpar->codec_type;
469     ffstream(st)->first_dts  = ffstream(orig_st)->first_dts;
470 
471     return st;
472 }
473 
474 static void
real_parse_asm_rulebook(AVFormatContext * s,AVStream * orig_st,const char * p)475 real_parse_asm_rulebook(AVFormatContext *s, AVStream *orig_st,
476                         const char *p)
477 {
478     const char *end;
479     int n_rules = 0, odd = 0;
480     AVStream *st;
481 
482     /**
483      * The ASMRuleBook contains a list of comma-separated strings per rule,
484      * and each rule is separated by a ;. The last one also has a ; at the
485      * end so we can use it as delimiter.
486      * Every rule occurs twice, once for when the RTSP packet header marker
487      * is set and once for if it isn't. We only read the first because we
488      * don't care much (that's what the "odd" variable is for).
489      * Each rule contains a set of one or more statements, optionally
490      * preceded by a single condition. If there's a condition, the rule
491      * starts with a '#'. Multiple conditions are merged between brackets,
492      * so there are never multiple conditions spread out over separate
493      * statements. Generally, these conditions are bitrate limits (min/max)
494      * for multi-bitrate streams.
495      */
496     if (*p == '\"') p++;
497     while (1) {
498         if (!(end = strchr(p, ';')))
499             break;
500         if (!odd && end != p) {
501             if (n_rules > 0)
502                 st = add_dstream(s, orig_st);
503             else
504                 st = orig_st;
505             if (!st)
506                 break;
507             real_parse_asm_rule(st, p, end);
508             n_rules++;
509         }
510         p = end + 1;
511         odd ^= 1;
512     }
513 }
514 
515 void
ff_real_parse_sdp_a_line(AVFormatContext * s,int stream_index,const char * line)516 ff_real_parse_sdp_a_line (AVFormatContext *s, int stream_index,
517                           const char *line)
518 {
519     const char *p = line;
520 
521     if (av_strstart(p, "ASMRuleBook:string;", &p))
522         real_parse_asm_rulebook(s, s->streams[stream_index], p);
523 }
524 
525 
526 
rdt_init(AVFormatContext * s,int st_index,PayloadContext * rdt)527 static av_cold int rdt_init(AVFormatContext *s, int st_index, PayloadContext *rdt)
528 {
529     int ret;
530 
531     rdt->rmctx = avformat_alloc_context();
532     if (!rdt->rmctx)
533         return AVERROR(ENOMEM);
534 
535     if ((ret = ff_copy_whiteblacklists(rdt->rmctx, s)) < 0)
536         return ret;
537 
538     return avformat_open_input(&rdt->rmctx, "", &ff_rdt_demuxer, NULL);
539 }
540 
541 static void
rdt_close_context(PayloadContext * rdt)542 rdt_close_context (PayloadContext *rdt)
543 {
544     int i;
545 
546     for (i = 0; i < rdt->nb_rmst; i++)
547         if (rdt->rmst[i]) {
548             ff_rm_free_rmstream(rdt->rmst[i]);
549             av_freep(&rdt->rmst[i]);
550         }
551     if (rdt->rmctx)
552         avformat_close_input(&rdt->rmctx);
553     av_freep(&rdt->mlti_data);
554     av_freep(&rdt->rmst);
555 }
556 
557 #define RDT_HANDLER(n, s, t) \
558 const RTPDynamicProtocolHandler ff_rdt_ ## n ## _handler = { \
559     .enc_name         = s, \
560     .codec_type       = t, \
561     .codec_id         = AV_CODEC_ID_NONE, \
562     .priv_data_size   = sizeof(PayloadContext), \
563     .init             = rdt_init, \
564     .parse_sdp_a_line = rdt_parse_sdp_line, \
565     .close            = rdt_close_context, \
566     .parse_packet     = rdt_parse_packet \
567 }
568 
569 RDT_HANDLER(live_video, "x-pn-multirate-realvideo-live", AVMEDIA_TYPE_VIDEO);
570 RDT_HANDLER(live_audio, "x-pn-multirate-realaudio-live", AVMEDIA_TYPE_AUDIO);
571 RDT_HANDLER(video,      "x-pn-realvideo",                AVMEDIA_TYPE_VIDEO);
572 RDT_HANDLER(audio,      "x-pn-realaudio",                AVMEDIA_TYPE_AUDIO);
573 
574