1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * RTP AMR Depacketizer, RFC 3267
3cabdff1aSopenharmony_ci * Copyright (c) 2010 Martin Storsjo
4cabdff1aSopenharmony_ci *
5cabdff1aSopenharmony_ci * This file is part of FFmpeg.
6cabdff1aSopenharmony_ci *
7cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
8cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
9cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
10cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
11cabdff1aSopenharmony_ci *
12cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
13cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
14cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15cabdff1aSopenharmony_ci * Lesser General Public License for more details.
16cabdff1aSopenharmony_ci *
17cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
18cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
19cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20cabdff1aSopenharmony_ci */
21cabdff1aSopenharmony_ci
22cabdff1aSopenharmony_ci#include "libavutil/channel_layout.h"
23cabdff1aSopenharmony_ci#include "avformat.h"
24cabdff1aSopenharmony_ci#include "rtpdec_formats.h"
25cabdff1aSopenharmony_ci#include "libavutil/avstring.h"
26cabdff1aSopenharmony_ci
/*
 * Number of speech-data bytes carried by one narrowband AMR frame,
 * indexed by the 4-bit frame type found in bits 3..6 of the frame's
 * TOC byte. The TOC byte itself is not counted. A size of 0 means that
 * no speech bytes are consumed for that frame type.
 */
static const uint8_t frame_sizes_nb[16] = {
    /* frame types  0 ..  7 */ 12, 13, 15, 17, 19, 20, 26, 31,
    /* frame types  8 .. 15 */  5,  0,  0,  0,  0,  0,  0,  0,
};
/*
 * Number of speech-data bytes carried by one wideband AMR frame,
 * indexed by the 4-bit frame type found in bits 3..6 of the frame's
 * TOC byte. The TOC byte itself is not counted. A size of 0 means that
 * no speech bytes are consumed for that frame type.
 */
static const uint8_t frame_sizes_wb[16] = {
    /* frame types  0 ..  7 */ 17, 23, 32, 36, 40, 46, 50, 58,
    /* frame types  8 .. 15 */ 60,  5,  5,  0,  0,  0,  0,  0,
};
33cabdff1aSopenharmony_ci
/*
 * Per-stream depacketizer state. Every field mirrors one attribute of
 * the SDP fmtp line; the SDP line parser in this file accepts only
 * octet_align != 0, crc == 0, interleaving == 0 and channels == 1.
 */
struct PayloadContext {
    int octet_align;    /* value of the "octet-align" fmtp attribute */
    int crc;            /* value of the "crc" fmtp attribute */
    int interleaving;   /* value of the "interleaving" fmtp attribute */
    int channels;       /* value of the "channels" fmtp attribute; set to 1 on init */
};
40cabdff1aSopenharmony_ci
41cabdff1aSopenharmony_cistatic av_cold int amr_init(AVFormatContext *s, int st_index, PayloadContext *data)
42cabdff1aSopenharmony_ci{
43cabdff1aSopenharmony_ci    data->channels = 1;
44cabdff1aSopenharmony_ci    return 0;
45cabdff1aSopenharmony_ci}
46cabdff1aSopenharmony_ci
47cabdff1aSopenharmony_cistatic int amr_handle_packet(AVFormatContext *ctx, PayloadContext *data,
48cabdff1aSopenharmony_ci                             AVStream *st, AVPacket *pkt, uint32_t *timestamp,
49cabdff1aSopenharmony_ci                             const uint8_t *buf, int len, uint16_t seq,
50cabdff1aSopenharmony_ci                             int flags)
51cabdff1aSopenharmony_ci{
52cabdff1aSopenharmony_ci    const uint8_t *frame_sizes = NULL;
53cabdff1aSopenharmony_ci    int frames;
54cabdff1aSopenharmony_ci    int i, ret;
55cabdff1aSopenharmony_ci    const uint8_t *speech_data;
56cabdff1aSopenharmony_ci    uint8_t *ptr;
57cabdff1aSopenharmony_ci
58cabdff1aSopenharmony_ci    if (st->codecpar->codec_id == AV_CODEC_ID_AMR_NB) {
59cabdff1aSopenharmony_ci        frame_sizes = frame_sizes_nb;
60cabdff1aSopenharmony_ci    } else if (st->codecpar->codec_id == AV_CODEC_ID_AMR_WB) {
61cabdff1aSopenharmony_ci        frame_sizes = frame_sizes_wb;
62cabdff1aSopenharmony_ci    } else {
63cabdff1aSopenharmony_ci        av_log(ctx, AV_LOG_ERROR, "Bad codec ID\n");
64cabdff1aSopenharmony_ci        return AVERROR_INVALIDDATA;
65cabdff1aSopenharmony_ci    }
66cabdff1aSopenharmony_ci
67cabdff1aSopenharmony_ci    if (st->codecpar->ch_layout.nb_channels != 1) {
68cabdff1aSopenharmony_ci        av_log(ctx, AV_LOG_ERROR, "Only mono AMR is supported\n");
69cabdff1aSopenharmony_ci        return AVERROR_INVALIDDATA;
70cabdff1aSopenharmony_ci    }
71cabdff1aSopenharmony_ci    av_channel_layout_default(&st->codecpar->ch_layout, 1);
72cabdff1aSopenharmony_ci
73cabdff1aSopenharmony_ci    /* The AMR RTP packet consists of one header byte, followed
74cabdff1aSopenharmony_ci     * by one TOC byte for each AMR frame in the packet, followed
75cabdff1aSopenharmony_ci     * by the speech data for all the AMR frames.
76cabdff1aSopenharmony_ci     *
77cabdff1aSopenharmony_ci     * The header byte contains only a codec mode request, for
78cabdff1aSopenharmony_ci     * requesting what kind of AMR data the sender wants to
79cabdff1aSopenharmony_ci     * receive. Not used at the moment.
80cabdff1aSopenharmony_ci     */
81cabdff1aSopenharmony_ci
82cabdff1aSopenharmony_ci    /* Count the number of frames in the packet. The highest bit
83cabdff1aSopenharmony_ci     * is set in a TOC byte if there are more frames following.
84cabdff1aSopenharmony_ci     */
85cabdff1aSopenharmony_ci    for (frames = 1; frames < len && (buf[frames] & 0x80); frames++) ;
86cabdff1aSopenharmony_ci
87cabdff1aSopenharmony_ci    if (1 + frames >= len) {
88cabdff1aSopenharmony_ci        /* We hit the end of the packet while counting frames. */
89cabdff1aSopenharmony_ci        av_log(ctx, AV_LOG_ERROR, "No speech data found\n");
90cabdff1aSopenharmony_ci        return AVERROR_INVALIDDATA;
91cabdff1aSopenharmony_ci    }
92cabdff1aSopenharmony_ci
93cabdff1aSopenharmony_ci    speech_data = buf + 1 + frames;
94cabdff1aSopenharmony_ci
95cabdff1aSopenharmony_ci    /* Everything except the codec mode request byte should be output. */
96cabdff1aSopenharmony_ci    if ((ret = av_new_packet(pkt, len - 1)) < 0) {
97cabdff1aSopenharmony_ci        av_log(ctx, AV_LOG_ERROR, "Out of memory\n");
98cabdff1aSopenharmony_ci        return ret;
99cabdff1aSopenharmony_ci    }
100cabdff1aSopenharmony_ci    pkt->stream_index = st->index;
101cabdff1aSopenharmony_ci    ptr = pkt->data;
102cabdff1aSopenharmony_ci
103cabdff1aSopenharmony_ci    for (i = 0; i < frames; i++) {
104cabdff1aSopenharmony_ci        uint8_t toc = buf[1 + i];
105cabdff1aSopenharmony_ci        int frame_size = frame_sizes[(toc >> 3) & 0x0f];
106cabdff1aSopenharmony_ci
107cabdff1aSopenharmony_ci        if (speech_data + frame_size > buf + len) {
108cabdff1aSopenharmony_ci            /* Too little speech data */
109cabdff1aSopenharmony_ci            av_log(ctx, AV_LOG_WARNING, "Too little speech data in the RTP packet\n");
110cabdff1aSopenharmony_ci            /* Set the unwritten part of the packet to zero. */
111cabdff1aSopenharmony_ci            memset(ptr, 0, pkt->data + pkt->size - ptr);
112cabdff1aSopenharmony_ci            pkt->size = ptr - pkt->data;
113cabdff1aSopenharmony_ci            return 0;
114cabdff1aSopenharmony_ci        }
115cabdff1aSopenharmony_ci
116cabdff1aSopenharmony_ci        /* Extract the AMR frame mode from the TOC byte */
117cabdff1aSopenharmony_ci        *ptr++ = toc & 0x7C;
118cabdff1aSopenharmony_ci
119cabdff1aSopenharmony_ci        /* Copy the speech data */
120cabdff1aSopenharmony_ci        memcpy(ptr, speech_data, frame_size);
121cabdff1aSopenharmony_ci        speech_data += frame_size;
122cabdff1aSopenharmony_ci        ptr += frame_size;
123cabdff1aSopenharmony_ci    }
124cabdff1aSopenharmony_ci
125cabdff1aSopenharmony_ci    if (speech_data < buf + len) {
126cabdff1aSopenharmony_ci        av_log(ctx, AV_LOG_WARNING, "Too much speech data in the RTP packet?\n");
127cabdff1aSopenharmony_ci        /* Set the unwritten part of the packet to zero. */
128cabdff1aSopenharmony_ci        memset(ptr, 0, pkt->data + pkt->size - ptr);
129cabdff1aSopenharmony_ci        pkt->size = ptr - pkt->data;
130cabdff1aSopenharmony_ci    }
131cabdff1aSopenharmony_ci
132cabdff1aSopenharmony_ci    return 0;
133cabdff1aSopenharmony_ci}
134cabdff1aSopenharmony_ci
135cabdff1aSopenharmony_cistatic int amr_parse_fmtp(AVFormatContext *s,
136cabdff1aSopenharmony_ci                          AVStream *stream, PayloadContext *data,
137cabdff1aSopenharmony_ci                          const char *attr, const char *value)
138cabdff1aSopenharmony_ci{
139cabdff1aSopenharmony_ci    /* Some AMR SDP configurations contain "octet-align", without
140cabdff1aSopenharmony_ci     * the trailing =1. Therefore, if the value is empty,
141cabdff1aSopenharmony_ci     * interpret it as "1".
142cabdff1aSopenharmony_ci     */
143cabdff1aSopenharmony_ci    if (!strcmp(value, "")) {
144cabdff1aSopenharmony_ci        av_log(s, AV_LOG_WARNING, "AMR fmtp attribute %s had "
145cabdff1aSopenharmony_ci                                  "nonstandard empty value\n", attr);
146cabdff1aSopenharmony_ci        value = "1";
147cabdff1aSopenharmony_ci    }
148cabdff1aSopenharmony_ci    if (!strcmp(attr, "octet-align"))
149cabdff1aSopenharmony_ci        data->octet_align = atoi(value);
150cabdff1aSopenharmony_ci    else if (!strcmp(attr, "crc"))
151cabdff1aSopenharmony_ci        data->crc = atoi(value);
152cabdff1aSopenharmony_ci    else if (!strcmp(attr, "interleaving"))
153cabdff1aSopenharmony_ci        data->interleaving = atoi(value);
154cabdff1aSopenharmony_ci    else if (!strcmp(attr, "channels"))
155cabdff1aSopenharmony_ci        data->channels = atoi(value);
156cabdff1aSopenharmony_ci    return 0;
157cabdff1aSopenharmony_ci}
158cabdff1aSopenharmony_ci
159cabdff1aSopenharmony_cistatic int amr_parse_sdp_line(AVFormatContext *s, int st_index,
160cabdff1aSopenharmony_ci                              PayloadContext *data, const char *line)
161cabdff1aSopenharmony_ci{
162cabdff1aSopenharmony_ci    const char *p;
163cabdff1aSopenharmony_ci    int ret;
164cabdff1aSopenharmony_ci
165cabdff1aSopenharmony_ci    if (st_index < 0)
166cabdff1aSopenharmony_ci        return 0;
167cabdff1aSopenharmony_ci
168cabdff1aSopenharmony_ci    /* Parse an fmtp line this one:
169cabdff1aSopenharmony_ci     * a=fmtp:97 octet-align=1; interleaving=0
170cabdff1aSopenharmony_ci     * That is, a normal fmtp: line followed by semicolon & space
171cabdff1aSopenharmony_ci     * separated key/value pairs.
172cabdff1aSopenharmony_ci     */
173cabdff1aSopenharmony_ci    if (av_strstart(line, "fmtp:", &p)) {
174cabdff1aSopenharmony_ci        ret = ff_parse_fmtp(s, s->streams[st_index], data, p, amr_parse_fmtp);
175cabdff1aSopenharmony_ci        if (!data->octet_align || data->crc ||
176cabdff1aSopenharmony_ci            data->interleaving || data->channels != 1) {
177cabdff1aSopenharmony_ci            av_log(s, AV_LOG_ERROR, "Unsupported RTP/AMR configuration!\n");
178cabdff1aSopenharmony_ci            return -1;
179cabdff1aSopenharmony_ci        }
180cabdff1aSopenharmony_ci        return ret;
181cabdff1aSopenharmony_ci    }
182cabdff1aSopenharmony_ci    return 0;
183cabdff1aSopenharmony_ci}
184cabdff1aSopenharmony_ci
185cabdff1aSopenharmony_ciconst RTPDynamicProtocolHandler ff_amr_nb_dynamic_handler = {
186cabdff1aSopenharmony_ci    .enc_name         = "AMR",
187cabdff1aSopenharmony_ci    .codec_type       = AVMEDIA_TYPE_AUDIO,
188cabdff1aSopenharmony_ci    .codec_id         = AV_CODEC_ID_AMR_NB,
189cabdff1aSopenharmony_ci    .priv_data_size   = sizeof(PayloadContext),
190cabdff1aSopenharmony_ci    .init             = amr_init,
191cabdff1aSopenharmony_ci    .parse_sdp_a_line = amr_parse_sdp_line,
192cabdff1aSopenharmony_ci    .parse_packet     = amr_handle_packet,
193cabdff1aSopenharmony_ci};
194cabdff1aSopenharmony_ci
195cabdff1aSopenharmony_ciconst RTPDynamicProtocolHandler ff_amr_wb_dynamic_handler = {
196cabdff1aSopenharmony_ci    .enc_name         = "AMR-WB",
197cabdff1aSopenharmony_ci    .codec_type       = AVMEDIA_TYPE_AUDIO,
198cabdff1aSopenharmony_ci    .codec_id         = AV_CODEC_ID_AMR_WB,
199cabdff1aSopenharmony_ci    .priv_data_size   = sizeof(PayloadContext),
200cabdff1aSopenharmony_ci    .init             = amr_init,
201cabdff1aSopenharmony_ci    .parse_sdp_a_line = amr_parse_sdp_line,
202cabdff1aSopenharmony_ci    .parse_packet     = amr_handle_packet,
203cabdff1aSopenharmony_ci};
204