xref: /third_party/ffmpeg/libavformat/amvenc.c (revision cabdff1a)
1/*
2 * AMV muxer
3 *
4 * Copyright (C) 2020 Zane van Iperen (zane@zanevaniperen.com)
5 *
6 * This file is part of FFmpeg.
7 *
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
#include <stdint.h>

#include "avformat.h"
#include "riff.h"
#include "internal.h"
#include "avio_internal.h"
#include "libavutil/intreadwrite.h"
#include "libavutil/avassert.h"
28
29/*
30 * Things to note:
31 * - AMV is a hard-coded (and broken) subset of AVI. It's not worth sullying the
32 *   existing AVI muxer with its filth.
33 * - No separate demuxer as the existing AVI demuxer can handle these.
34 * - The sizes of certain tags are deliberately set to 0 as some players break
35 *   when they're set correctly. Ditto with some header fields.
36 * - There is no index.
37 * - Players are **very** sensitive to the frame order and sizes.
38 *   - Frames must be strictly interleaved as V-A, any V-V or A-A will
39 *     cause crashes.
40 *   - Variable video frame sizes seem to be handled fine.
41 *   - Variable audio frame sizes cause crashes.
42 *   - If audio is shorter than video, it's padded with silence.
43 *   - If video is shorter than audio, the most recent frame is repeated.
44 */
45
/* Fixed stream layout: exactly two streams, video first, audio second. */
enum {
    AMV_STREAM_VIDEO = 0,
    AMV_STREAM_AUDIO = 1,
    AMV_STREAM_COUNT = 2
};

/* Payload sizes, in bytes, of the per-stream header chunks. */
enum {
    AMV_VIDEO_STRH_SIZE = 56,
    AMV_VIDEO_STRF_SIZE = 36,
    AMV_AUDIO_STRH_SIZE = 48,
    AMV_AUDIO_STRF_SIZE = 20 /* sizeof(WAVEFORMATEX) + 2 */
};
53
54typedef struct AMVContext
55{
56    int64_t riff_start;
57    int64_t movi_list;
58    int64_t offset_duration;
59    int     last_stream;
60
61    int32_t us_per_frame; /* Microseconds per frame.         */
62
63    int32_t aframe_size;  /* Expected audio frame size.      */
64    int32_t ablock_align; /* Expected audio block align.     */
65    AVPacket *apad;       /* Dummy audio packet for padding; not owned by us. */
66    AVPacket *vpad;       /* Most recent video frame, for padding. */
67
68    /*
69     * Cumulative PTS values for each stream, used for the final
70     * duration calculcation.
71     */
72    int64_t lastpts[AMV_STREAM_COUNT];
73} AMVContext;
74
75/* ff_{start,end}_tag(), but sets the size to 0. */
76static int64_t amv_start_tag(AVIOContext *pb, const char *tag)
77{
78    ffio_wfourcc(pb, tag);
79    avio_wl32(pb, 0);
80    return avio_tell(pb);
81}
82
83static void amv_end_tag(AVIOContext *pb, int64_t start)
84{
85    int64_t pos;
86    av_assert0((start&1) == 0);
87
88    pos = avio_tell(pb);
89    if (pos & 1)
90        avio_w8(pb, 0);
91}
92
93static av_cold int amv_init(AVFormatContext *s)
94{
95    AMVContext *amv = s->priv_data;
96    AVStream   *vst, *ast;
97    int ret;
98
99    amv->last_stream  = -1;
100
101    if (s->nb_streams != AMV_STREAM_COUNT) {
102        av_log(s, AV_LOG_ERROR, "AMV files only support 2 streams\n");
103        return AVERROR(EINVAL);
104    }
105
106    vst = s->streams[AMV_STREAM_VIDEO];
107    ast = s->streams[AMV_STREAM_AUDIO];
108
109    if (vst->codecpar->codec_id != AV_CODEC_ID_AMV) {
110        av_log(s, AV_LOG_ERROR, "First AMV stream must be %s\n",
111                avcodec_get_name(AV_CODEC_ID_AMV));
112        return AVERROR(EINVAL);
113    }
114
115    if (ast->codecpar->codec_id != AV_CODEC_ID_ADPCM_IMA_AMV) {
116        av_log(s, AV_LOG_ERROR, "Second AMV stream must be %s\n",
117                avcodec_get_name(AV_CODEC_ID_ADPCM_IMA_AMV));
118        return AVERROR(EINVAL);
119    }
120
121    /* These files are broken-enough as they are. They shouldn't be streamed. */
122    if (!(s->pb->seekable & AVIO_SEEKABLE_NORMAL)) {
123        av_log(s, AV_LOG_ERROR, "Stream not seekable, unable to write output file\n");
124        return AVERROR(EINVAL);
125    }
126
127    amv->us_per_frame = av_rescale(AV_TIME_BASE, vst->time_base.num, vst->time_base.den);
128    amv->aframe_size  = av_rescale(ast->codecpar->sample_rate, amv->us_per_frame, AV_TIME_BASE);
129    amv->ablock_align = 8 + (FFALIGN(amv->aframe_size, 2) / 2);
130
131    av_log(s, AV_LOG_TRACE, "us_per_frame = %d\n", amv->us_per_frame);
132    av_log(s, AV_LOG_TRACE, "aframe_size  = %d\n", amv->aframe_size);
133    av_log(s, AV_LOG_TRACE, "ablock_align = %d\n", amv->ablock_align);
134
135    /*
136     * Bail if the framerate's too high. Prevents the audio frame size from
137     * getting too small. 63fps is the closest value to 60fps that divides
138     * cleanly, so cap it there.
139     */
140    if (amv->us_per_frame < 15873) {
141        av_log(s, AV_LOG_ERROR, "Refusing to mux >63fps video\n");
142        return AVERROR(EINVAL);
143    }
144
145    /*
146     * frame_size will be set if coming from the encoder.
147     * Make sure the its been configured correctly. The audio frame duration
148     * needs to match that of the video.
149     */
150    if (ast->codecpar->frame_size) {
151        AVCodecParameters *par = ast->codecpar;
152        int bad = 0;
153
154        if (par->frame_size != amv->aframe_size) {
155            av_log(s, AV_LOG_ERROR, "Invalid audio frame size. Got %d, wanted %d\n",
156                   par->frame_size, amv->aframe_size);
157            bad = 1;
158        }
159
160        if (par->block_align != amv->ablock_align) {
161            av_log(s, AV_LOG_ERROR, "Invalid audio block align. Got %d, wanted %d\n",
162                   par->block_align, amv->ablock_align);
163            bad = 1;
164        }
165
166        if (bad) {
167            av_log(s, AV_LOG_ERROR, "Try -block_size %d\n", amv->aframe_size);
168            return AVERROR(EINVAL);
169        }
170
171        if (ast->codecpar->sample_rate % amv->aframe_size) {
172            av_log(s, AV_LOG_ERROR, "Audio sample rate not a multiple of the frame size.\n"
173                "Please change video frame rate. Suggested rates: 10,14,15,18,21,25,30\n");
174            return AVERROR(EINVAL);
175        }
176    } else {
177        /* If remuxing from the same source, then this will match the video. */
178        int32_t aus = av_rescale(AV_TIME_BASE, ast->time_base.num, ast->time_base.den);
179        if (aus != amv->us_per_frame) {
180            av_log(s, AV_LOG_ERROR, "Cannot remux streams with a different time base\n");
181            return AVERROR(EINVAL);
182        }
183    }
184
185    /* Allocate and fill dummy packet so we can pad the audio. */
186    amv->apad = ffformatcontext(s)->pkt;
187    if ((ret = av_new_packet(amv->apad, amv->ablock_align)) < 0) {
188        return ret;
189    }
190
191    amv->apad->stream_index = AMV_STREAM_AUDIO;
192    memset(amv->apad->data, 0, amv->ablock_align);
193    AV_WL32(amv->apad->data + 4, amv->aframe_size);
194
195    amv->vpad = av_packet_alloc();
196    if (!amv->vpad) {
197        return AVERROR(ENOMEM);
198    }
199    amv->vpad->stream_index = AMV_STREAM_VIDEO;
200    amv->vpad->duration     = 1;
201    return 0;
202}
203
204static void amv_deinit(AVFormatContext *s)
205{
206    AMVContext *amv = s->priv_data;
207
208    av_packet_free(&amv->vpad);
209}
210
211static void amv_write_vlist(AVFormatContext *s, AVCodecParameters *par)
212{
213    int64_t tag_list, tag_str;
214
215    av_assert0(par->codec_id == AV_CODEC_ID_AMV);
216
217    tag_list = amv_start_tag(s->pb, "LIST");
218    ffio_wfourcc(s->pb, "strl");
219    tag_str = ff_start_tag(s->pb, "strh");
220    ffio_fill(s->pb, 0, AMV_VIDEO_STRH_SIZE);
221    ff_end_tag(s->pb, tag_str);
222
223    tag_str = ff_start_tag(s->pb, "strf");
224    ffio_fill(s->pb, 0, AMV_VIDEO_STRF_SIZE);
225    ff_end_tag(s->pb, tag_str);
226
227    amv_end_tag(s->pb, tag_list);
228}
229
230static void amv_write_alist(AVFormatContext *s, AVCodecParameters *par)
231{
232    uint8_t buf[AMV_AUDIO_STRF_SIZE];
233    AVIOContext *pb = s->pb;
234    int64_t tag_list, tag_str;
235
236    av_assert0(par->codec_id == AV_CODEC_ID_ADPCM_IMA_AMV);
237
238    tag_list = amv_start_tag(pb, "LIST");
239    ffio_wfourcc(pb, "strl");
240    tag_str = ff_start_tag(pb, "strh");
241    ffio_fill(s->pb, 0, AMV_AUDIO_STRH_SIZE);
242    ff_end_tag(pb, tag_str);
243
244    /* Bodge an (incorrect) WAVEFORMATEX (+2 pad bytes) */
245    tag_str = ff_start_tag(pb, "strf");
246    AV_WL16(buf +  0, 1);
247    AV_WL16(buf +  2, par->ch_layout.nb_channels);
248    AV_WL32(buf +  4, par->sample_rate);
249    AV_WL32(buf +  8, par->sample_rate * par->ch_layout.nb_channels * 2);
250    AV_WL16(buf + 12, 2);
251    AV_WL16(buf + 14, 16);
252    AV_WL16(buf + 16, 0);
253    AV_WL16(buf + 18, 0);
254    avio_write(pb, buf, AMV_AUDIO_STRF_SIZE);
255    ff_end_tag(pb, tag_str);
256
257    amv_end_tag(pb, tag_list);
258}
259
260static int amv_write_header(AVFormatContext *s)
261{
262    AMVContext *amv = s->priv_data;
263    AVIOContext *pb = s->pb;
264    AVStream *vst   = s->streams[AMV_STREAM_VIDEO];
265    AVStream *ast   = s->streams[AMV_STREAM_AUDIO];
266    uint8_t amvh[56] = {0};
267    int64_t list1;
268
269    amv->riff_start = amv_start_tag(pb, "RIFF");
270    ffio_wfourcc(pb, "AMV ");
271    list1 = amv_start_tag(pb, "LIST");
272    ffio_wfourcc(pb, "hdrl");
273
274    ffio_wfourcc(pb, "amvh");
275    avio_wl32(pb, 56);
276
277    AV_WL32(amvh +  0, amv->us_per_frame);
278    AV_WL32(amvh + 32, vst->codecpar->width);
279    AV_WL32(amvh + 36, vst->codecpar->height);
280    AV_WL32(amvh + 40, vst->time_base.den);
281    AV_WL32(amvh + 44, vst->time_base.num);
282    AV_WL32(amvh + 48, 0);
283    AV_WL32(amvh + 52, 0); /* duration, filled in later. */
284
285    avio_write(pb, amvh, sizeof(amvh));
286    amv->offset_duration = avio_tell(pb) - 4;
287
288    amv_write_vlist(s, vst->codecpar);
289    amv_write_alist(s, ast->codecpar);
290    amv_end_tag(pb, list1);
291
292    amv->movi_list = amv_start_tag(pb, "LIST");
293    ffio_wfourcc(pb, "movi");
294    return 0;
295}
296
297static int amv_write_packet_internal(AVFormatContext *s, AVPacket *pkt)
298{
299    AMVContext *amv = s->priv_data;
300
301    if (pkt->stream_index == AMV_STREAM_VIDEO)
302        ffio_wfourcc(s->pb, "00dc");
303    else if (pkt->stream_index == AMV_STREAM_AUDIO)
304        ffio_wfourcc(s->pb, "01wb");
305    else
306        av_assert0(0);
307
308    if (pkt->stream_index == AMV_STREAM_AUDIO && pkt->size != amv->ablock_align) {
309        /* Can happen when remuxing files produced by another encoder. */
310        av_log(s, AV_LOG_WARNING, "Invalid audio packet size (%d != %d)\n",
311               pkt->size, amv->ablock_align);
312    }
313
314    avio_wl32(s->pb, pkt->size);
315    avio_write(s->pb, pkt->data, pkt->size);
316
317    amv->lastpts[pkt->stream_index] += pkt->duration;
318    amv->last_stream = pkt->stream_index;
319    return 0;
320}
321
322static int amv_pad(AVFormatContext *s, AVPacket *pkt)
323{
324    AMVContext *amv = s->priv_data;
325    int stream_index = pkt->stream_index;
326
327    if (stream_index != amv->last_stream)
328        return 0;
329
330    stream_index = (stream_index + 1) % s->nb_streams;
331    if (stream_index == AMV_STREAM_VIDEO)
332        return amv_write_packet_internal(s, amv->vpad);
333    else if (stream_index == AMV_STREAM_AUDIO)
334        return amv_write_packet_internal(s, amv->apad);
335    else
336        av_assert0(0);
337
338    return AVERROR(EINVAL);
339}
340
341static int amv_write_packet(AVFormatContext *s, AVPacket *pkt)
342{
343    AMVContext *amv = s->priv_data;
344    int ret;
345
346    /* Add a dummy frame if we've received two of the same index. */
347    if ((ret = amv_pad(s, pkt)) < 0)
348        return ret;
349
350    if ((ret = amv_write_packet_internal(s, pkt)) < 0)
351        return ret;
352
353    if (pkt->stream_index == AMV_STREAM_VIDEO) {
354        /* Save the last packet for padding. */
355        av_packet_unref(amv->vpad);
356        if ((ret = av_packet_ref(amv->vpad, pkt)) < 0)
357            return ret;
358    }
359
360    return 0;
361}
362
363static int amv_write_trailer(AVFormatContext *s)
364{
365    AMVContext *amv = s->priv_data;
366    AVStream   *vst = s->streams[AMV_STREAM_VIDEO];
367    AVStream   *ast = s->streams[AMV_STREAM_AUDIO];
368    int64_t maxpts, ret;
369    int hh, mm, ss;
370
371    /* Pad-out one last audio frame if needed. */
372    if (amv->last_stream == AMV_STREAM_VIDEO) {
373        if ((ret = amv_write_packet_internal(s, amv->apad)) < 0)
374            return ret;
375    }
376
377    amv_end_tag(s->pb, amv->movi_list);
378    amv_end_tag(s->pb, amv->riff_start);
379
380    ffio_wfourcc(s->pb, "AMV_");
381    ffio_wfourcc(s->pb, "END_");
382
383    if ((ret = avio_seek(s->pb, amv->offset_duration, SEEK_SET)) < 0)
384        return ret;
385
386    /* Go back and write the duration. */
387    maxpts = FFMAX(
388        av_rescale_q(amv->lastpts[AMV_STREAM_VIDEO], vst->time_base, AV_TIME_BASE_Q),
389        av_rescale_q(amv->lastpts[AMV_STREAM_AUDIO], ast->time_base, AV_TIME_BASE_Q)
390    );
391
392    ss  = maxpts / AV_TIME_BASE;
393    mm  = ss / 60;
394    hh  = mm / 60;
395    ss %= 60;
396    mm %= 60;
397
398    avio_w8(s->pb, ss);
399    avio_w8(s->pb, mm);
400    avio_wl16(s->pb, hh);
401    return 0;
402}
403
404const AVOutputFormat ff_amv_muxer = {
405    .name           = "amv",
406    .long_name      = NULL_IF_CONFIG_SMALL("AMV"),
407    .mime_type      = "video/amv",
408    .extensions     = "amv",
409    .priv_data_size = sizeof(AMVContext),
410    .audio_codec    = AV_CODEC_ID_ADPCM_IMA_AMV,
411    .video_codec    = AV_CODEC_ID_AMV,
412    .init           = amv_init,
413    .deinit         = amv_deinit,
414    .write_header   = amv_write_header,
415    .write_packet   = amv_write_packet,
416    .write_trailer  = amv_write_trailer,
417};
418