4 * Copyright (C) 2020 Zane van Iperen (zane@zanevaniperen.com)
6 * This file is part of FFmpeg.
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26 #include "avio_internal.h"
27 #include "libavutil/intreadwrite.h"
28 #include "libavutil/avassert.h"
32 * - AMV is a hard-coded (and broken) subset of AVI. It's not worth sullying the
33 * existing AVI muxer with its filth.
34 * - No separate demuxer as the existing AVI demuxer can handle these.
35 * - The sizes of certain tags are deliberately set to 0 as some players break
36 * when they're set correctly. Ditto with some header fields.
37 * - There is no index.
38 * - Players are **very** sensitive to the frame order and sizes.
39 * - Frames must be strictly interleaved as V-A; any V-V or A-A pair will cause crashes.
41 * - Variable video frame sizes seem to be handled fine.
42 * - Variable audio frame sizes cause crashes.
43 * - If audio is shorter than video, it's padded with silence.
44 * - If video is shorter than audio, the most recent frame is repeated.
/*
 * Fixed layout constants for the muxer: the required number of streams,
 * the index of the video and audio stream, and the byte counts used for
 * the per-stream "strh"/"strf" chunk payloads written by the header code.
 */
47 #define AMV_STREAM_COUNT 2
48 #define AMV_STREAM_VIDEO 0
49 #define AMV_STREAM_AUDIO 1
50 #define AMV_VIDEO_STRH_SIZE 56
51 #define AMV_VIDEO_STRF_SIZE 36
52 #define AMV_AUDIO_STRH_SIZE 48
53 #define AMV_AUDIO_STRF_SIZE 20 /* sizeof(WAVEFORMATEX) + 2 */
/*
 * Muxer private state, reached through s->priv_data.
 *
 * Holds the file offset of the duration field that the trailer seeks back
 * to, the timing and size values computed in amv_init(), the two packets
 * used for padding, and the per-stream sums of packet durations.
 *
 * NOTE(review): other members used elsewhere in this file (riff_start,
 * movi_list, last_stream) are not visible in this listing.
 */
55 typedef struct AMVContext
59 int64_t offset_duration
;
62 int32_t us_per_frame
; /* Microseconds per frame. */
64 int32_t aframe_size
; /* Expected audio frame size. */
65 int32_t ablock_align
; /* Expected audio block align. */
66 AVPacket
*apad
; /* Dummy audio packet for padding; not owned by us. */
67 AVPacket
*vpad
; /* Most recent video frame, for padding. */
70 * Cumulative PTS values for each stream, used for the final
71 * duration calculation.
73 int64_t lastpts
[AMV_STREAM_COUNT
];
/*
 * Open a chunk: writes the four-character code `tag` to `pb`.
 *
 * Callers keep the returned int64_t and later pass it to amv_end_tag().
 * NOTE(review): the statements that follow the fourcc write (size field
 * and return value) are not visible in this listing.
 */
76 /* ff_{start,end}_tag(), but sets the size to 0. */
77 static int64_t amv_start_tag(AVIOContext
*pb
, const char *tag
)
79 ffio_wfourcc(pb
, tag
);
/*
 * Close a chunk previously opened with amv_start_tag().
 *
 * Aborts via av_assert0() unless `start` is even.
 * NOTE(review): any further statements of the body are not visible in
 * this listing.
 */
84 static void amv_end_tag(AVIOContext
*pb
, int64_t start
)
87 av_assert0((start
&1) == 0);
/*
 * Validate the stream setup and prepare the muxer state.
 *
 * Checks visible in this listing, each failing with AVERROR(EINVAL):
 *  - exactly AMV_STREAM_COUNT streams are present;
 *  - the video stream uses AV_CODEC_ID_AMV (the audio codec is only
 *    checked with av_assert1());
 *  - the output is seekable;
 *  - us_per_frame is at least 15873, i.e. the video is not above 63 fps;
 *  - when the audio codecpar has a frame_size: frame_size and block_align
 *    are compared against the expected values, and the sample rate must be
 *    a multiple of aframe_size;
 *  - the audio time base, converted to microseconds, equals us_per_frame
 *    (presumably the branch taken when frame_size is unset; the branch
 *    structure is not fully visible here).
 *
 * Derived values:
 *  - us_per_frame = AV_TIME_BASE * video time_base.num / time_base.den
 *  - aframe_size  = sample_rate * us_per_frame / AV_TIME_BASE
 *  - ablock_align = 8 + FFALIGN(aframe_size, 2) / 2
 *
 * Finally sets up the padding packets: apad borrows
 * ffformatcontext(s)->pkt, is sized to ablock_align, zero-filled, and gets
 * aframe_size stored little-endian at byte offset 4; vpad is newly
 * allocated, tagged as the video stream and given a duration of 1.
 * AVERROR(ENOMEM) is returned on the vpad allocation path.
 *
 * NOTE(review): local declarations (vst, ast, ret), several closing braces
 * and return statements are missing from this listing.
 */
94 static av_cold
int amv_init(AVFormatContext
*s
)
96 AMVContext
*amv
= s
->priv_data
;
100 amv
->last_stream
= -1;
102 if (s
->nb_streams
!= AMV_STREAM_COUNT
) {
103 av_log(s
, AV_LOG_ERROR
, "AMV files only support 2 streams\n");
104 return AVERROR(EINVAL
);
107 vst
= s
->streams
[AMV_STREAM_VIDEO
];
108 ast
= s
->streams
[AMV_STREAM_AUDIO
];
110 if (vst
->codecpar
->codec_id
!= AV_CODEC_ID_AMV
) {
111 av_log(s
, AV_LOG_ERROR
, "First AMV stream must be %s\n",
112 avcodec_get_name(AV_CODEC_ID_AMV
));
113 return AVERROR(EINVAL
);
116 av_assert1(ast
->codecpar
->codec_id
== AV_CODEC_ID_ADPCM_IMA_AMV
);
118 /* These files are broken-enough as they are. They shouldn't be streamed. */
119 if (!(s
->pb
->seekable
& AVIO_SEEKABLE_NORMAL
)) {
120 av_log(s
, AV_LOG_ERROR
, "Stream not seekable, unable to write output file\n");
121 return AVERROR(EINVAL
);
124 amv
->us_per_frame
= av_rescale(AV_TIME_BASE
, vst
->time_base
.num
, vst
->time_base
.den
);
125 amv
->aframe_size
= av_rescale(ast
->codecpar
->sample_rate
, amv
->us_per_frame
, AV_TIME_BASE
);
126 amv
->ablock_align
= 8 + (FFALIGN(amv
->aframe_size
, 2) / 2);
128 av_log(s
, AV_LOG_TRACE
, "us_per_frame = %d\n", amv
->us_per_frame
);
129 av_log(s
, AV_LOG_TRACE
, "aframe_size = %d\n", amv
->aframe_size
);
130 av_log(s
, AV_LOG_TRACE
, "ablock_align = %d\n", amv
->ablock_align
);
133 * Bail if the framerate's too high. Prevents the audio frame size from
134 * getting too small. 63fps is the closest value to 60fps that divides
135 * cleanly, so cap it there.
137 if (amv
->us_per_frame
< 15873) {
138 av_log(s
, AV_LOG_ERROR
, "Refusing to mux >63fps video\n");
139 return AVERROR(EINVAL
);
143 * frame_size will be set if coming from the encoder.
144 * Make sure the its been configured correctly. The audio frame duration
145 * needs to match that of the video.
147 if (ast
->codecpar
->frame_size
) {
148 AVCodecParameters
*par
= ast
->codecpar
;
151 if (par
->frame_size
!= amv
->aframe_size
) {
152 av_log(s
, AV_LOG_ERROR
, "Invalid audio frame size. Got %d, wanted %d\n",
153 par
->frame_size
, amv
->aframe_size
);
157 if (par
->block_align
!= amv
->ablock_align
) {
158 av_log(s
, AV_LOG_ERROR
, "Invalid audio block align. Got %d, wanted %d\n",
159 par
->block_align
, amv
->ablock_align
);
164 av_log(s
, AV_LOG_ERROR
, "Try -block_size %d\n", amv
->aframe_size
);
165 return AVERROR(EINVAL
);
168 if (ast
->codecpar
->sample_rate
% amv
->aframe_size
) {
169 av_log(s
, AV_LOG_ERROR
, "Audio sample rate not a multiple of the frame size.\n"
170 "Please change video frame rate. Suggested rates: 10,14,15,18,21,25,30\n");
171 return AVERROR(EINVAL
);
174 /* If remuxing from the same source, then this will match the video. */
175 int32_t aus
= av_rescale(AV_TIME_BASE
, ast
->time_base
.num
, ast
->time_base
.den
);
176 if (aus
!= amv
->us_per_frame
) {
177 av_log(s
, AV_LOG_ERROR
, "Cannot remux streams with a different time base\n");
178 return AVERROR(EINVAL
);
182 /* Allocate and fill dummy packet so we can pad the audio. */
183 amv
->apad
= ffformatcontext(s
)->pkt
;
184 if ((ret
= av_new_packet(amv
->apad
, amv
->ablock_align
)) < 0) {
188 amv
->apad
->stream_index
= AMV_STREAM_AUDIO
;
189 memset(amv
->apad
->data
, 0, amv
->ablock_align
);
190 AV_WL32(amv
->apad
->data
+ 4, amv
->aframe_size
);
192 amv
->vpad
= av_packet_alloc();
194 return AVERROR(ENOMEM
);
196 amv
->vpad
->stream_index
= AMV_STREAM_VIDEO
;
197 amv
->vpad
->duration
= 1;
/*
 * Release muxer resources: frees the saved video padding packet (vpad).
 * The audio padding packet (apad) is not freed here; amv_init() takes it
 * from ffformatcontext(s)->pkt rather than allocating it.
 */
201 static void amv_deinit(AVFormatContext
*s
)
203 AMVContext
*amv
= s
->priv_data
;
205 av_packet_free(&amv
->vpad
);
/*
 * Write the stream list ("LIST"/"strl") for the video stream to s->pb.
 *
 * The list holds a "strh" chunk of AMV_VIDEO_STRH_SIZE zero bytes followed
 * by a "strf" chunk of AMV_VIDEO_STRF_SIZE zero bytes. The outer LIST is
 * opened and closed with the amv_* tag helpers, the inner chunks with the
 * regular ff_start_tag()/ff_end_tag().
 *
 * `par` is only used to assert that the codec is AV_CODEC_ID_AMV.
 */
208 static void amv_write_vlist(AVFormatContext
*s
, AVCodecParameters
*par
)
210 int64_t tag_list
, tag_str
;
212 av_assert0(par
->codec_id
== AV_CODEC_ID_AMV
);
214 tag_list
= amv_start_tag(s
->pb
, "LIST");
215 ffio_wfourcc(s
->pb
, "strl");
216 tag_str
= ff_start_tag(s
->pb
, "strh");
217 ffio_fill(s
->pb
, 0, AMV_VIDEO_STRH_SIZE
);
218 ff_end_tag(s
->pb
, tag_str
);
220 tag_str
= ff_start_tag(s
->pb
, "strf");
221 ffio_fill(s
->pb
, 0, AMV_VIDEO_STRF_SIZE
);
222 ff_end_tag(s
->pb
, tag_str
);
224 amv_end_tag(s
->pb
, tag_list
);
/*
 * Write the stream list ("LIST"/"strl") for the audio stream.
 *
 * The "strh" chunk is AMV_AUDIO_STRH_SIZE zero bytes. The "strf" chunk is
 * an AMV_AUDIO_STRF_SIZE byte buffer filled with little-endian fields:
 *   offset  2 (16 bit): channel count
 *   offset  4 (32 bit): sample rate
 *   offset  8 (32 bit): sample rate * channel count * 2
 *   offset 12 (16 bit): 2
 *   offset 14 (16 bit): 16
 *   offset 16 and 18 (16 bit each): 0
 *
 * Asserts that the codec is AV_CODEC_ID_ADPCM_IMA_AMV.
 *
 * NOTE(review): no write to buffer bytes 0-1 is visible in this listing;
 * confirm against the complete file that they are initialised before
 * avio_write().
 */
227 static void amv_write_alist(AVFormatContext
*s
, AVCodecParameters
*par
)
229 uint8_t buf
[AMV_AUDIO_STRF_SIZE
];
230 AVIOContext
*pb
= s
->pb
;
231 int64_t tag_list
, tag_str
;
233 av_assert0(par
->codec_id
== AV_CODEC_ID_ADPCM_IMA_AMV
);
235 tag_list
= amv_start_tag(pb
, "LIST");
236 ffio_wfourcc(pb
, "strl");
237 tag_str
= ff_start_tag(pb
, "strh");
238 ffio_fill(s
->pb
, 0, AMV_AUDIO_STRH_SIZE
);
239 ff_end_tag(pb
, tag_str
);
241 /* Bodge an (incorrect) WAVEFORMATEX (+2 pad bytes) */
242 tag_str
= ff_start_tag(pb
, "strf");
244 AV_WL16(buf
+ 2, par
->ch_layout
.nb_channels
);
245 AV_WL32(buf
+ 4, par
->sample_rate
);
246 AV_WL32(buf
+ 8, par
->sample_rate
* par
->ch_layout
.nb_channels
* 2);
247 AV_WL16(buf
+ 12, 2);
248 AV_WL16(buf
+ 14, 16);
249 AV_WL16(buf
+ 16, 0);
250 AV_WL16(buf
+ 18, 0);
251 avio_write(pb
, buf
, AMV_AUDIO_STRF_SIZE
);
252 ff_end_tag(pb
, tag_str
);
254 amv_end_tag(pb
, tag_list
);
/*
 * Write the file header up to the start of the packet data.
 *
 * Output order: "RIFF" tag + "AMV ", a "LIST" tag + "hdrl", the "amvh"
 * fourcc with a 56-byte zero-initialised header block, the video and audio
 * stream lists, then a second "LIST" tag + "movi" that stays open for the
 * packets.
 *
 * Fields stored little-endian in the amvh block:
 *   offset  0: us_per_frame
 *   offset 32: video width
 *   offset 36: video height
 *   offset 40: video time_base.den
 *   offset 44: video time_base.num
 *   offset 48: 0
 *   offset 52: 0 (duration placeholder)
 *
 * offset_duration is set to the position of the last four bytes of that
 * block so the trailer can seek back and fill in the duration. The tag
 * values for RIFF and movi are stored in the context for the trailer.
 *
 * NOTE(review): the declaration of list1 and the return statement are not
 * visible in this listing.
 */
257 static int amv_write_header(AVFormatContext
*s
)
259 AMVContext
*amv
= s
->priv_data
;
260 AVIOContext
*pb
= s
->pb
;
261 AVStream
*vst
= s
->streams
[AMV_STREAM_VIDEO
];
262 AVStream
*ast
= s
->streams
[AMV_STREAM_AUDIO
];
263 uint8_t amvh
[56] = {0};
266 amv
->riff_start
= amv_start_tag(pb
, "RIFF");
267 ffio_wfourcc(pb
, "AMV ");
268 list1
= amv_start_tag(pb
, "LIST");
269 ffio_wfourcc(pb
, "hdrl");
271 ffio_wfourcc(pb
, "amvh");
274 AV_WL32(amvh
+ 0, amv
->us_per_frame
);
275 AV_WL32(amvh
+ 32, vst
->codecpar
->width
);
276 AV_WL32(amvh
+ 36, vst
->codecpar
->height
);
277 AV_WL32(amvh
+ 40, vst
->time_base
.den
);
278 AV_WL32(amvh
+ 44, vst
->time_base
.num
);
279 AV_WL32(amvh
+ 48, 0);
280 AV_WL32(amvh
+ 52, 0); /* duration, filled in later. */
282 avio_write(pb
, amvh
, sizeof(amvh
));
283 amv
->offset_duration
= avio_tell(pb
) - 4;
285 amv_write_vlist(s
, vst
->codecpar
);
286 amv_write_alist(s
, ast
->codecpar
);
287 amv_end_tag(pb
, list1
);
289 amv
->movi_list
= amv_start_tag(pb
, "LIST");
290 ffio_wfourcc(pb
, "movi");
/*
 * Write one packet as a chunk, with no interleaving or padding logic.
 *
 * The chunk fourcc is "00dc" for the video stream and "01wb" for the audio
 * stream, followed by the packet size as a little-endian 32-bit value and
 * the packet payload. An audio packet whose size differs from ablock_align
 * only triggers a warning; it is still written.
 *
 * Afterwards the packet duration is added to lastpts[] for its stream and
 * last_stream is set to the packet's stream index.
 *
 * NOTE(review): the handling of other stream indices and the return
 * statement are not visible in this listing.
 */
294 static int amv_write_packet_internal(AVFormatContext
*s
, AVPacket
*pkt
)
296 AMVContext
*amv
= s
->priv_data
;
298 if (pkt
->stream_index
== AMV_STREAM_VIDEO
)
299 ffio_wfourcc(s
->pb
, "00dc");
300 else if (pkt
->stream_index
== AMV_STREAM_AUDIO
)
301 ffio_wfourcc(s
->pb
, "01wb");
305 if (pkt
->stream_index
== AMV_STREAM_AUDIO
&& pkt
->size
!= amv
->ablock_align
) {
306 /* Can happen when remuxing files produced by another encoder. */
307 av_log(s
, AV_LOG_WARNING
, "Invalid audio packet size (%d != %d)\n",
308 pkt
->size
, amv
->ablock_align
);
311 avio_wl32(s
->pb
, pkt
->size
);
312 avio_write(s
->pb
, pkt
->data
, pkt
->size
);
314 amv
->lastpts
[pkt
->stream_index
] += pkt
->duration
;
315 amv
->last_stream
= pkt
->stream_index
;
/*
 * Insert a padding packet for the other stream when needed.
 *
 * Compares the incoming packet's stream index with last_stream. On the
 * padding path the index of the other stream is computed as
 * (stream_index + 1) % nb_streams, and the matching pad packet is written:
 * vpad for video, apad for audio. Any other index yields AVERROR(EINVAL).
 *
 * NOTE(review): the body of the first `if` is not visible in this listing;
 * presumably it returns early when the stream differs from the previous
 * one, so that no padding is written. Confirm against the complete file.
 */
319 static int amv_pad(AVFormatContext
*s
, AVPacket
*pkt
)
321 AMVContext
*amv
= s
->priv_data
;
322 int stream_index
= pkt
->stream_index
;
324 if (stream_index
!= amv
->last_stream
)
327 stream_index
= (stream_index
+ 1) % s
->nb_streams
;
328 if (stream_index
== AMV_STREAM_VIDEO
)
329 return amv_write_packet_internal(s
, amv
->vpad
);
330 else if (stream_index
== AMV_STREAM_AUDIO
)
331 return amv_write_packet_internal(s
, amv
->apad
);
335 return AVERROR(EINVAL
);
/*
 * Muxer write_packet callback.
 *
 * Steps, each checked for a negative result:
 *  1. amv_pad() inserts a dummy packet if needed;
 *  2. amv_write_packet_internal() writes the packet itself;
 *  3. for video packets, the previous vpad reference is dropped and vpad is
 *     re-referenced to this packet, so it can be reused as padding.
 *
 * NOTE(review): the declaration of ret, the error-path bodies and the
 * final return are not visible in this listing.
 */
338 static int amv_write_packet(AVFormatContext
*s
, AVPacket
*pkt
)
340 AMVContext
*amv
= s
->priv_data
;
343 /* Add a dummy frame if we've received two of the same index. */
344 if ((ret
= amv_pad(s
, pkt
)) < 0)
347 if ((ret
= amv_write_packet_internal(s
, pkt
)) < 0)
350 if (pkt
->stream_index
== AMV_STREAM_VIDEO
) {
351 /* Save the last packet for padding. */
352 av_packet_unref(amv
->vpad
);
353 if ((ret
= av_packet_ref(amv
->vpad
, pkt
)) < 0)
/*
 * Muxer write_trailer callback: finish the file and patch the duration.
 *
 * If the last packet written was video, one audio padding packet is
 * appended first. The "movi" and "RIFF" tags are then closed, the fourccs
 * "AMV_" and "END_" are written, and the output is positioned at
 * offset_duration (recorded by amv_write_header()).
 *
 * The accumulated per-stream durations are rescaled from each stream's
 * time base to AV_TIME_BASE_Q; whole seconds are obtained by dividing
 * maxpts by AV_TIME_BASE, and the value hh is written as a little-endian
 * 16-bit field.
 *
 * NOTE(review): the declarations of ret, maxpts, ss and hh, how maxpts is
 * formed from the two rescaled values, and the remaining field writes are
 * not visible in this listing.
 */
360 static int amv_write_trailer(AVFormatContext
*s
)
362 AMVContext
*amv
= s
->priv_data
;
363 AVStream
*vst
= s
->streams
[AMV_STREAM_VIDEO
];
364 AVStream
*ast
= s
->streams
[AMV_STREAM_AUDIO
];
368 /* Pad-out one last audio frame if needed. */
369 if (amv
->last_stream
== AMV_STREAM_VIDEO
) {
370 if ((ret
= amv_write_packet_internal(s
, amv
->apad
)) < 0)
374 amv_end_tag(s
->pb
, amv
->movi_list
);
375 amv_end_tag(s
->pb
, amv
->riff_start
);
377 ffio_wfourcc(s
->pb
, "AMV_");
378 ffio_wfourcc(s
->pb
, "END_");
380 if ((ret
= avio_seek(s
->pb
, amv
->offset_duration
, SEEK_SET
)) < 0)
383 /* Go back and write the duration. */
385 av_rescale_q(amv
->lastpts
[AMV_STREAM_VIDEO
], vst
->time_base
, AV_TIME_BASE_Q
),
386 av_rescale_q(amv
->lastpts
[AMV_STREAM_AUDIO
], ast
->time_base
, AV_TIME_BASE_Q
)
389 ss
= maxpts
/ AV_TIME_BASE
;
397 avio_wl16(s
->pb
, hh
);
/*
 * Output format descriptor for the AMV muxer.
 *
 * Declares the "amv" extension and "video/amv" MIME type, fixes the audio
 * and video codecs to ADPCM_IMA_AMV and AMV with no subtitle codec, and
 * wires up the deinit, write_header, write_packet and write_trailer
 * callbacks defined in this file.
 *
 * NOTE(review): some initialisers (for example the format name and the
 * init callback) and the closing brace are not visible in this listing.
 */
401 const FFOutputFormat ff_amv_muxer
= {
403 .p
.long_name
= NULL_IF_CONFIG_SMALL("AMV"),
404 .p
.mime_type
= "video/amv",
405 .p
.extensions
= "amv",
406 .priv_data_size
= sizeof(AMVContext
),
407 .p
.audio_codec
= AV_CODEC_ID_ADPCM_IMA_AMV
,
408 .p
.video_codec
= AV_CODEC_ID_AMV
,
409 .p
.subtitle_codec
= AV_CODEC_ID_NONE
,
410 .flags_internal
= FF_OFMT_FLAG_MAX_ONE_OF_EACH
|
411 FF_OFMT_FLAG_ONLY_DEFAULT_CODECS
,
413 .deinit
= amv_deinit
,
414 .write_header
= amv_write_header
,
415 .write_packet
= amv_write_packet
,
416 .write_trailer
= amv_write_trailer
,