src/feature/ffmpeg/ffmpeg-encoder.c (view raw)
1/* Copyright (c) 2013-2015 Jeffrey Pfau
2 *
3 * This Source Code Form is subject to the terms of the Mozilla Public
4 * License, v. 2.0. If a copy of the MPL was not distributed with this
5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include "ffmpeg-encoder.h"
7
8#include <mgba/core/core.h>
9#include <mgba/gba/interface.h>
10#include <mgba-util/math.h>
11
12#include <libavcodec/version.h>
13#include <libavcodec/avcodec.h>
14
15#include <libavfilter/buffersink.h>
16#include <libavfilter/buffersrc.h>
17
18#include <libavutil/version.h>
19#if LIBAVUTIL_VERSION_MAJOR >= 53
20#include <libavutil/buffer.h>
21#endif
22#include <libavutil/imgutils.h>
23#include <libavutil/mathematics.h>
24#include <libavutil/opt.h>
25
26#ifdef USE_LIBAVRESAMPLE
27#include <libavresample/avresample.h>
28#else
29#include <libswresample/swresample.h>
30#endif
31#include <libswscale/swscale.h>
32
// mAVStream callbacks; FFmpegEncoderInit installs these on encoder->d
static void _ffmpegPostVideoFrame(struct mAVStream*, const color_t* pixels, size_t stride);
static void _ffmpegPostAudioFrame(struct mAVStream*, int16_t left, int16_t right);
static void _ffmpegSetVideoDimensions(struct mAVStream*, unsigned width, unsigned height);

// Encode one frame and mux the resulting packet, if any. FFmpegEncoderClose passes
// a NULL frame repeatedly to drain the encoder; the return value says whether a packet came out.
static bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame);
static bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame);
39
enum {
	// Rate (Hz) configured as the resampler's input, and the output rate
	// requested from a codec whenever the codec allows it
	PREFERRED_SAMPLE_RATE = 32768
};
43
44void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
45#if LIBAVFORMAT_VERSION_INT < AV_VERSION_INT(58, 9, 100)
46 av_register_all();
47#endif
48
49 encoder->d.videoDimensionsChanged = _ffmpegSetVideoDimensions;
50 encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
51 encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
52 encoder->d.postAudioBuffer = 0;
53
54 encoder->audioCodec = NULL;
55 encoder->videoCodec = NULL;
56 encoder->containerFormat = NULL;
57 FFmpegEncoderSetAudio(encoder, "flac", 0);
58 FFmpegEncoderSetVideo(encoder, "libx264", 0, 0);
59 FFmpegEncoderSetContainer(encoder, "matroska");
60 FFmpegEncoderSetDimensions(encoder, GBA_VIDEO_HORIZONTAL_PIXELS, GBA_VIDEO_VERTICAL_PIXELS);
61 encoder->iwidth = GBA_VIDEO_HORIZONTAL_PIXELS;
62 encoder->iheight = GBA_VIDEO_VERTICAL_PIXELS;
63 encoder->frameskip = 1;
64 encoder->skipResidue = 0;
65 encoder->loop = false;
66 encoder->ipixFormat =
67#ifdef COLOR_16_BIT
68#ifdef COLOR_5_6_5
69 AV_PIX_FMT_RGB565;
70#else
71 AV_PIX_FMT_BGR555;
72#endif
73#else
74#ifndef USE_LIBAV
75 AV_PIX_FMT_0BGR32;
76#else
77 AV_PIX_FMT_BGR32;
78#endif
79#endif
80 encoder->resampleContext = NULL;
81 encoder->absf = NULL;
82 encoder->context = NULL;
83 encoder->scaleContext = NULL;
84 encoder->audio = NULL;
85 encoder->audioStream = NULL;
86 encoder->audioFrame = NULL;
87 encoder->audioBuffer = NULL;
88 encoder->postaudioBuffer = NULL;
89 encoder->video = NULL;
90 encoder->videoStream = NULL;
91 encoder->videoFrame = NULL;
92 encoder->graph = NULL;
93 encoder->source = NULL;
94 encoder->sink = NULL;
95 encoder->sinkFrame = NULL;
96 FFmpegEncoderSetInputFrameRate(encoder, VIDEO_TOTAL_LENGTH, GBA_ARM7TDMI_FREQUENCY);
97
98 int i;
99 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
100 encoder->filters[i] = NULL;
101 }
102}
103
104bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
105 static const struct {
106 int format;
107 int priority;
108 } priorities[] = {
109 { AV_SAMPLE_FMT_S16, 0 },
110 { AV_SAMPLE_FMT_S16P, 1 },
111 { AV_SAMPLE_FMT_S32, 2 },
112 { AV_SAMPLE_FMT_S32P, 2 },
113 { AV_SAMPLE_FMT_FLT, 3 },
114 { AV_SAMPLE_FMT_FLTP, 3 },
115 { AV_SAMPLE_FMT_DBL, 4 },
116 { AV_SAMPLE_FMT_DBLP, 4 }
117 };
118
119 if (!acodec) {
120 encoder->audioCodec = 0;
121 return true;
122 }
123
124 AVCodec* codec = avcodec_find_encoder_by_name(acodec);
125 if (!codec) {
126 return false;
127 }
128
129 if (!codec->sample_fmts) {
130 return false;
131 }
132 size_t i;
133 size_t j;
134 int priority = INT_MAX;
135 encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
136 for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
137 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
138 if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
139 priority = priorities[j].priority;
140 encoder->sampleFormat = codec->sample_fmts[i];
141 }
142 }
143 }
144 if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
145 return false;
146 }
147 encoder->sampleRate = PREFERRED_SAMPLE_RATE;
148 if (codec->supported_samplerates) {
149 for (i = 0; codec->supported_samplerates[i]; ++i) {
150 if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
151 continue;
152 }
153 if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
154 encoder->sampleRate = codec->supported_samplerates[i];
155 }
156 }
157 } else if (codec->id == AV_CODEC_ID_AAC) {
158 // HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
159 encoder->sampleRate = 44100;
160 }
161 encoder->audioCodec = acodec;
162 encoder->audioBitrate = abr;
163 return true;
164}
165
166bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, unsigned vbr, int frameskip) {
167 static const struct {
168 enum AVPixelFormat format;
169 int priority;
170 } priorities[] = {
171 { AV_PIX_FMT_RGB555, 0 },
172 { AV_PIX_FMT_BGR555, 0 },
173 { AV_PIX_FMT_RGB565, 1 },
174 { AV_PIX_FMT_BGR565, 1 },
175 { AV_PIX_FMT_RGB24, 2 },
176 { AV_PIX_FMT_BGR24, 2 },
177#ifndef USE_LIBAV
178 { AV_PIX_FMT_BGR0, 3 },
179 { AV_PIX_FMT_RGB0, 3 },
180 { AV_PIX_FMT_0BGR, 3 },
181 { AV_PIX_FMT_0RGB, 3 },
182#endif
183 { AV_PIX_FMT_RGB32, 4},
184 { AV_PIX_FMT_BGR32, 4},
185 { AV_PIX_FMT_YUV444P, 5 },
186 { AV_PIX_FMT_YUV422P, 6 },
187 { AV_PIX_FMT_YUV420P, 7 },
188 { AV_PIX_FMT_PAL8, 8 },
189 };
190
191 if (!vcodec) {
192 encoder->videoCodec = 0;
193 return true;
194 }
195
196 AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
197 if (!codec) {
198 return false;
199 }
200
201 size_t i;
202 size_t j;
203 int priority = INT_MAX;
204 encoder->pixFormat = AV_PIX_FMT_NONE;
205 for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
206 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
207 if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
208 priority = priorities[j].priority;
209 encoder->pixFormat = codec->pix_fmts[i];
210 }
211 }
212 }
213 if (encoder->pixFormat == AV_PIX_FMT_NONE) {
214 return false;
215 }
216 encoder->videoCodec = vcodec;
217 encoder->videoBitrate = vbr;
218 encoder->frameskip = frameskip + 1;
219 return true;
220}
221
222bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
223 AVOutputFormat* oformat = av_guess_format(container, 0, 0);
224 if (!oformat) {
225 return false;
226 }
227 encoder->containerFormat = container;
228 return true;
229}
230
231void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
232 encoder->width = width > 0 ? width : GBA_VIDEO_HORIZONTAL_PIXELS;
233 encoder->height = height > 0 ? height : GBA_VIDEO_VERTICAL_PIXELS;
234}
235
236void FFmpegEncoderSetLooping(struct FFmpegEncoder* encoder, bool loop) {
237 encoder->loop = loop;
238}
239
240bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
241 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
242 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
243 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
244 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !oformat || (!acodec && !vcodec)) {
245 return false;
246 }
247 if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
248 return false;
249 }
250 if (encoder->videoCodec && !avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
251 return false;
252 }
253 return true;
254}
255
256bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
257 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
258 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
259 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !FFmpegEncoderVerifyContainer(encoder)) {
260 return false;
261 }
262
263 if (encoder->context) {
264 return false;
265 }
266
267 encoder->currentAudioSample = 0;
268 encoder->currentAudioFrame = 0;
269 encoder->currentVideoFrame = 0;
270 encoder->skipResidue = 0;
271
272 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
273#ifndef USE_LIBAV
274 avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
275#else
276 encoder->context = avformat_alloc_context();
277 strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename) - 1);
278 encoder->context->filename[sizeof(encoder->context->filename) - 1] = '\0';
279 encoder->context->oformat = oformat;
280#endif
281
282 if (acodec) {
283#ifdef FFMPEG_USE_CODECPAR
284 encoder->audioStream = avformat_new_stream(encoder->context, NULL);
285 encoder->audio = avcodec_alloc_context3(acodec);
286#else
287 encoder->audioStream = avformat_new_stream(encoder->context, acodec);
288 encoder->audio = encoder->audioStream->codec;
289#endif
290 encoder->audio->bit_rate = encoder->audioBitrate;
291 encoder->audio->channels = 2;
292 encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
293 encoder->audio->sample_rate = encoder->sampleRate;
294 encoder->audio->sample_fmt = encoder->sampleFormat;
295 AVDictionary* opts = 0;
296 av_dict_set(&opts, "strict", "-2", 0);
297 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
298#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
299 encoder->audio->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
300#else
301 encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
302#endif
303 }
304 int res = avcodec_open2(encoder->audio, acodec, &opts);
305 av_dict_free(&opts);
306 if (res < 0) {
307 FFmpegEncoderClose(encoder);
308 return false;
309 }
310#if LIBAVCODEC_VERSION_MAJOR >= 55
311 encoder->audioFrame = av_frame_alloc();
312#else
313 encoder->audioFrame = avcodec_alloc_frame();
314#endif
315 if (!encoder->audio->frame_size) {
316 encoder->audio->frame_size = 1;
317 }
318 encoder->audioFrame->nb_samples = encoder->audio->frame_size;
319 encoder->audioFrame->format = encoder->audio->sample_fmt;
320 encoder->audioFrame->pts = 0;
321#ifdef USE_LIBAVRESAMPLE
322 encoder->resampleContext = avresample_alloc_context();
323 av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
324 av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
325 av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
326 av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
327 av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
328 av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
329 avresample_open(encoder->resampleContext);
330#else
331 encoder->resampleContext = swr_alloc_set_opts(NULL, AV_CH_LAYOUT_STEREO, encoder->sampleFormat, encoder->sampleRate,
332 AV_CH_LAYOUT_STEREO, AV_SAMPLE_FMT_S16, PREFERRED_SAMPLE_RATE, 0, NULL);
333 swr_init(encoder->resampleContext);
334#endif
335 encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
336 encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
337 encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
338 encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
339 avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
340
341 if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
342 (strcasecmp(encoder->containerFormat, "mp4") ||
343 strcasecmp(encoder->containerFormat, "m4v") ||
344 strcasecmp(encoder->containerFormat, "mov"))) {
345 // MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
346#ifdef FFMPEG_USE_NEW_BSF
347 av_bsf_alloc(av_bsf_get_by_name("aac_adtstoasc"), &encoder->absf);
348 avcodec_parameters_from_context(encoder->absf->par_in, encoder->audio);
349 av_bsf_init(encoder->absf);
350#else
351 encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
352#endif
353 }
354#ifdef FFMPEG_USE_CODECPAR
355 avcodec_parameters_from_context(encoder->audioStream->codecpar, encoder->audio);
356#endif
357 }
358
359 if (vcodec) {
360#ifdef FFMPEG_USE_CODECPAR
361 encoder->videoStream = avformat_new_stream(encoder->context, NULL);
362 encoder->video = avcodec_alloc_context3(vcodec);
363#else
364 encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
365 encoder->video = encoder->videoStream->codec;
366#endif
367 encoder->video->bit_rate = encoder->videoBitrate;
368 encoder->video->width = encoder->width;
369 encoder->video->height = encoder->height;
370 encoder->video->time_base = (AVRational) { encoder->frameCycles * encoder->frameskip, encoder->cycles };
371 encoder->video->framerate = (AVRational) { encoder->cycles, encoder->frameCycles * encoder->frameskip };
372 encoder->videoStream->time_base = encoder->video->time_base;
373 encoder->videoStream->avg_frame_rate = encoder->video->framerate;
374 encoder->video->pix_fmt = encoder->pixFormat;
375 encoder->video->gop_size = 60;
376 encoder->video->max_b_frames = 3;
377 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
378#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
379 encoder->video->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
380#else
381 encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
382#endif
383 }
384
385 if (encoder->video->codec->id == AV_CODEC_ID_H264 &&
386 (strcasecmp(encoder->containerFormat, "mp4") ||
387 strcasecmp(encoder->containerFormat, "m4v") ||
388 strcasecmp(encoder->containerFormat, "mov"))) {
389 // QuickTime and a few other things require YUV420
390 encoder->video->pix_fmt = AV_PIX_FMT_YUV420P;
391 }
392#if LIBAVCODEC_VERSION_MAJOR >= 57
393 if (encoder->video->codec->id == AV_CODEC_ID_FFV1) {
394 av_opt_set(encoder->video->priv_data, "coder", "range_tab", 0);
395 }
396#endif
397
398 if (strcmp(vcodec->name, "libx264") == 0) {
399 // Try to adaptively figure out when you can use a slower encoder
400 if (encoder->width * encoder->height > 1000000) {
401 av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
402 } else if (encoder->width * encoder->height > 500000) {
403 av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
404 } else {
405 av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
406 }
407 if (encoder->videoBitrate == 0) {
408 av_opt_set(encoder->video->priv_data, "crf", "0", 0);
409 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
410 }
411 }
412 if (strcmp(vcodec->name, "libvpx-vp9") == 0 && encoder->videoBitrate == 0) {
413 av_opt_set(encoder->video->priv_data, "lossless", "1", 0);
414 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
415 }
416 if (strcmp(vcodec->name, "libwebp_anim") == 0 && encoder->videoBitrate == 0) {
417 av_opt_set(encoder->video->priv_data, "lossless", "1", 0);
418 encoder->video->pix_fmt = AV_PIX_FMT_RGB32;
419 }
420
421 if (encoder->pixFormat == AV_PIX_FMT_PAL8) {
422 encoder->graph = avfilter_graph_alloc();
423
424 const struct AVFilter* source = avfilter_get_by_name("buffer");
425 const struct AVFilter* sink = avfilter_get_by_name("buffersink");
426 const struct AVFilter* split = avfilter_get_by_name("split");
427 const struct AVFilter* palettegen = avfilter_get_by_name("palettegen");
428 const struct AVFilter* paletteuse = avfilter_get_by_name("paletteuse");
429
430 if (!source || !sink || !split || !palettegen || !paletteuse || !encoder->graph) {
431 FFmpegEncoderClose(encoder);
432 return false;
433 }
434
435 char args[256];
436 snprintf(args, sizeof(args), "video_size=%dx%d:pix_fmt=%d:time_base=%d/%d",
437 encoder->video->width, encoder->video->height, encoder->ipixFormat,
438 encoder->video->time_base.num, encoder->video->time_base.den);
439
440 int res = 0;
441 res |= avfilter_graph_create_filter(&encoder->source, source, NULL, args, NULL, encoder->graph);
442 res |= avfilter_graph_create_filter(&encoder->sink, sink, NULL, NULL, NULL, encoder->graph);
443 res |= avfilter_graph_create_filter(&encoder->filters[0], split, NULL, NULL, NULL, encoder->graph);
444 res |= avfilter_graph_create_filter(&encoder->filters[1], palettegen, NULL, "reserve_transparent=off", NULL, encoder->graph);
445 res |= avfilter_graph_create_filter(&encoder->filters[2], paletteuse, NULL, "dither=none", NULL, encoder->graph);
446 if (res < 0) {
447 FFmpegEncoderClose(encoder);
448 return false;
449 }
450
451 res = 0;
452 res |= avfilter_link(encoder->source, 0, encoder->filters[0], 0);
453 res |= avfilter_link(encoder->filters[0], 0, encoder->filters[1], 0);
454 res |= avfilter_link(encoder->filters[0], 1, encoder->filters[2], 0);
455 res |= avfilter_link(encoder->filters[1], 0, encoder->filters[2], 1);
456 res |= avfilter_link(encoder->filters[2], 0, encoder->sink, 0);
457 if (res < 0 || avfilter_graph_config(encoder->graph, NULL) < 0) {
458 FFmpegEncoderClose(encoder);
459 return false;
460 }
461
462#if LIBAVCODEC_VERSION_MAJOR >= 55
463 encoder->sinkFrame = av_frame_alloc();
464#else
465 encoder->sinkFrame = avcodec_alloc_frame();
466#endif
467 }
468 AVDictionary* opts = 0;
469 av_dict_set(&opts, "strict", "-2", 0);
470 int res = avcodec_open2(encoder->video, vcodec, &opts);
471 av_dict_free(&opts);
472 if (res < 0) {
473 FFmpegEncoderClose(encoder);
474 return false;
475 }
476#if LIBAVCODEC_VERSION_MAJOR >= 55
477 encoder->videoFrame = av_frame_alloc();
478#else
479 encoder->videoFrame = avcodec_alloc_frame();
480#endif
481 encoder->videoFrame->format = encoder->video->pix_fmt != AV_PIX_FMT_PAL8 ? encoder->video->pix_fmt : encoder->ipixFormat;
482 encoder->videoFrame->width = encoder->video->width;
483 encoder->videoFrame->height = encoder->video->height;
484 encoder->videoFrame->pts = 0;
485 _ffmpegSetVideoDimensions(&encoder->d, encoder->iwidth, encoder->iheight);
486 av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format, 32);
487#ifdef FFMPEG_USE_CODECPAR
488 avcodec_parameters_from_context(encoder->videoStream->codecpar, encoder->video);
489#endif
490 }
491
492 if (strcmp(encoder->containerFormat, "gif") == 0) {
493 av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "-1", 0);
494 } else if (strcmp(encoder->containerFormat, "apng") == 0) {
495 av_opt_set(encoder->context->priv_data, "plays", encoder->loop ? "0" : "1", 0);
496 } else if (strcmp(encoder->containerFormat, "webp") == 0) {
497 av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "1", 0);
498 }
499
500 AVDictionary* opts = 0;
501 av_dict_set(&opts, "strict", "-2", 0);
502 bool res = avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE) < 0 || avformat_write_header(encoder->context, &opts) < 0;
503 av_dict_free(&opts);
504 if (res) {
505 FFmpegEncoderClose(encoder);
506 return false;
507 }
508 return true;
509}
510
511void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
512 if (encoder->audio) {
513 while (true) {
514 if (!_ffmpegWriteAudioFrame(encoder, NULL)) {
515 break;
516 }
517 }
518 }
519 if (encoder->video) {
520 if (encoder->graph) {
521 if (av_buffersrc_add_frame(encoder->source, NULL) >= 0) {
522 while (true) {
523 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
524 if (res < 0) {
525 break;
526 }
527 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
528 av_frame_unref(encoder->sinkFrame);
529 }
530 }
531 }
532 while (true) {
533 if (!_ffmpegWriteVideoFrame(encoder, NULL)) {
534 break;
535 }
536 }
537 }
538
539 if (encoder->context && encoder->context->pb) {
540 av_write_trailer(encoder->context);
541 avio_close(encoder->context->pb);
542 }
543
544 if (encoder->postaudioBuffer) {
545 av_free(encoder->postaudioBuffer);
546 encoder->postaudioBuffer = NULL;
547 }
548 if (encoder->audioBuffer) {
549 av_free(encoder->audioBuffer);
550 encoder->audioBuffer = NULL;
551 }
552
553 if (encoder->audioFrame) {
554#if LIBAVCODEC_VERSION_MAJOR >= 55
555 av_frame_free(&encoder->audioFrame);
556#else
557 avcodec_free_frame(&encoder->audioFrame);
558#endif
559 }
560 if (encoder->audio) {
561#ifdef FFMPEG_USE_CODECPAR
562 avcodec_free_context(&encoder->audio);
563#else
564 avcodec_close(encoder->audio);
565 encoder->audio = NULL;
566#endif
567 }
568
569 if (encoder->resampleContext) {
570#ifdef USE_LIBAVRESAMPLE
571 avresample_close(encoder->resampleContext);
572 encoder->resampleContext = NULL;
573#else
574 swr_free(&encoder->resampleContext);
575#endif
576 }
577
578 if (encoder->absf) {
579#ifdef FFMPEG_USE_NEW_BSF
580 av_bsf_free(&encoder->absf);
581#else
582 av_bitstream_filter_close(encoder->absf);
583 encoder->absf = NULL;
584#endif
585 }
586
587 if (encoder->videoFrame) {
588 av_freep(encoder->videoFrame->data);
589#if LIBAVCODEC_VERSION_MAJOR >= 55
590 av_frame_free(&encoder->videoFrame);
591#else
592 avcodec_free_frame(&encoder->videoFrame);
593#endif
594 }
595
596 if (encoder->sinkFrame) {
597#if LIBAVCODEC_VERSION_MAJOR >= 55
598 av_frame_free(&encoder->sinkFrame);
599#else
600 avcodec_free_frame(&encoder->sinkFrame);
601#endif
602 encoder->sinkFrame = NULL;
603 }
604
605 if (encoder->video) {
606#ifdef FFMPEG_USE_CODECPAR
607 avcodec_free_context(&encoder->video);
608#else
609 avcodec_close(encoder->video);
610 encoder->video = NULL;
611#endif
612 }
613
614 if (encoder->scaleContext) {
615 sws_freeContext(encoder->scaleContext);
616 encoder->scaleContext = NULL;
617 }
618
619 if (encoder->graph) {
620 avfilter_graph_free(&encoder->graph);
621 encoder->graph = NULL;
622 encoder->source = NULL;
623 encoder->sink = NULL;
624
625 int i;
626 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
627 encoder->filters[i] = NULL;
628 }
629 }
630
631 if (encoder->context) {
632 avformat_free_context(encoder->context);
633 encoder->context = NULL;
634 }
635}
636
637bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
638 return !!encoder->context;
639}
640
641void _ffmpegPostAudioFrame(struct mAVStream* stream, int16_t left, int16_t right) {
642 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
643 if (!encoder->context || !encoder->audioCodec) {
644 return;
645 }
646
647 if (encoder->absf && !left) {
648 // XXX: AVBSF doesn't like silence. Figure out why.
649 left = 1;
650 }
651
652 encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
653 encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;
654
655 ++encoder->currentAudioSample;
656
657 if (encoder->currentAudioSample * 4 < encoder->audioBufferSize) {
658 return;
659 }
660
661 int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
662 encoder->currentAudioSample = 0;
663#ifdef USE_LIBAVRESAMPLE
664 avresample_convert(encoder->resampleContext, 0, 0, 0,
665 (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);
666
667 if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
668 return;
669 }
670#if LIBAVCODEC_VERSION_MAJOR >= 55
671 av_frame_make_writable(encoder->audioFrame);
672#endif
673 int samples = avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);
674#else
675#if LIBAVCODEC_VERSION_MAJOR >= 55
676 av_frame_make_writable(encoder->audioFrame);
677#endif
678 if (swr_get_out_samples(encoder->resampleContext, 1) < encoder->audioFrame->nb_samples) {
679 swr_convert(encoder->resampleContext, NULL, 0, (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
680 return;
681 }
682 int samples = swr_convert(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize,
683 (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
684#endif
685
686 encoder->audioFrame->pts = encoder->currentAudioFrame;
687 encoder->currentAudioFrame += samples;
688
689 _ffmpegWriteAudioFrame(encoder, encoder->audioFrame);
690}
691
692bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame) {
693 AVPacket packet;
694 av_init_packet(&packet);
695 packet.data = 0;
696 packet.size = 0;
697
698 int gotData;
699#ifdef FFMPEG_USE_PACKETS
700 avcodec_send_frame(encoder->audio, audioFrame);
701 gotData = avcodec_receive_packet(encoder->audio, &packet);
702 gotData = (gotData == 0) && packet.size;
703#else
704 avcodec_encode_audio2(encoder->audio, &packet, audioFrame, &gotData);
705#endif
706 packet.pts = av_rescale_q(packet.pts, encoder->audio->time_base, encoder->audioStream->time_base);
707 packet.dts = packet.pts;
708
709 if (gotData) {
710 if (encoder->absf) {
711 AVPacket tempPacket;
712
713#ifdef FFMPEG_USE_NEW_BSF
714 int success = av_bsf_send_packet(encoder->absf, &packet);
715 if (success >= 0) {
716 success = av_bsf_receive_packet(encoder->absf, &tempPacket);
717 }
718#else
719 int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
720 &tempPacket.data, &tempPacket.size,
721 packet.data, packet.size, 0);
722#endif
723
724 if (success >= 0) {
725#if LIBAVUTIL_VERSION_MAJOR >= 53
726 tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
727#endif
728
729#ifdef FFMPEG_USE_PACKET_UNREF
730 av_packet_move_ref(&packet, &tempPacket);
731#else
732 av_free_packet(&packet);
733 packet = tempPacket;
734#endif
735
736 packet.stream_index = encoder->audioStream->index;
737 av_interleaved_write_frame(encoder->context, &packet);
738 }
739 } else {
740 packet.stream_index = encoder->audioStream->index;
741 av_interleaved_write_frame(encoder->context, &packet);
742 }
743 }
744#ifdef FFMPEG_USE_PACKET_UNREF
745 av_packet_unref(&packet);
746#else
747 av_free_packet(&packet);
748#endif
749 return gotData;
750}
751
752void _ffmpegPostVideoFrame(struct mAVStream* stream, const color_t* pixels, size_t stride) {
753 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
754 if (!encoder->context || !encoder->videoCodec) {
755 return;
756 }
757 encoder->skipResidue = (encoder->skipResidue + 1) % encoder->frameskip;
758 if (encoder->skipResidue) {
759 return;
760 }
761 stride *= BYTES_PER_PIXEL;
762
763#if LIBAVCODEC_VERSION_MAJOR >= 55
764 av_frame_make_writable(encoder->videoFrame);
765#endif
766 if (encoder->video->codec->id == AV_CODEC_ID_WEBP) {
767 // TODO: Figure out why WebP is rescaling internally (should video frames not be rescaled externally?)
768 encoder->videoFrame->pts = encoder->currentVideoFrame;
769 } else {
770 encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
771 }
772 ++encoder->currentVideoFrame;
773
774 sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, encoder->iheight, encoder->videoFrame->data, encoder->videoFrame->linesize);
775
776 if (encoder->graph) {
777 if (av_buffersrc_add_frame(encoder->source, encoder->videoFrame) < 0) {
778 return;
779 }
780 while (true) {
781 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
782 if (res < 0) {
783 break;
784 }
785 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
786 av_frame_unref(encoder->sinkFrame);
787 }
788 } else {
789 _ffmpegWriteVideoFrame(encoder, encoder->videoFrame);
790 }
791}
792
793bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame) {
794 AVPacket packet;
795
796 av_init_packet(&packet);
797 packet.data = 0;
798 packet.size = 0;
799
800 int gotData;
801#ifdef FFMPEG_USE_PACKETS
802 avcodec_send_frame(encoder->video, videoFrame);
803 gotData = avcodec_receive_packet(encoder->video, &packet) == 0;
804#else
805 avcodec_encode_video2(encoder->video, &packet, videoFrame, &gotData);
806#endif
807 if (gotData) {
808#ifndef FFMPEG_USE_PACKET_UNREF
809 if (encoder->video->coded_frame->key_frame) {
810 packet.flags |= AV_PKT_FLAG_KEY;
811 }
812#endif
813 packet.stream_index = encoder->videoStream->index;
814 av_interleaved_write_frame(encoder->context, &packet);
815 }
816#ifdef FFMPEG_USE_PACKET_UNREF
817 av_packet_unref(&packet);
818#else
819 av_free_packet(&packet);
820#endif
821
822 return gotData;
823}
824
825static void _ffmpegSetVideoDimensions(struct mAVStream* stream, unsigned width, unsigned height) {
826 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
827 if (!encoder->context || !encoder->videoCodec) {
828 return;
829 }
830 encoder->iwidth = width;
831 encoder->iheight = height;
832 if (encoder->scaleContext) {
833 sws_freeContext(encoder->scaleContext);
834 }
835 encoder->scaleContext = sws_getContext(encoder->iwidth, encoder->iheight, encoder->ipixFormat,
836 encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format,
837 SWS_POINT, 0, 0, 0);
838}
839
840void FFmpegEncoderSetInputFrameRate(struct FFmpegEncoder* encoder, int numerator, int denominator) {
841 reduceFraction(&numerator, &denominator);
842 encoder->frameCycles = numerator;
843 encoder->cycles = denominator;
844 if (encoder->video) {
845 encoder->video->framerate = (AVRational) { denominator, numerator * encoder->frameskip };
846 }
847}