src/feature/ffmpeg/ffmpeg-encoder.c (view raw)
1/* Copyright (c) 2013-2015 Jeffrey Pfau
2 *
3 * This Source Code Form is subject to the terms of the Mozilla Public
4 * License, v. 2.0. If a copy of the MPL was not distributed with this
5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include "ffmpeg-encoder.h"
7
8#include <mgba/core/core.h>
9#include <mgba/gba/interface.h>
10#include <mgba/internal/gba/gba.h>
11#include <mgba-util/math.h>
12
13#include <libavcodec/version.h>
14#include <libavcodec/avcodec.h>
15
16#include <libavfilter/buffersink.h>
17#include <libavfilter/buffersrc.h>
18
19#include <libavutil/version.h>
20#if LIBAVUTIL_VERSION_MAJOR >= 53
21#include <libavutil/buffer.h>
22#endif
23#include <libavutil/imgutils.h>
24#include <libavutil/mathematics.h>
25#include <libavutil/opt.h>
26
27#ifdef USE_LIBAVRESAMPLE
28#include <libavresample/avresample.h>
29#else
30#include <libswresample/swresample.h>
31#endif
32#include <libswscale/swscale.h>
33
34static void _ffmpegPostVideoFrame(struct mAVStream*, const color_t* pixels, size_t stride);
35static void _ffmpegPostAudioFrame(struct mAVStream*, int16_t left, int16_t right);
36static void _ffmpegSetVideoDimensions(struct mAVStream*, unsigned width, unsigned height);
37
38static bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame);
39static bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame);
40
enum {
	// Sample rate (Hz) configured as the resampler's input rate: 32768
	PREFERRED_SAMPLE_RATE = 1 << 15
};
44
45void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
46#if LIBAVFORMAT_VERSION_INT < AV_VERSION_INT(58, 9, 100)
47 av_register_all();
48#endif
49
50 encoder->d.videoDimensionsChanged = _ffmpegSetVideoDimensions;
51 encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
52 encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
53 encoder->d.postAudioBuffer = 0;
54
55 encoder->audioCodec = NULL;
56 encoder->videoCodec = NULL;
57 encoder->containerFormat = NULL;
58 FFmpegEncoderSetAudio(encoder, "flac", 0);
59 FFmpegEncoderSetVideo(encoder, "libx264", 0, 0);
60 FFmpegEncoderSetContainer(encoder, "matroska");
61 FFmpegEncoderSetDimensions(encoder, GBA_VIDEO_HORIZONTAL_PIXELS, GBA_VIDEO_VERTICAL_PIXELS);
62 encoder->iwidth = GBA_VIDEO_HORIZONTAL_PIXELS;
63 encoder->iheight = GBA_VIDEO_VERTICAL_PIXELS;
64 encoder->frameskip = 1;
65 encoder->skipResidue = 0;
66 encoder->loop = false;
67 encoder->ipixFormat =
68#ifdef COLOR_16_BIT
69#ifdef COLOR_5_6_5
70 AV_PIX_FMT_RGB565;
71#else
72 AV_PIX_FMT_BGR555;
73#endif
74#else
75#ifndef USE_LIBAV
76 AV_PIX_FMT_0BGR32;
77#else
78 AV_PIX_FMT_BGR32;
79#endif
80#endif
81 encoder->resampleContext = NULL;
82 encoder->absf = NULL;
83 encoder->context = NULL;
84 encoder->scaleContext = NULL;
85 encoder->audio = NULL;
86 encoder->audioStream = NULL;
87 encoder->audioFrame = NULL;
88 encoder->audioBuffer = NULL;
89 encoder->postaudioBuffer = NULL;
90 encoder->video = NULL;
91 encoder->videoStream = NULL;
92 encoder->videoFrame = NULL;
93 encoder->graph = NULL;
94 encoder->source = NULL;
95 encoder->sink = NULL;
96 encoder->sinkFrame = NULL;
97 FFmpegEncoderSetInputFrameRate(encoder, VIDEO_TOTAL_LENGTH, GBA_ARM7TDMI_FREQUENCY);
98
99 int i;
100 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
101 encoder->filters[i] = NULL;
102 }
103}
104
105bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
106 static const struct {
107 int format;
108 int priority;
109 } priorities[] = {
110 { AV_SAMPLE_FMT_S16, 0 },
111 { AV_SAMPLE_FMT_S16P, 1 },
112 { AV_SAMPLE_FMT_S32, 2 },
113 { AV_SAMPLE_FMT_S32P, 2 },
114 { AV_SAMPLE_FMT_FLT, 3 },
115 { AV_SAMPLE_FMT_FLTP, 3 },
116 { AV_SAMPLE_FMT_DBL, 4 },
117 { AV_SAMPLE_FMT_DBLP, 4 }
118 };
119
120 if (!acodec) {
121 encoder->audioCodec = 0;
122 return true;
123 }
124
125 AVCodec* codec = avcodec_find_encoder_by_name(acodec);
126 if (!codec) {
127 return false;
128 }
129
130 if (!codec->sample_fmts) {
131 return false;
132 }
133 size_t i;
134 size_t j;
135 int priority = INT_MAX;
136 encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
137 for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
138 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
139 if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
140 priority = priorities[j].priority;
141 encoder->sampleFormat = codec->sample_fmts[i];
142 }
143 }
144 }
145 if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
146 return false;
147 }
148 encoder->sampleRate = PREFERRED_SAMPLE_RATE;
149 if (codec->supported_samplerates) {
150 for (i = 0; codec->supported_samplerates[i]; ++i) {
151 if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
152 continue;
153 }
154 if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
155 encoder->sampleRate = codec->supported_samplerates[i];
156 }
157 }
158 } else if (codec->id == AV_CODEC_ID_AAC) {
159 // HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
160 encoder->sampleRate = 44100;
161 }
162 encoder->audioCodec = acodec;
163 encoder->audioBitrate = abr;
164 return true;
165}
166
167bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, int vbr, int frameskip) {
168 static const struct {
169 enum AVPixelFormat format;
170 int priority;
171 } priorities[] = {
172 { AV_PIX_FMT_RGB555, 0 },
173 { AV_PIX_FMT_BGR555, 0 },
174 { AV_PIX_FMT_RGB565, 1 },
175 { AV_PIX_FMT_BGR565, 1 },
176 { AV_PIX_FMT_RGB24, 2 },
177 { AV_PIX_FMT_BGR24, 2 },
178#ifndef USE_LIBAV
179 { AV_PIX_FMT_BGR0, 3 },
180 { AV_PIX_FMT_RGB0, 3 },
181 { AV_PIX_FMT_0BGR, 3 },
182 { AV_PIX_FMT_0RGB, 3 },
183#endif
184 { AV_PIX_FMT_RGB32, 4},
185 { AV_PIX_FMT_BGR32, 4},
186 { AV_PIX_FMT_YUV444P, 5 },
187 { AV_PIX_FMT_YUV422P, 6 },
188 { AV_PIX_FMT_YUV420P, 7 },
189 { AV_PIX_FMT_PAL8, 8 },
190 };
191
192 if (!vcodec) {
193 encoder->videoCodec = 0;
194 return true;
195 }
196
197 AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
198 if (!codec) {
199 return false;
200 }
201
202 size_t i;
203 size_t j;
204 int priority = INT_MAX;
205 encoder->pixFormat = AV_PIX_FMT_NONE;
206 for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
207 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
208 if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
209 priority = priorities[j].priority;
210 encoder->pixFormat = codec->pix_fmts[i];
211 }
212 }
213 }
214 if (encoder->pixFormat == AV_PIX_FMT_NONE) {
215 return false;
216 }
217 if (vbr < 0 && !av_opt_find(&codec->priv_class, "crf", NULL, 0, 0)) {
218 return false;
219 }
220 encoder->videoCodec = vcodec;
221 encoder->videoBitrate = vbr;
222 encoder->frameskip = frameskip + 1;
223 return true;
224}
225
226bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
227 AVOutputFormat* oformat = av_guess_format(container, 0, 0);
228 if (!oformat) {
229 return false;
230 }
231 encoder->containerFormat = container;
232 return true;
233}
234
235void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
236 encoder->width = width > 0 ? width : GBA_VIDEO_HORIZONTAL_PIXELS;
237 encoder->height = height > 0 ? height : GBA_VIDEO_VERTICAL_PIXELS;
238}
239
240void FFmpegEncoderSetLooping(struct FFmpegEncoder* encoder, bool loop) {
241 encoder->loop = loop;
242}
243
244bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
245 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
246 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
247 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
248 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !oformat || (!acodec && !vcodec)) {
249 return false;
250 }
251 if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
252 return false;
253 }
254 if (encoder->videoCodec && !avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
255 return false;
256 }
257 return true;
258}
259
260bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
261 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
262 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
263 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !FFmpegEncoderVerifyContainer(encoder)) {
264 return false;
265 }
266
267 if (encoder->context) {
268 return false;
269 }
270
271 encoder->currentAudioSample = 0;
272 encoder->currentAudioFrame = 0;
273 encoder->currentVideoFrame = 0;
274 encoder->skipResidue = 0;
275
276 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
277#ifndef USE_LIBAV
278 avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
279#else
280 encoder->context = avformat_alloc_context();
281 strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename) - 1);
282 encoder->context->filename[sizeof(encoder->context->filename) - 1] = '\0';
283 encoder->context->oformat = oformat;
284#endif
285
286 if (acodec) {
287#ifdef FFMPEG_USE_CODECPAR
288 encoder->audioStream = avformat_new_stream(encoder->context, NULL);
289 encoder->audio = avcodec_alloc_context3(acodec);
290#else
291 encoder->audioStream = avformat_new_stream(encoder->context, acodec);
292 encoder->audio = encoder->audioStream->codec;
293#endif
294 encoder->audio->bit_rate = encoder->audioBitrate;
295 encoder->audio->channels = 2;
296 encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
297 encoder->audio->sample_rate = encoder->sampleRate;
298 encoder->audio->sample_fmt = encoder->sampleFormat;
299 AVDictionary* opts = 0;
300 av_dict_set(&opts, "strict", "-2", 0);
301 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
302#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
303 encoder->audio->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
304#else
305 encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
306#endif
307 }
308 int res = avcodec_open2(encoder->audio, acodec, &opts);
309 av_dict_free(&opts);
310 if (res < 0) {
311 FFmpegEncoderClose(encoder);
312 return false;
313 }
314#if LIBAVCODEC_VERSION_MAJOR >= 55
315 encoder->audioFrame = av_frame_alloc();
316#else
317 encoder->audioFrame = avcodec_alloc_frame();
318#endif
319 if (!encoder->audio->frame_size) {
320 encoder->audio->frame_size = 1;
321 }
322 encoder->audioFrame->nb_samples = encoder->audio->frame_size;
323 encoder->audioFrame->format = encoder->audio->sample_fmt;
324 encoder->audioFrame->pts = 0;
325#ifdef USE_LIBAVRESAMPLE
326 encoder->resampleContext = avresample_alloc_context();
327 av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
328 av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
329 av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
330 av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
331 av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
332 av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
333 avresample_open(encoder->resampleContext);
334#else
335 encoder->resampleContext = swr_alloc_set_opts(NULL, AV_CH_LAYOUT_STEREO, encoder->sampleFormat, encoder->sampleRate,
336 AV_CH_LAYOUT_STEREO, AV_SAMPLE_FMT_S16, PREFERRED_SAMPLE_RATE, 0, NULL);
337 swr_init(encoder->resampleContext);
338#endif
339 encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
340 encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
341 encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
342 encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
343 avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
344
345 if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
346 (strcasecmp(encoder->containerFormat, "mp4") ||
347 strcasecmp(encoder->containerFormat, "m4v") ||
348 strcasecmp(encoder->containerFormat, "mov"))) {
349 // MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
350#ifdef FFMPEG_USE_NEW_BSF
351 av_bsf_alloc(av_bsf_get_by_name("aac_adtstoasc"), &encoder->absf);
352 avcodec_parameters_from_context(encoder->absf->par_in, encoder->audio);
353 av_bsf_init(encoder->absf);
354#else
355 encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
356#endif
357 }
358#ifdef FFMPEG_USE_CODECPAR
359 avcodec_parameters_from_context(encoder->audioStream->codecpar, encoder->audio);
360#endif
361 }
362
363 if (vcodec) {
364#ifdef FFMPEG_USE_CODECPAR
365 encoder->videoStream = avformat_new_stream(encoder->context, NULL);
366 encoder->video = avcodec_alloc_context3(vcodec);
367#else
368 encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
369 encoder->video = encoder->videoStream->codec;
370#endif
371 encoder->video->bit_rate = encoder->videoBitrate;
372 encoder->video->width = encoder->width;
373 encoder->video->height = encoder->height;
374 encoder->video->time_base = (AVRational) { encoder->frameCycles * encoder->frameskip, encoder->cycles };
375 encoder->video->framerate = (AVRational) { encoder->cycles, encoder->frameCycles * encoder->frameskip };
376 encoder->videoStream->time_base = encoder->video->time_base;
377 encoder->videoStream->avg_frame_rate = encoder->video->framerate;
378 encoder->video->pix_fmt = encoder->pixFormat;
379 encoder->video->gop_size = 60;
380 encoder->video->max_b_frames = 3;
381 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
382#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
383 encoder->video->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
384#else
385 encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
386#endif
387 }
388
389 if (encoder->video->codec->id == AV_CODEC_ID_H264 &&
390 (strcasecmp(encoder->containerFormat, "mp4") ||
391 strcasecmp(encoder->containerFormat, "m4v") ||
392 strcasecmp(encoder->containerFormat, "mov"))) {
393 // QuickTime and a few other things require YUV420
394 encoder->video->pix_fmt = AV_PIX_FMT_YUV420P;
395 }
396 if (encoder->video->codec->id == AV_CODEC_ID_FFV1) {
397#if LIBAVCODEC_VERSION_MAJOR >= 57
398 av_opt_set(encoder->video->priv_data, "coder", "range_tab", 0);
399 av_opt_set_int(encoder->video->priv_data, "context", 1, 0);
400#endif
401 encoder->video->gop_size = 128;
402 encoder->video->level = 3;
403 }
404
405 if (encoder->video->codec->id == AV_CODEC_ID_PNG) {
406 encoder->video->compression_level = 8;
407 }
408#if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(58, 48, 100)
409 if (encoder->video->codec->id == AV_CODEC_ID_ZMBV) {
410 encoder->video->compression_level = 5;
411 encoder->video->pix_fmt = AV_PIX_FMT_BGR0;
412 }
413#endif
414 if (strcmp(vcodec->name, "libx264") == 0 || strcmp(vcodec->name, "libx264rgb") == 0) {
415 // Try to adaptively figure out when you can use a slower encoder
416 if (encoder->width * encoder->height > 1000000) {
417 av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
418 } else if (encoder->width * encoder->height > 500000) {
419 av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
420 } else {
421 av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
422 }
423 av_opt_set(encoder->video->priv_data, "tune", "zerolatency", 0);
424 if (encoder->videoBitrate == 0) {
425 av_opt_set(encoder->video->priv_data, "qp", "0", 0);
426 if (strcmp(vcodec->name, "libx264") == 0) {
427 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
428 }
429 } else if (encoder->videoBitrate < 0) {
430 av_opt_set_int(encoder->video->priv_data, "crf", -encoder->videoBitrate, 0);
431 }
432 } else if (encoder->videoBitrate < 0) {
433 if (strcmp(vcodec->name, "libvpx") == 0 || strcmp(vcodec->name, "libvpx-vp9") == 0 || strcmp(vcodec->name, "libx265") == 0) {
434 av_opt_set_int(encoder->video->priv_data, "crf", -encoder->videoBitrate, 0);
435 } else {
436 FFmpegEncoderClose(encoder);
437 return false;
438 }
439 }
440 if (strncmp(vcodec->name, "libvpx", 6) == 0) {
441 av_opt_set_int(encoder->video->priv_data, "cpu-used", 2, 0);
442 av_opt_set(encoder->video->priv_data, "deadline", "realtime", 0);
443 }
444 if (strcmp(vcodec->name, "libvpx-vp9") == 0 && encoder->videoBitrate == 0) {
445 av_opt_set_int(encoder->video->priv_data, "lossless", 1, 0);
446 av_opt_set_int(encoder->video->priv_data, "crf", 0, 0);
447 encoder->video->gop_size = 120;
448 encoder->video->pix_fmt = AV_PIX_FMT_GBRP;
449 }
450 if (strcmp(vcodec->name, "libwebp_anim") == 0 && encoder->videoBitrate == 0) {
451 av_opt_set(encoder->video->priv_data, "lossless", "1", 0);
452 encoder->video->pix_fmt = AV_PIX_FMT_RGB32;
453 }
454
455 if (encoder->pixFormat == AV_PIX_FMT_PAL8) {
456 encoder->graph = avfilter_graph_alloc();
457
458 const struct AVFilter* source = avfilter_get_by_name("buffer");
459 const struct AVFilter* sink = avfilter_get_by_name("buffersink");
460 const struct AVFilter* split = avfilter_get_by_name("split");
461 const struct AVFilter* palettegen = avfilter_get_by_name("palettegen");
462 const struct AVFilter* paletteuse = avfilter_get_by_name("paletteuse");
463
464 if (!source || !sink || !split || !palettegen || !paletteuse || !encoder->graph) {
465 FFmpegEncoderClose(encoder);
466 return false;
467 }
468
469 char args[256];
470 snprintf(args, sizeof(args), "video_size=%dx%d:pix_fmt=%d:time_base=%d/%d",
471 encoder->video->width, encoder->video->height, encoder->ipixFormat,
472 encoder->video->time_base.num, encoder->video->time_base.den);
473
474 int res = 0;
475 res |= avfilter_graph_create_filter(&encoder->source, source, NULL, args, NULL, encoder->graph);
476 res |= avfilter_graph_create_filter(&encoder->sink, sink, NULL, NULL, NULL, encoder->graph);
477 res |= avfilter_graph_create_filter(&encoder->filters[0], split, NULL, NULL, NULL, encoder->graph);
478 res |= avfilter_graph_create_filter(&encoder->filters[1], palettegen, NULL, "reserve_transparent=off", NULL, encoder->graph);
479 res |= avfilter_graph_create_filter(&encoder->filters[2], paletteuse, NULL, "dither=none", NULL, encoder->graph);
480 if (res < 0) {
481 FFmpegEncoderClose(encoder);
482 return false;
483 }
484
485 res = 0;
486 res |= avfilter_link(encoder->source, 0, encoder->filters[0], 0);
487 res |= avfilter_link(encoder->filters[0], 0, encoder->filters[1], 0);
488 res |= avfilter_link(encoder->filters[0], 1, encoder->filters[2], 0);
489 res |= avfilter_link(encoder->filters[1], 0, encoder->filters[2], 1);
490 res |= avfilter_link(encoder->filters[2], 0, encoder->sink, 0);
491 if (res < 0 || avfilter_graph_config(encoder->graph, NULL) < 0) {
492 FFmpegEncoderClose(encoder);
493 return false;
494 }
495
496#if LIBAVCODEC_VERSION_MAJOR >= 55
497 encoder->sinkFrame = av_frame_alloc();
498#else
499 encoder->sinkFrame = avcodec_alloc_frame();
500#endif
501 }
502 AVDictionary* opts = 0;
503 av_dict_set(&opts, "strict", "-2", 0);
504 int res = avcodec_open2(encoder->video, vcodec, &opts);
505 av_dict_free(&opts);
506 if (res < 0) {
507 FFmpegEncoderClose(encoder);
508 return false;
509 }
510#if LIBAVCODEC_VERSION_MAJOR >= 55
511 encoder->videoFrame = av_frame_alloc();
512#else
513 encoder->videoFrame = avcodec_alloc_frame();
514#endif
515 encoder->videoFrame->format = encoder->video->pix_fmt != AV_PIX_FMT_PAL8 ? encoder->video->pix_fmt : encoder->ipixFormat;
516 encoder->videoFrame->width = encoder->video->width;
517 encoder->videoFrame->height = encoder->video->height;
518 encoder->videoFrame->pts = 0;
519 _ffmpegSetVideoDimensions(&encoder->d, encoder->iwidth, encoder->iheight);
520 av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format, 32);
521#ifdef FFMPEG_USE_CODECPAR
522 avcodec_parameters_from_context(encoder->videoStream->codecpar, encoder->video);
523#endif
524 }
525
526 if (strcmp(encoder->containerFormat, "gif") == 0) {
527 av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "-1", 0);
528 } else if (strcmp(encoder->containerFormat, "apng") == 0) {
529 av_opt_set(encoder->context->priv_data, "plays", encoder->loop ? "0" : "1", 0);
530 } else if (strcmp(encoder->containerFormat, "webp") == 0) {
531 av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "1", 0);
532 }
533
534 AVDictionary* opts = 0;
535 av_dict_set(&opts, "strict", "-2", 0);
536 bool res = avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE) < 0 || avformat_write_header(encoder->context, &opts) < 0;
537 av_dict_free(&opts);
538 if (res) {
539 FFmpegEncoderClose(encoder);
540 return false;
541 }
542 return true;
543}
544
545void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
546 if (encoder->audio) {
547 while (true) {
548 if (!_ffmpegWriteAudioFrame(encoder, NULL)) {
549 break;
550 }
551 }
552 }
553 if (encoder->video) {
554 if (encoder->graph) {
555 if (av_buffersrc_add_frame(encoder->source, NULL) >= 0) {
556 while (true) {
557 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
558 if (res < 0) {
559 break;
560 }
561 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
562 av_frame_unref(encoder->sinkFrame);
563 }
564 }
565 }
566 while (true) {
567 if (!_ffmpegWriteVideoFrame(encoder, NULL)) {
568 break;
569 }
570 }
571 }
572
573 if (encoder->context && encoder->context->pb) {
574 av_write_trailer(encoder->context);
575 avio_close(encoder->context->pb);
576 }
577
578 if (encoder->postaudioBuffer) {
579 av_free(encoder->postaudioBuffer);
580 encoder->postaudioBuffer = NULL;
581 }
582 if (encoder->audioBuffer) {
583 av_free(encoder->audioBuffer);
584 encoder->audioBuffer = NULL;
585 }
586
587 if (encoder->audioFrame) {
588#if LIBAVCODEC_VERSION_MAJOR >= 55
589 av_frame_free(&encoder->audioFrame);
590#else
591 avcodec_free_frame(&encoder->audioFrame);
592#endif
593 }
594 if (encoder->audio) {
595#ifdef FFMPEG_USE_CODECPAR
596 avcodec_free_context(&encoder->audio);
597#else
598 avcodec_close(encoder->audio);
599 encoder->audio = NULL;
600#endif
601 }
602
603 if (encoder->resampleContext) {
604#ifdef USE_LIBAVRESAMPLE
605 avresample_close(encoder->resampleContext);
606 encoder->resampleContext = NULL;
607#else
608 swr_free(&encoder->resampleContext);
609#endif
610 }
611
612 if (encoder->absf) {
613#ifdef FFMPEG_USE_NEW_BSF
614 av_bsf_free(&encoder->absf);
615#else
616 av_bitstream_filter_close(encoder->absf);
617 encoder->absf = NULL;
618#endif
619 }
620
621 if (encoder->videoFrame) {
622 av_freep(encoder->videoFrame->data);
623#if LIBAVCODEC_VERSION_MAJOR >= 55
624 av_frame_free(&encoder->videoFrame);
625#else
626 avcodec_free_frame(&encoder->videoFrame);
627#endif
628 }
629
630 if (encoder->sinkFrame) {
631#if LIBAVCODEC_VERSION_MAJOR >= 55
632 av_frame_free(&encoder->sinkFrame);
633#else
634 avcodec_free_frame(&encoder->sinkFrame);
635#endif
636 encoder->sinkFrame = NULL;
637 }
638
639 if (encoder->video) {
640#ifdef FFMPEG_USE_CODECPAR
641 avcodec_free_context(&encoder->video);
642#else
643 avcodec_close(encoder->video);
644 encoder->video = NULL;
645#endif
646 }
647
648 if (encoder->scaleContext) {
649 sws_freeContext(encoder->scaleContext);
650 encoder->scaleContext = NULL;
651 }
652
653 if (encoder->graph) {
654 avfilter_graph_free(&encoder->graph);
655 encoder->graph = NULL;
656 encoder->source = NULL;
657 encoder->sink = NULL;
658
659 int i;
660 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
661 encoder->filters[i] = NULL;
662 }
663 }
664
665 if (encoder->context) {
666 avformat_free_context(encoder->context);
667 encoder->context = NULL;
668 }
669}
670
671bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
672 return !!encoder->context;
673}
674
675void _ffmpegPostAudioFrame(struct mAVStream* stream, int16_t left, int16_t right) {
676 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
677 if (!encoder->context || !encoder->audioCodec) {
678 return;
679 }
680
681 if (encoder->absf && !left) {
682 // XXX: AVBSF doesn't like silence. Figure out why.
683 left = 1;
684 }
685
686 encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
687 encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;
688
689 ++encoder->currentAudioSample;
690
691 if (encoder->currentAudioSample * 4 < encoder->audioBufferSize) {
692 return;
693 }
694
695 int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
696 encoder->currentAudioSample = 0;
697#ifdef USE_LIBAVRESAMPLE
698 avresample_convert(encoder->resampleContext, 0, 0, 0,
699 (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);
700
701 if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
702 return;
703 }
704#if LIBAVCODEC_VERSION_MAJOR >= 55
705 av_frame_make_writable(encoder->audioFrame);
706#endif
707 int samples = avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);
708#else
709#if LIBAVCODEC_VERSION_MAJOR >= 55
710 av_frame_make_writable(encoder->audioFrame);
711#endif
712 if (swr_get_out_samples(encoder->resampleContext, 1) < encoder->audioFrame->nb_samples) {
713 swr_convert(encoder->resampleContext, NULL, 0, (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
714 return;
715 }
716 int samples = swr_convert(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize,
717 (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
718#endif
719
720 encoder->audioFrame->pts = encoder->currentAudioFrame;
721 encoder->currentAudioFrame += samples;
722
723 _ffmpegWriteAudioFrame(encoder, encoder->audioFrame);
724}
725
726bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame) {
727 AVPacket packet;
728 av_init_packet(&packet);
729 packet.data = 0;
730 packet.size = 0;
731
732 int gotData;
733#ifdef FFMPEG_USE_PACKETS
734 avcodec_send_frame(encoder->audio, audioFrame);
735 gotData = avcodec_receive_packet(encoder->audio, &packet);
736 gotData = (gotData == 0) && packet.size;
737#else
738 avcodec_encode_audio2(encoder->audio, &packet, audioFrame, &gotData);
739#endif
740 packet.pts = av_rescale_q(packet.pts, encoder->audio->time_base, encoder->audioStream->time_base);
741 packet.dts = packet.pts;
742
743 if (gotData) {
744 if (encoder->absf) {
745 AVPacket tempPacket;
746
747#ifdef FFMPEG_USE_NEW_BSF
748 int success = av_bsf_send_packet(encoder->absf, &packet);
749 if (success >= 0) {
750 success = av_bsf_receive_packet(encoder->absf, &tempPacket);
751 }
752#else
753 int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
754 &tempPacket.data, &tempPacket.size,
755 packet.data, packet.size, 0);
756#endif
757
758 if (success >= 0) {
759#if LIBAVUTIL_VERSION_MAJOR >= 53
760 tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
761#endif
762
763#ifdef FFMPEG_USE_PACKET_UNREF
764 av_packet_move_ref(&packet, &tempPacket);
765#else
766 av_free_packet(&packet);
767 packet = tempPacket;
768#endif
769
770 packet.stream_index = encoder->audioStream->index;
771 av_interleaved_write_frame(encoder->context, &packet);
772 }
773 } else {
774 packet.stream_index = encoder->audioStream->index;
775 av_interleaved_write_frame(encoder->context, &packet);
776 }
777 }
778#ifdef FFMPEG_USE_PACKET_UNREF
779 av_packet_unref(&packet);
780#else
781 av_free_packet(&packet);
782#endif
783 return gotData;
784}
785
786void _ffmpegPostVideoFrame(struct mAVStream* stream, const color_t* pixels, size_t stride) {
787 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
788 if (!encoder->context || !encoder->videoCodec) {
789 return;
790 }
791 encoder->skipResidue = (encoder->skipResidue + 1) % encoder->frameskip;
792 if (encoder->skipResidue) {
793 return;
794 }
795 stride *= BYTES_PER_PIXEL;
796
797#if LIBAVCODEC_VERSION_MAJOR >= 55
798 av_frame_make_writable(encoder->videoFrame);
799#endif
800 if (encoder->video->codec->id == AV_CODEC_ID_WEBP) {
801 // TODO: Figure out why WebP is rescaling internally (should video frames not be rescaled externally?)
802 encoder->videoFrame->pts = encoder->currentVideoFrame;
803 } else {
804 encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
805 }
806 ++encoder->currentVideoFrame;
807
808 sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, encoder->iheight, encoder->videoFrame->data, encoder->videoFrame->linesize);
809
810 if (encoder->graph) {
811 if (av_buffersrc_add_frame(encoder->source, encoder->videoFrame) < 0) {
812 return;
813 }
814 while (true) {
815 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
816 if (res < 0) {
817 break;
818 }
819 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
820 av_frame_unref(encoder->sinkFrame);
821 }
822 } else {
823 _ffmpegWriteVideoFrame(encoder, encoder->videoFrame);
824 }
825}
826
827bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame) {
828 AVPacket packet;
829
830 av_init_packet(&packet);
831 packet.data = 0;
832 packet.size = 0;
833
834 int gotData;
835#ifdef FFMPEG_USE_PACKETS
836 avcodec_send_frame(encoder->video, videoFrame);
837 gotData = avcodec_receive_packet(encoder->video, &packet) == 0;
838#else
839 avcodec_encode_video2(encoder->video, &packet, videoFrame, &gotData);
840#endif
841 if (gotData) {
842#ifndef FFMPEG_USE_PACKET_UNREF
843 if (encoder->video->coded_frame->key_frame) {
844 packet.flags |= AV_PKT_FLAG_KEY;
845 }
846#endif
847 packet.stream_index = encoder->videoStream->index;
848 av_interleaved_write_frame(encoder->context, &packet);
849 }
850#ifdef FFMPEG_USE_PACKET_UNREF
851 av_packet_unref(&packet);
852#else
853 av_free_packet(&packet);
854#endif
855
856 return gotData;
857}
858
859static void _ffmpegSetVideoDimensions(struct mAVStream* stream, unsigned width, unsigned height) {
860 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
861 if (!encoder->context || !encoder->videoCodec) {
862 return;
863 }
864 encoder->iwidth = width;
865 encoder->iheight = height;
866 if (encoder->scaleContext) {
867 sws_freeContext(encoder->scaleContext);
868 }
869 encoder->scaleContext = sws_getContext(encoder->iwidth, encoder->iheight, encoder->ipixFormat,
870 encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format,
871 SWS_POINT, 0, 0, 0);
872}
873
874void FFmpegEncoderSetInputFrameRate(struct FFmpegEncoder* encoder, int numerator, int denominator) {
875 reduceFraction(&numerator, &denominator);
876 encoder->frameCycles = numerator;
877 encoder->cycles = denominator;
878 if (encoder->video) {
879 encoder->video->framerate = (AVRational) { denominator, numerator * encoder->frameskip };
880 }
881}