src/feature/ffmpeg/ffmpeg-encoder.c (view raw)
1/* Copyright (c) 2013-2015 Jeffrey Pfau
2 *
3 * This Source Code Form is subject to the terms of the Mozilla Public
4 * License, v. 2.0. If a copy of the MPL was not distributed with this
5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include "ffmpeg-encoder.h"
7
8#include <mgba/core/core.h>
9#include <mgba/gba/interface.h>
10
11#include <libavcodec/version.h>
12#include <libavcodec/avcodec.h>
13
14#include <libavfilter/buffersink.h>
15#include <libavfilter/buffersrc.h>
16
17#include <libavutil/version.h>
18#if LIBAVUTIL_VERSION_MAJOR >= 53
19#include <libavutil/buffer.h>
20#endif
21#include <libavutil/imgutils.h>
22#include <libavutil/mathematics.h>
23#include <libavutil/opt.h>
24
25#ifdef USE_LIBAVRESAMPLE
26#include <libavresample/avresample.h>
27#else
28#include <libswresample/swresample.h>
29#endif
30#include <libswscale/swscale.h>
31
32static void _ffmpegPostVideoFrame(struct mAVStream*, const color_t* pixels, size_t stride);
33static void _ffmpegPostAudioFrame(struct mAVStream*, int16_t left, int16_t right);
34static void _ffmpegSetVideoDimensions(struct mAVStream*, unsigned width, unsigned height);
35
36static bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame);
37static bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame);
38
// Sample rate, in Hz, used as the resampler's input rate and as the preferred encoder rate
enum {
	PREFERRED_SAMPLE_RATE = 32768 // 0x8000
};
42
43void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
44#if LIBAVFORMAT_VERSION_INT < AV_VERSION_INT(58, 9, 100)
45 av_register_all();
46#endif
47
48 encoder->d.videoDimensionsChanged = _ffmpegSetVideoDimensions;
49 encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
50 encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
51 encoder->d.postAudioBuffer = 0;
52
53 encoder->audioCodec = NULL;
54 encoder->videoCodec = NULL;
55 encoder->containerFormat = NULL;
56 FFmpegEncoderSetAudio(encoder, "flac", 0);
57 FFmpegEncoderSetVideo(encoder, "libx264", 0, 0);
58 FFmpegEncoderSetContainer(encoder, "matroska");
59 FFmpegEncoderSetDimensions(encoder, GBA_VIDEO_HORIZONTAL_PIXELS, GBA_VIDEO_VERTICAL_PIXELS);
60 encoder->iwidth = GBA_VIDEO_HORIZONTAL_PIXELS;
61 encoder->iheight = GBA_VIDEO_VERTICAL_PIXELS;
62 encoder->frameskip = 1;
63 encoder->skipResidue = 0;
64 encoder->loop = false;
65 encoder->ipixFormat =
66#ifdef COLOR_16_BIT
67#ifdef COLOR_5_6_5
68 AV_PIX_FMT_RGB565;
69#else
70 AV_PIX_FMT_BGR555;
71#endif
72#else
73#ifndef USE_LIBAV
74 AV_PIX_FMT_0BGR32;
75#else
76 AV_PIX_FMT_BGR32;
77#endif
78#endif
79 encoder->resampleContext = NULL;
80 encoder->absf = NULL;
81 encoder->context = NULL;
82 encoder->scaleContext = NULL;
83 encoder->audio = NULL;
84 encoder->audioStream = NULL;
85 encoder->audioFrame = NULL;
86 encoder->audioBuffer = NULL;
87 encoder->postaudioBuffer = NULL;
88 encoder->video = NULL;
89 encoder->videoStream = NULL;
90 encoder->videoFrame = NULL;
91 encoder->graph = NULL;
92 encoder->source = NULL;
93 encoder->sink = NULL;
94 encoder->sinkFrame = NULL;
95
96 int i;
97 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
98 encoder->filters[i] = NULL;
99 }
100}
101
102bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
103 static const struct {
104 int format;
105 int priority;
106 } priorities[] = {
107 { AV_SAMPLE_FMT_S16, 0 },
108 { AV_SAMPLE_FMT_S16P, 1 },
109 { AV_SAMPLE_FMT_S32, 2 },
110 { AV_SAMPLE_FMT_S32P, 2 },
111 { AV_SAMPLE_FMT_FLT, 3 },
112 { AV_SAMPLE_FMT_FLTP, 3 },
113 { AV_SAMPLE_FMT_DBL, 4 },
114 { AV_SAMPLE_FMT_DBLP, 4 }
115 };
116
117 if (!acodec) {
118 encoder->audioCodec = 0;
119 return true;
120 }
121
122 AVCodec* codec = avcodec_find_encoder_by_name(acodec);
123 if (!codec) {
124 return false;
125 }
126
127 if (!codec->sample_fmts) {
128 return false;
129 }
130 size_t i;
131 size_t j;
132 int priority = INT_MAX;
133 encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
134 for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
135 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
136 if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
137 priority = priorities[j].priority;
138 encoder->sampleFormat = codec->sample_fmts[i];
139 }
140 }
141 }
142 if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
143 return false;
144 }
145 encoder->sampleRate = PREFERRED_SAMPLE_RATE;
146 if (codec->supported_samplerates) {
147 for (i = 0; codec->supported_samplerates[i]; ++i) {
148 if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
149 continue;
150 }
151 if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
152 encoder->sampleRate = codec->supported_samplerates[i];
153 }
154 }
155 } else if (codec->id == AV_CODEC_ID_AAC) {
156 // HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
157 encoder->sampleRate = 44100;
158 }
159 encoder->audioCodec = acodec;
160 encoder->audioBitrate = abr;
161 return true;
162}
163
164bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, unsigned vbr, int frameskip) {
165 static const struct {
166 enum AVPixelFormat format;
167 int priority;
168 } priorities[] = {
169 { AV_PIX_FMT_RGB555, 0 },
170 { AV_PIX_FMT_BGR555, 0 },
171 { AV_PIX_FMT_RGB565, 1 },
172 { AV_PIX_FMT_BGR565, 1 },
173 { AV_PIX_FMT_RGB24, 2 },
174 { AV_PIX_FMT_BGR24, 2 },
175#ifndef USE_LIBAV
176 { AV_PIX_FMT_BGR0, 3 },
177 { AV_PIX_FMT_RGB0, 3 },
178 { AV_PIX_FMT_0BGR, 3 },
179 { AV_PIX_FMT_0RGB, 3 },
180#endif
181 { AV_PIX_FMT_YUV422P, 4 },
182 { AV_PIX_FMT_YUV444P, 5 },
183 { AV_PIX_FMT_YUV420P, 6 },
184 { AV_PIX_FMT_PAL8, 7 },
185 };
186
187 if (!vcodec) {
188 encoder->videoCodec = 0;
189 return true;
190 }
191
192 AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
193 if (!codec) {
194 return false;
195 }
196
197 size_t i;
198 size_t j;
199 int priority = INT_MAX;
200 encoder->pixFormat = AV_PIX_FMT_NONE;
201 for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
202 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
203 if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
204 priority = priorities[j].priority;
205 encoder->pixFormat = codec->pix_fmts[i];
206 }
207 }
208 }
209 if (encoder->pixFormat == AV_PIX_FMT_NONE) {
210 return false;
211 }
212 encoder->videoCodec = vcodec;
213 encoder->videoBitrate = vbr;
214 encoder->frameskip = frameskip + 1;
215 return true;
216}
217
218bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
219 AVOutputFormat* oformat = av_guess_format(container, 0, 0);
220 if (!oformat) {
221 return false;
222 }
223 encoder->containerFormat = container;
224 return true;
225}
226
227void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
228 encoder->width = width > 0 ? width : GBA_VIDEO_HORIZONTAL_PIXELS;
229 encoder->height = height > 0 ? height : GBA_VIDEO_VERTICAL_PIXELS;
230}
231
232void FFmpegEncoderSetLooping(struct FFmpegEncoder* encoder, bool loop) {
233 encoder->loop = loop;
234}
235
236bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
237 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
238 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
239 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
240 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !oformat || (!acodec && !vcodec)) {
241 return false;
242 }
243 if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
244 return false;
245 }
246 if (encoder->videoCodec && !avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
247 return false;
248 }
249 return true;
250}
251
252bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
253 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
254 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
255 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !FFmpegEncoderVerifyContainer(encoder)) {
256 return false;
257 }
258
259 if (encoder->context) {
260 return false;
261 }
262
263 encoder->currentAudioSample = 0;
264 encoder->currentAudioFrame = 0;
265 encoder->currentVideoFrame = 0;
266 encoder->skipResidue = 0;
267
268 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
269#ifndef USE_LIBAV
270 avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
271#else
272 encoder->context = avformat_alloc_context();
273 strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename) - 1);
274 encoder->context->filename[sizeof(encoder->context->filename) - 1] = '\0';
275 encoder->context->oformat = oformat;
276#endif
277
278 if (acodec) {
279#ifdef FFMPEG_USE_CODECPAR
280 encoder->audioStream = avformat_new_stream(encoder->context, NULL);
281 encoder->audio = avcodec_alloc_context3(acodec);
282#else
283 encoder->audioStream = avformat_new_stream(encoder->context, acodec);
284 encoder->audio = encoder->audioStream->codec;
285#endif
286 encoder->audio->bit_rate = encoder->audioBitrate;
287 encoder->audio->channels = 2;
288 encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
289 encoder->audio->sample_rate = encoder->sampleRate;
290 encoder->audio->sample_fmt = encoder->sampleFormat;
291 AVDictionary* opts = 0;
292 av_dict_set(&opts, "strict", "-2", 0);
293 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
294#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
295 encoder->audio->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
296#else
297 encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
298#endif
299 }
300 int res = avcodec_open2(encoder->audio, acodec, &opts);
301 av_dict_free(&opts);
302 if (res < 0) {
303 FFmpegEncoderClose(encoder);
304 return false;
305 }
306#if LIBAVCODEC_VERSION_MAJOR >= 55
307 encoder->audioFrame = av_frame_alloc();
308#else
309 encoder->audioFrame = avcodec_alloc_frame();
310#endif
311 if (!encoder->audio->frame_size) {
312 encoder->audio->frame_size = 1;
313 }
314 encoder->audioFrame->nb_samples = encoder->audio->frame_size;
315 encoder->audioFrame->format = encoder->audio->sample_fmt;
316 encoder->audioFrame->pts = 0;
317#ifdef USE_LIBAVRESAMPLE
318 encoder->resampleContext = avresample_alloc_context();
319 av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
320 av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
321 av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
322 av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
323 av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
324 av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
325 avresample_open(encoder->resampleContext);
326#else
327 encoder->resampleContext = swr_alloc_set_opts(NULL, AV_CH_LAYOUT_STEREO, encoder->sampleFormat, encoder->sampleRate,
328 AV_CH_LAYOUT_STEREO, AV_SAMPLE_FMT_S16, PREFERRED_SAMPLE_RATE, 0, NULL);
329 swr_init(encoder->resampleContext);
330#endif
331 encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
332 encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
333 encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
334 encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
335 avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
336
337 if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
338 (strcasecmp(encoder->containerFormat, "mp4") ||
339 strcasecmp(encoder->containerFormat, "m4v") ||
340 strcasecmp(encoder->containerFormat, "mov"))) {
341 // MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
342#ifdef FFMPEG_USE_NEW_BSF
343 av_bsf_alloc(av_bsf_get_by_name("aac_adtstoasc"), &encoder->absf);
344 avcodec_parameters_from_context(encoder->absf->par_in, encoder->audio);
345 av_bsf_init(encoder->absf);
346#else
347 encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
348#endif
349 }
350#ifdef FFMPEG_USE_CODECPAR
351 avcodec_parameters_from_context(encoder->audioStream->codecpar, encoder->audio);
352#endif
353 }
354
355 if (vcodec) {
356#ifdef FFMPEG_USE_CODECPAR
357 encoder->videoStream = avformat_new_stream(encoder->context, NULL);
358 encoder->video = avcodec_alloc_context3(vcodec);
359#else
360 encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
361 encoder->video = encoder->videoStream->codec;
362#endif
363 encoder->video->bit_rate = encoder->videoBitrate;
364 encoder->video->width = encoder->width;
365 encoder->video->height = encoder->height;
366 encoder->video->time_base = (AVRational) { VIDEO_TOTAL_LENGTH * encoder->frameskip, GBA_ARM7TDMI_FREQUENCY };
367 encoder->video->framerate = (AVRational) { GBA_ARM7TDMI_FREQUENCY, VIDEO_TOTAL_LENGTH * encoder->frameskip };
368 encoder->video->pix_fmt = encoder->pixFormat;
369 encoder->video->gop_size = 60;
370 encoder->video->max_b_frames = 3;
371 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
372#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
373 encoder->video->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
374#else
375 encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
376#endif
377 }
378
379 if (encoder->video->codec->id == AV_CODEC_ID_H264 &&
380 (strcasecmp(encoder->containerFormat, "mp4") ||
381 strcasecmp(encoder->containerFormat, "m4v") ||
382 strcasecmp(encoder->containerFormat, "mov"))) {
383 // QuickTime and a few other things require YUV420
384 encoder->video->pix_fmt = AV_PIX_FMT_YUV420P;
385 }
386#if LIBAVCODEC_VERSION_MAJOR >= 57
387 if (encoder->video->codec->id == AV_CODEC_ID_FFV1) {
388 av_opt_set(encoder->video->priv_data, "coder", "range_tab", 0);
389 }
390#endif
391
392 if (strcmp(vcodec->name, "libx264") == 0) {
393 // Try to adaptively figure out when you can use a slower encoder
394 if (encoder->width * encoder->height > 1000000) {
395 av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
396 } else if (encoder->width * encoder->height > 500000) {
397 av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
398 } else {
399 av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
400 }
401 if (encoder->videoBitrate == 0) {
402 av_opt_set(encoder->video->priv_data, "crf", "0", 0);
403 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
404 }
405 }
406 if (strcmp(vcodec->name, "libvpx-vp9") == 0 && encoder->videoBitrate == 0) {
407 av_opt_set(encoder->video->priv_data, "lossless", "1", 0);
408 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
409 }
410
411 if (encoder->pixFormat == AV_PIX_FMT_PAL8) {
412 encoder->graph = avfilter_graph_alloc();
413
414 const struct AVFilter* source = avfilter_get_by_name("buffer");
415 const struct AVFilter* sink = avfilter_get_by_name("buffersink");
416 const struct AVFilter* split = avfilter_get_by_name("split");
417 const struct AVFilter* palettegen = avfilter_get_by_name("palettegen");
418 const struct AVFilter* paletteuse = avfilter_get_by_name("paletteuse");
419
420 if (!source || !sink || !split || !palettegen || !paletteuse || !encoder->graph) {
421 FFmpegEncoderClose(encoder);
422 return false;
423 }
424
425 char args[256];
426 snprintf(args, sizeof(args), "video_size=%dx%d:pix_fmt=%d:time_base=%d/%d",
427 encoder->video->width, encoder->video->height, encoder->ipixFormat,
428 encoder->video->time_base.num, encoder->video->time_base.den);
429
430 int res = 0;
431 res |= avfilter_graph_create_filter(&encoder->source, source, NULL, args, NULL, encoder->graph);
432 res |= avfilter_graph_create_filter(&encoder->sink, sink, NULL, NULL, NULL, encoder->graph);
433 res |= avfilter_graph_create_filter(&encoder->filters[0], split, NULL, NULL, NULL, encoder->graph);
434 res |= avfilter_graph_create_filter(&encoder->filters[1], palettegen, NULL, "reserve_transparent=off", NULL, encoder->graph);
435 res |= avfilter_graph_create_filter(&encoder->filters[2], paletteuse, NULL, "dither=none", NULL, encoder->graph);
436 if (res < 0) {
437 FFmpegEncoderClose(encoder);
438 return false;
439 }
440
441 res = 0;
442 res |= avfilter_link(encoder->source, 0, encoder->filters[0], 0);
443 res |= avfilter_link(encoder->filters[0], 0, encoder->filters[1], 0);
444 res |= avfilter_link(encoder->filters[0], 1, encoder->filters[2], 0);
445 res |= avfilter_link(encoder->filters[1], 0, encoder->filters[2], 1);
446 res |= avfilter_link(encoder->filters[2], 0, encoder->sink, 0);
447 if (res < 0 || avfilter_graph_config(encoder->graph, NULL) < 0) {
448 FFmpegEncoderClose(encoder);
449 return false;
450 }
451
452#if LIBAVCODEC_VERSION_MAJOR >= 55
453 encoder->sinkFrame = av_frame_alloc();
454#else
455 encoder->sinkFrame = avcodec_alloc_frame();
456#endif
457 }
458 AVDictionary* opts = 0;
459 av_dict_set(&opts, "strict", "-2", 0);
460 int res = avcodec_open2(encoder->video, vcodec, &opts);
461 av_dict_free(&opts);
462 if (res < 0) {
463 FFmpegEncoderClose(encoder);
464 return false;
465 }
466#if LIBAVCODEC_VERSION_MAJOR >= 55
467 encoder->videoFrame = av_frame_alloc();
468#else
469 encoder->videoFrame = avcodec_alloc_frame();
470#endif
471 encoder->videoFrame->format = encoder->video->pix_fmt != AV_PIX_FMT_PAL8 ? encoder->video->pix_fmt : encoder->ipixFormat;
472 encoder->videoFrame->width = encoder->video->width;
473 encoder->videoFrame->height = encoder->video->height;
474 encoder->videoFrame->pts = 0;
475 _ffmpegSetVideoDimensions(&encoder->d, encoder->iwidth, encoder->iheight);
476 av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format, 32);
477#ifdef FFMPEG_USE_CODECPAR
478 avcodec_parameters_from_context(encoder->videoStream->codecpar, encoder->video);
479#endif
480 }
481
482 if (strcmp(encoder->containerFormat, "gif") == 0) {
483 av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "-1", 0);
484 } else if (strcmp(encoder->containerFormat, "apng") == 0) {
485 av_opt_set(encoder->context->priv_data, "plays", encoder->loop ? "0" : "1", 0);
486 }
487
488 AVDictionary* opts = 0;
489 av_dict_set(&opts, "strict", "-2", 0);
490 bool res = avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE) < 0 || avformat_write_header(encoder->context, &opts) < 0;
491 av_dict_free(&opts);
492 if (res) {
493 FFmpegEncoderClose(encoder);
494 return false;
495 }
496 return true;
497}
498
499void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
500 if (encoder->audio) {
501 while (true) {
502 if (!_ffmpegWriteAudioFrame(encoder, NULL)) {
503 break;
504 }
505 }
506 }
507 if (encoder->video) {
508 if (encoder->graph) {
509 if (av_buffersrc_add_frame(encoder->source, NULL) >= 0) {
510 while (true) {
511 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
512 if (res < 0) {
513 break;
514 }
515 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
516 av_frame_unref(encoder->sinkFrame);
517 }
518 }
519 }
520 while (true) {
521 if (!_ffmpegWriteVideoFrame(encoder, NULL)) {
522 break;
523 }
524 }
525 }
526
527 if (encoder->context && encoder->context->pb) {
528 av_write_trailer(encoder->context);
529 avio_close(encoder->context->pb);
530 }
531
532 if (encoder->postaudioBuffer) {
533 av_free(encoder->postaudioBuffer);
534 encoder->postaudioBuffer = NULL;
535 }
536 if (encoder->audioBuffer) {
537 av_free(encoder->audioBuffer);
538 encoder->audioBuffer = NULL;
539 }
540
541 if (encoder->audioFrame) {
542#if LIBAVCODEC_VERSION_MAJOR >= 55
543 av_frame_free(&encoder->audioFrame);
544#else
545 avcodec_free_frame(&encoder->audioFrame);
546#endif
547 }
548 if (encoder->audio) {
549 avcodec_close(encoder->audio);
550 encoder->audio = NULL;
551 }
552
553 if (encoder->resampleContext) {
554#ifdef USE_LIBAVRESAMPLE
555 avresample_close(encoder->resampleContext);
556 encoder->resampleContext = NULL;
557#else
558 swr_free(&encoder->resampleContext);
559#endif
560 }
561
562 if (encoder->absf) {
563#ifdef FFMPEG_USE_NEW_BSF
564 av_bsf_free(&encoder->absf);
565#else
566 av_bitstream_filter_close(encoder->absf);
567 encoder->absf = NULL;
568#endif
569 }
570
571 if (encoder->videoFrame) {
572#if LIBAVCODEC_VERSION_MAJOR >= 55
573 av_frame_free(&encoder->videoFrame);
574#else
575 avcodec_free_frame(&encoder->videoFrame);
576#endif
577 }
578
579 if (encoder->sinkFrame) {
580#if LIBAVCODEC_VERSION_MAJOR >= 55
581 av_frame_free(&encoder->sinkFrame);
582#else
583 avcodec_free_frame(&encoder->sinkFrame);
584#endif
585 encoder->sinkFrame = NULL;
586 }
587
588 if (encoder->video) {
589 avcodec_close(encoder->video);
590 encoder->video = NULL;
591 }
592
593 if (encoder->scaleContext) {
594 sws_freeContext(encoder->scaleContext);
595 encoder->scaleContext = NULL;
596 }
597
598 if (encoder->graph) {
599 avfilter_graph_free(&encoder->graph);
600 encoder->graph = NULL;
601 encoder->source = NULL;
602 encoder->sink = NULL;
603
604 int i;
605 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
606 encoder->filters[i] = NULL;
607 }
608 }
609
610 if (encoder->context) {
611 avformat_free_context(encoder->context);
612 encoder->context = NULL;
613 }
614}
615
616bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
617 return !!encoder->context;
618}
619
620void _ffmpegPostAudioFrame(struct mAVStream* stream, int16_t left, int16_t right) {
621 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
622 if (!encoder->context || !encoder->audioCodec) {
623 return;
624 }
625
626 if (encoder->absf && !left) {
627 // XXX: AVBSF doesn't like silence. Figure out why.
628 left = 1;
629 }
630
631 encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
632 encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;
633
634 ++encoder->currentAudioSample;
635
636 if (encoder->currentAudioSample * 4 < encoder->audioBufferSize) {
637 return;
638 }
639
640 int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
641 encoder->currentAudioSample = 0;
642#ifdef USE_LIBAVRESAMPLE
643 avresample_convert(encoder->resampleContext, 0, 0, 0,
644 (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);
645
646 if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
647 return;
648 }
649#if LIBAVCODEC_VERSION_MAJOR >= 55
650 av_frame_make_writable(encoder->audioFrame);
651#endif
652 int samples = avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);
653#else
654#if LIBAVCODEC_VERSION_MAJOR >= 55
655 av_frame_make_writable(encoder->audioFrame);
656#endif
657 if (swr_get_out_samples(encoder->resampleContext, 1) < encoder->audioFrame->nb_samples) {
658 swr_convert(encoder->resampleContext, NULL, 0, (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
659 return;
660 }
661 int samples = swr_convert(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize,
662 (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
663#endif
664
665 encoder->audioFrame->pts = encoder->currentAudioFrame;
666 encoder->currentAudioFrame += samples;
667
668 _ffmpegWriteAudioFrame(encoder, encoder->audioFrame);
669}
670
671bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame) {
672 AVPacket packet;
673 av_init_packet(&packet);
674 packet.data = 0;
675 packet.size = 0;
676
677 int gotData;
678#ifdef FFMPEG_USE_PACKETS
679 avcodec_send_frame(encoder->audio, audioFrame);
680 gotData = avcodec_receive_packet(encoder->audio, &packet);
681 gotData = (gotData == 0) && packet.size;
682#else
683 avcodec_encode_audio2(encoder->audio, &packet, audioFrame, &gotData);
684#endif
685 packet.pts = av_rescale_q(packet.pts, encoder->audio->time_base, encoder->audioStream->time_base);
686 packet.dts = packet.pts;
687
688 if (gotData) {
689 if (encoder->absf) {
690 AVPacket tempPacket;
691
692#ifdef FFMPEG_USE_NEW_BSF
693 int success = av_bsf_send_packet(encoder->absf, &packet);
694 if (success >= 0) {
695 success = av_bsf_receive_packet(encoder->absf, &tempPacket);
696 }
697#else
698 int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
699 &tempPacket.data, &tempPacket.size,
700 packet.data, packet.size, 0);
701#endif
702
703 if (success >= 0) {
704#if LIBAVUTIL_VERSION_MAJOR >= 53
705 tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
706#endif
707
708#ifdef FFMPEG_USE_PACKET_UNREF
709 av_packet_move_ref(&packet, &tempPacket);
710#else
711 av_free_packet(&packet);
712 packet = tempPacket;
713#endif
714
715 packet.stream_index = encoder->audioStream->index;
716 av_interleaved_write_frame(encoder->context, &packet);
717 }
718 } else {
719 packet.stream_index = encoder->audioStream->index;
720 av_interleaved_write_frame(encoder->context, &packet);
721 }
722 }
723#ifdef FFMPEG_USE_PACKET_UNREF
724 av_packet_unref(&packet);
725#else
726 av_free_packet(&packet);
727#endif
728 return gotData;
729}
730
731void _ffmpegPostVideoFrame(struct mAVStream* stream, const color_t* pixels, size_t stride) {
732 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
733 if (!encoder->context || !encoder->videoCodec) {
734 return;
735 }
736 encoder->skipResidue = (encoder->skipResidue + 1) % encoder->frameskip;
737 if (encoder->skipResidue) {
738 return;
739 }
740 stride *= BYTES_PER_PIXEL;
741
742#if LIBAVCODEC_VERSION_MAJOR >= 55
743 av_frame_make_writable(encoder->videoFrame);
744#endif
745 encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
746 ++encoder->currentVideoFrame;
747
748 sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, encoder->iheight, encoder->videoFrame->data, encoder->videoFrame->linesize);
749
750 if (encoder->graph) {
751 if (av_buffersrc_add_frame(encoder->source, encoder->videoFrame) < 0) {
752 return;
753 }
754 while (true) {
755 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
756 if (res < 0) {
757 break;
758 }
759 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
760 av_frame_unref(encoder->sinkFrame);
761 }
762 } else {
763 _ffmpegWriteVideoFrame(encoder, encoder->videoFrame);
764 }
765}
766
767bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame) {
768 AVPacket packet;
769
770 av_init_packet(&packet);
771 packet.data = 0;
772 packet.size = 0;
773
774 int gotData;
775#ifdef FFMPEG_USE_PACKETS
776 avcodec_send_frame(encoder->video, videoFrame);
777 gotData = avcodec_receive_packet(encoder->video, &packet) == 0;
778#else
779 avcodec_encode_video2(encoder->video, &packet, videoFrame, &gotData);
780#endif
781 if (gotData) {
782#ifndef FFMPEG_USE_PACKET_UNREF
783 if (encoder->video->coded_frame->key_frame) {
784 packet.flags |= AV_PKT_FLAG_KEY;
785 }
786#endif
787 packet.stream_index = encoder->videoStream->index;
788 av_interleaved_write_frame(encoder->context, &packet);
789 }
790#ifdef FFMPEG_USE_PACKET_UNREF
791 av_packet_unref(&packet);
792#else
793 av_free_packet(&packet);
794#endif
795
796 return gotData;
797}
798
799static void _ffmpegSetVideoDimensions(struct mAVStream* stream, unsigned width, unsigned height) {
800 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
801 if (!encoder->context || !encoder->videoCodec) {
802 return;
803 }
804 encoder->iwidth = width;
805 encoder->iheight = height;
806 if (encoder->scaleContext) {
807 sws_freeContext(encoder->scaleContext);
808 }
809 encoder->scaleContext = sws_getContext(encoder->iwidth, encoder->iheight, encoder->ipixFormat,
810 encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format,
811 SWS_POINT, 0, 0, 0);
812}