src/feature/ffmpeg/ffmpeg-encoder.c (view raw)
1/* Copyright (c) 2013-2015 Jeffrey Pfau
2 *
3 * This Source Code Form is subject to the terms of the Mozilla Public
4 * License, v. 2.0. If a copy of the MPL was not distributed with this
5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include "ffmpeg-encoder.h"
7
8#include <mgba/core/core.h>
9#include <mgba/gba/interface.h>
10
11#include <libavcodec/version.h>
12#include <libavcodec/avcodec.h>
13
14#include <libavfilter/buffersink.h>
15#include <libavfilter/buffersrc.h>
16
17#include <libavutil/version.h>
18#if LIBAVUTIL_VERSION_MAJOR >= 53
19#include <libavutil/buffer.h>
20#endif
21#include <libavutil/imgutils.h>
22#include <libavutil/mathematics.h>
23#include <libavutil/opt.h>
24
25#ifdef USE_LIBAVRESAMPLE
26#include <libavresample/avresample.h>
27#else
28#include <libswresample/swresample.h>
29#endif
30#include <libswscale/swscale.h>
31
32static void _ffmpegPostVideoFrame(struct mAVStream*, const color_t* pixels, size_t stride);
33static void _ffmpegPostAudioFrame(struct mAVStream*, int16_t left, int16_t right);
34static void _ffmpegSetVideoDimensions(struct mAVStream*, unsigned width, unsigned height);
35static void _ffmpegSetVideoFrameRate(struct mAVStream*, unsigned numerator, unsigned denominator);
36
37static bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame);
38static bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame);
39
// Sample rate (Hz) of the audio handed to the resampler; also the rate the
// encoder output tries to match when the codec allows it.
enum { PREFERRED_SAMPLE_RATE = 32768 };
43
44void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
45#if LIBAVFORMAT_VERSION_INT < AV_VERSION_INT(58, 9, 100)
46 av_register_all();
47#endif
48
49 encoder->d.videoDimensionsChanged = _ffmpegSetVideoDimensions;
50 encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
51 encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
52 encoder->d.postAudioBuffer = 0;
53 encoder->d.videoFrameRateChanged = _ffmpegSetVideoFrameRate;
54
55 encoder->audioCodec = NULL;
56 encoder->videoCodec = NULL;
57 encoder->containerFormat = NULL;
58 FFmpegEncoderSetAudio(encoder, "flac", 0);
59 FFmpegEncoderSetVideo(encoder, "libx264", 0, 0);
60 FFmpegEncoderSetContainer(encoder, "matroska");
61 FFmpegEncoderSetDimensions(encoder, GBA_VIDEO_HORIZONTAL_PIXELS, GBA_VIDEO_VERTICAL_PIXELS);
62 encoder->iwidth = GBA_VIDEO_HORIZONTAL_PIXELS;
63 encoder->iheight = GBA_VIDEO_VERTICAL_PIXELS;
64 encoder->frameCycles = VIDEO_TOTAL_LENGTH;
65 encoder->cycles = GBA_ARM7TDMI_FREQUENCY;
66 encoder->frameskip = 1;
67 encoder->skipResidue = 0;
68 encoder->loop = false;
69 encoder->ipixFormat =
70#ifdef COLOR_16_BIT
71#ifdef COLOR_5_6_5
72 AV_PIX_FMT_RGB565;
73#else
74 AV_PIX_FMT_BGR555;
75#endif
76#else
77#ifndef USE_LIBAV
78 AV_PIX_FMT_0BGR32;
79#else
80 AV_PIX_FMT_BGR32;
81#endif
82#endif
83 encoder->resampleContext = NULL;
84 encoder->absf = NULL;
85 encoder->context = NULL;
86 encoder->scaleContext = NULL;
87 encoder->audio = NULL;
88 encoder->audioStream = NULL;
89 encoder->audioFrame = NULL;
90 encoder->audioBuffer = NULL;
91 encoder->postaudioBuffer = NULL;
92 encoder->video = NULL;
93 encoder->videoStream = NULL;
94 encoder->videoFrame = NULL;
95 encoder->graph = NULL;
96 encoder->source = NULL;
97 encoder->sink = NULL;
98 encoder->sinkFrame = NULL;
99
100 int i;
101 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
102 encoder->filters[i] = NULL;
103 }
104}
105
106bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
107 static const struct {
108 int format;
109 int priority;
110 } priorities[] = {
111 { AV_SAMPLE_FMT_S16, 0 },
112 { AV_SAMPLE_FMT_S16P, 1 },
113 { AV_SAMPLE_FMT_S32, 2 },
114 { AV_SAMPLE_FMT_S32P, 2 },
115 { AV_SAMPLE_FMT_FLT, 3 },
116 { AV_SAMPLE_FMT_FLTP, 3 },
117 { AV_SAMPLE_FMT_DBL, 4 },
118 { AV_SAMPLE_FMT_DBLP, 4 }
119 };
120
121 if (!acodec) {
122 encoder->audioCodec = 0;
123 return true;
124 }
125
126 AVCodec* codec = avcodec_find_encoder_by_name(acodec);
127 if (!codec) {
128 return false;
129 }
130
131 if (!codec->sample_fmts) {
132 return false;
133 }
134 size_t i;
135 size_t j;
136 int priority = INT_MAX;
137 encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
138 for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
139 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
140 if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
141 priority = priorities[j].priority;
142 encoder->sampleFormat = codec->sample_fmts[i];
143 }
144 }
145 }
146 if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
147 return false;
148 }
149 encoder->sampleRate = PREFERRED_SAMPLE_RATE;
150 if (codec->supported_samplerates) {
151 for (i = 0; codec->supported_samplerates[i]; ++i) {
152 if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
153 continue;
154 }
155 if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
156 encoder->sampleRate = codec->supported_samplerates[i];
157 }
158 }
159 } else if (codec->id == AV_CODEC_ID_AAC) {
160 // HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
161 encoder->sampleRate = 44100;
162 }
163 encoder->audioCodec = acodec;
164 encoder->audioBitrate = abr;
165 return true;
166}
167
168bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, unsigned vbr, int frameskip) {
169 static const struct {
170 enum AVPixelFormat format;
171 int priority;
172 } priorities[] = {
173 { AV_PIX_FMT_RGB555, 0 },
174 { AV_PIX_FMT_BGR555, 0 },
175 { AV_PIX_FMT_RGB565, 1 },
176 { AV_PIX_FMT_BGR565, 1 },
177 { AV_PIX_FMT_RGB24, 2 },
178 { AV_PIX_FMT_BGR24, 2 },
179#ifndef USE_LIBAV
180 { AV_PIX_FMT_BGR0, 3 },
181 { AV_PIX_FMT_RGB0, 3 },
182 { AV_PIX_FMT_0BGR, 3 },
183 { AV_PIX_FMT_0RGB, 3 },
184#endif
185 { AV_PIX_FMT_YUV422P, 4 },
186 { AV_PIX_FMT_YUV444P, 5 },
187 { AV_PIX_FMT_YUV420P, 6 },
188 { AV_PIX_FMT_PAL8, 7 },
189 };
190
191 if (!vcodec) {
192 encoder->videoCodec = 0;
193 return true;
194 }
195
196 AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
197 if (!codec) {
198 return false;
199 }
200
201 size_t i;
202 size_t j;
203 int priority = INT_MAX;
204 encoder->pixFormat = AV_PIX_FMT_NONE;
205 for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
206 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
207 if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
208 priority = priorities[j].priority;
209 encoder->pixFormat = codec->pix_fmts[i];
210 }
211 }
212 }
213 if (encoder->pixFormat == AV_PIX_FMT_NONE) {
214 return false;
215 }
216 encoder->videoCodec = vcodec;
217 encoder->videoBitrate = vbr;
218 encoder->frameskip = frameskip + 1;
219 return true;
220}
221
222bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
223 AVOutputFormat* oformat = av_guess_format(container, 0, 0);
224 if (!oformat) {
225 return false;
226 }
227 encoder->containerFormat = container;
228 return true;
229}
230
231void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
232 encoder->width = width > 0 ? width : GBA_VIDEO_HORIZONTAL_PIXELS;
233 encoder->height = height > 0 ? height : GBA_VIDEO_VERTICAL_PIXELS;
234}
235
236void FFmpegEncoderSetLooping(struct FFmpegEncoder* encoder, bool loop) {
237 encoder->loop = loop;
238}
239
240bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
241 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
242 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
243 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
244 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !oformat || (!acodec && !vcodec)) {
245 return false;
246 }
247 if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
248 return false;
249 }
250 if (encoder->videoCodec && !avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
251 return false;
252 }
253 return true;
254}
255
256bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
257 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
258 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
259 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !FFmpegEncoderVerifyContainer(encoder)) {
260 return false;
261 }
262
263 if (encoder->context) {
264 return false;
265 }
266
267 encoder->currentAudioSample = 0;
268 encoder->currentAudioFrame = 0;
269 encoder->currentVideoFrame = 0;
270 encoder->skipResidue = 0;
271
272 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
273#ifndef USE_LIBAV
274 avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
275#else
276 encoder->context = avformat_alloc_context();
277 strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename) - 1);
278 encoder->context->filename[sizeof(encoder->context->filename) - 1] = '\0';
279 encoder->context->oformat = oformat;
280#endif
281
282 if (acodec) {
283#ifdef FFMPEG_USE_CODECPAR
284 encoder->audioStream = avformat_new_stream(encoder->context, NULL);
285 encoder->audio = avcodec_alloc_context3(acodec);
286#else
287 encoder->audioStream = avformat_new_stream(encoder->context, acodec);
288 encoder->audio = encoder->audioStream->codec;
289#endif
290 encoder->audio->bit_rate = encoder->audioBitrate;
291 encoder->audio->channels = 2;
292 encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
293 encoder->audio->sample_rate = encoder->sampleRate;
294 encoder->audio->sample_fmt = encoder->sampleFormat;
295 AVDictionary* opts = 0;
296 av_dict_set(&opts, "strict", "-2", 0);
297 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
298#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
299 encoder->audio->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
300#else
301 encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
302#endif
303 }
304 int res = avcodec_open2(encoder->audio, acodec, &opts);
305 av_dict_free(&opts);
306 if (res < 0) {
307 FFmpegEncoderClose(encoder);
308 return false;
309 }
310#if LIBAVCODEC_VERSION_MAJOR >= 55
311 encoder->audioFrame = av_frame_alloc();
312#else
313 encoder->audioFrame = avcodec_alloc_frame();
314#endif
315 if (!encoder->audio->frame_size) {
316 encoder->audio->frame_size = 1;
317 }
318 encoder->audioFrame->nb_samples = encoder->audio->frame_size;
319 encoder->audioFrame->format = encoder->audio->sample_fmt;
320 encoder->audioFrame->pts = 0;
321#ifdef USE_LIBAVRESAMPLE
322 encoder->resampleContext = avresample_alloc_context();
323 av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
324 av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
325 av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
326 av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
327 av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
328 av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
329 avresample_open(encoder->resampleContext);
330#else
331 encoder->resampleContext = swr_alloc_set_opts(NULL, AV_CH_LAYOUT_STEREO, encoder->sampleFormat, encoder->sampleRate,
332 AV_CH_LAYOUT_STEREO, AV_SAMPLE_FMT_S16, PREFERRED_SAMPLE_RATE, 0, NULL);
333 swr_init(encoder->resampleContext);
334#endif
335 encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
336 encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
337 encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
338 encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
339 avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
340
341 if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
342 (strcasecmp(encoder->containerFormat, "mp4") ||
343 strcasecmp(encoder->containerFormat, "m4v") ||
344 strcasecmp(encoder->containerFormat, "mov"))) {
345 // MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
346#ifdef FFMPEG_USE_NEW_BSF
347 av_bsf_alloc(av_bsf_get_by_name("aac_adtstoasc"), &encoder->absf);
348 avcodec_parameters_from_context(encoder->absf->par_in, encoder->audio);
349 av_bsf_init(encoder->absf);
350#else
351 encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
352#endif
353 }
354#ifdef FFMPEG_USE_CODECPAR
355 avcodec_parameters_from_context(encoder->audioStream->codecpar, encoder->audio);
356#endif
357 }
358
359 if (vcodec) {
360#ifdef FFMPEG_USE_CODECPAR
361 encoder->videoStream = avformat_new_stream(encoder->context, NULL);
362 encoder->video = avcodec_alloc_context3(vcodec);
363#else
364 encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
365 encoder->video = encoder->videoStream->codec;
366#endif
367 encoder->video->bit_rate = encoder->videoBitrate;
368 encoder->video->width = encoder->width;
369 encoder->video->height = encoder->height;
370 encoder->video->time_base = (AVRational) { encoder->frameCycles * encoder->frameskip, encoder->cycles };
371 encoder->video->framerate = (AVRational) { encoder->cycles, encoder->frameCycles * encoder->frameskip };
372 encoder->videoStream->time_base = encoder->video->time_base;
373 encoder->videoStream->avg_frame_rate = encoder->video->framerate;
374 encoder->video->pix_fmt = encoder->pixFormat;
375 encoder->video->gop_size = 60;
376 encoder->video->max_b_frames = 3;
377 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
378#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
379 encoder->video->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
380#else
381 encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
382#endif
383 }
384
385 if (encoder->video->codec->id == AV_CODEC_ID_H264 &&
386 (strcasecmp(encoder->containerFormat, "mp4") ||
387 strcasecmp(encoder->containerFormat, "m4v") ||
388 strcasecmp(encoder->containerFormat, "mov"))) {
389 // QuickTime and a few other things require YUV420
390 encoder->video->pix_fmt = AV_PIX_FMT_YUV420P;
391 }
392#if LIBAVCODEC_VERSION_MAJOR >= 57
393 if (encoder->video->codec->id == AV_CODEC_ID_FFV1) {
394 av_opt_set(encoder->video->priv_data, "coder", "range_tab", 0);
395 }
396#endif
397
398 if (strcmp(vcodec->name, "libx264") == 0) {
399 // Try to adaptively figure out when you can use a slower encoder
400 if (encoder->width * encoder->height > 1000000) {
401 av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
402 } else if (encoder->width * encoder->height > 500000) {
403 av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
404 } else {
405 av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
406 }
407 if (encoder->videoBitrate == 0) {
408 av_opt_set(encoder->video->priv_data, "crf", "0", 0);
409 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
410 }
411 }
412 if (strcmp(vcodec->name, "libvpx-vp9") == 0 && encoder->videoBitrate == 0) {
413 av_opt_set(encoder->video->priv_data, "lossless", "1", 0);
414 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
415 }
416
417 if (encoder->pixFormat == AV_PIX_FMT_PAL8) {
418 encoder->graph = avfilter_graph_alloc();
419
420 const struct AVFilter* source = avfilter_get_by_name("buffer");
421 const struct AVFilter* sink = avfilter_get_by_name("buffersink");
422 const struct AVFilter* split = avfilter_get_by_name("split");
423 const struct AVFilter* palettegen = avfilter_get_by_name("palettegen");
424 const struct AVFilter* paletteuse = avfilter_get_by_name("paletteuse");
425
426 if (!source || !sink || !split || !palettegen || !paletteuse || !encoder->graph) {
427 FFmpegEncoderClose(encoder);
428 return false;
429 }
430
431 char args[256];
432 snprintf(args, sizeof(args), "video_size=%dx%d:pix_fmt=%d:time_base=%d/%d",
433 encoder->video->width, encoder->video->height, encoder->ipixFormat,
434 encoder->video->time_base.num, encoder->video->time_base.den);
435
436 int res = 0;
437 res |= avfilter_graph_create_filter(&encoder->source, source, NULL, args, NULL, encoder->graph);
438 res |= avfilter_graph_create_filter(&encoder->sink, sink, NULL, NULL, NULL, encoder->graph);
439 res |= avfilter_graph_create_filter(&encoder->filters[0], split, NULL, NULL, NULL, encoder->graph);
440 res |= avfilter_graph_create_filter(&encoder->filters[1], palettegen, NULL, "reserve_transparent=off", NULL, encoder->graph);
441 res |= avfilter_graph_create_filter(&encoder->filters[2], paletteuse, NULL, "dither=none", NULL, encoder->graph);
442 if (res < 0) {
443 FFmpegEncoderClose(encoder);
444 return false;
445 }
446
447 res = 0;
448 res |= avfilter_link(encoder->source, 0, encoder->filters[0], 0);
449 res |= avfilter_link(encoder->filters[0], 0, encoder->filters[1], 0);
450 res |= avfilter_link(encoder->filters[0], 1, encoder->filters[2], 0);
451 res |= avfilter_link(encoder->filters[1], 0, encoder->filters[2], 1);
452 res |= avfilter_link(encoder->filters[2], 0, encoder->sink, 0);
453 if (res < 0 || avfilter_graph_config(encoder->graph, NULL) < 0) {
454 FFmpegEncoderClose(encoder);
455 return false;
456 }
457
458#if LIBAVCODEC_VERSION_MAJOR >= 55
459 encoder->sinkFrame = av_frame_alloc();
460#else
461 encoder->sinkFrame = avcodec_alloc_frame();
462#endif
463 }
464 AVDictionary* opts = 0;
465 av_dict_set(&opts, "strict", "-2", 0);
466 int res = avcodec_open2(encoder->video, vcodec, &opts);
467 av_dict_free(&opts);
468 if (res < 0) {
469 FFmpegEncoderClose(encoder);
470 return false;
471 }
472#if LIBAVCODEC_VERSION_MAJOR >= 55
473 encoder->videoFrame = av_frame_alloc();
474#else
475 encoder->videoFrame = avcodec_alloc_frame();
476#endif
477 encoder->videoFrame->format = encoder->video->pix_fmt != AV_PIX_FMT_PAL8 ? encoder->video->pix_fmt : encoder->ipixFormat;
478 encoder->videoFrame->width = encoder->video->width;
479 encoder->videoFrame->height = encoder->video->height;
480 encoder->videoFrame->pts = 0;
481 _ffmpegSetVideoDimensions(&encoder->d, encoder->iwidth, encoder->iheight);
482 av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format, 32);
483#ifdef FFMPEG_USE_CODECPAR
484 avcodec_parameters_from_context(encoder->videoStream->codecpar, encoder->video);
485#endif
486 }
487
488 if (strcmp(encoder->containerFormat, "gif") == 0) {
489 av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "-1", 0);
490 } else if (strcmp(encoder->containerFormat, "apng") == 0) {
491 av_opt_set(encoder->context->priv_data, "plays", encoder->loop ? "0" : "1", 0);
492 }
493
494 AVDictionary* opts = 0;
495 av_dict_set(&opts, "strict", "-2", 0);
496 bool res = avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE) < 0 || avformat_write_header(encoder->context, &opts) < 0;
497 av_dict_free(&opts);
498 if (res) {
499 FFmpegEncoderClose(encoder);
500 return false;
501 }
502 return true;
503}
504
505void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
506 if (encoder->audio) {
507 while (true) {
508 if (!_ffmpegWriteAudioFrame(encoder, NULL)) {
509 break;
510 }
511 }
512 }
513 if (encoder->video) {
514 if (encoder->graph) {
515 if (av_buffersrc_add_frame(encoder->source, NULL) >= 0) {
516 while (true) {
517 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
518 if (res < 0) {
519 break;
520 }
521 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
522 av_frame_unref(encoder->sinkFrame);
523 }
524 }
525 }
526 while (true) {
527 if (!_ffmpegWriteVideoFrame(encoder, NULL)) {
528 break;
529 }
530 }
531 }
532
533 if (encoder->context && encoder->context->pb) {
534 av_write_trailer(encoder->context);
535 avio_close(encoder->context->pb);
536 }
537
538 if (encoder->postaudioBuffer) {
539 av_free(encoder->postaudioBuffer);
540 encoder->postaudioBuffer = NULL;
541 }
542 if (encoder->audioBuffer) {
543 av_free(encoder->audioBuffer);
544 encoder->audioBuffer = NULL;
545 }
546
547 if (encoder->audioFrame) {
548#if LIBAVCODEC_VERSION_MAJOR >= 55
549 av_frame_free(&encoder->audioFrame);
550#else
551 avcodec_free_frame(&encoder->audioFrame);
552#endif
553 }
554 if (encoder->audio) {
555#ifdef FFMPEG_USE_CODECPAR
556 avcodec_free_context(&encoder->audio);
557#else
558 avcodec_close(encoder->audio);
559 encoder->audio = NULL;
560#endif
561 }
562
563 if (encoder->resampleContext) {
564#ifdef USE_LIBAVRESAMPLE
565 avresample_close(encoder->resampleContext);
566 encoder->resampleContext = NULL;
567#else
568 swr_free(&encoder->resampleContext);
569#endif
570 }
571
572 if (encoder->absf) {
573#ifdef FFMPEG_USE_NEW_BSF
574 av_bsf_free(&encoder->absf);
575#else
576 av_bitstream_filter_close(encoder->absf);
577 encoder->absf = NULL;
578#endif
579 }
580
581 if (encoder->videoFrame) {
582 av_freep(encoder->videoFrame->data);
583#if LIBAVCODEC_VERSION_MAJOR >= 55
584 av_frame_free(&encoder->videoFrame);
585#else
586 avcodec_free_frame(&encoder->videoFrame);
587#endif
588 }
589
590 if (encoder->sinkFrame) {
591#if LIBAVCODEC_VERSION_MAJOR >= 55
592 av_frame_free(&encoder->sinkFrame);
593#else
594 avcodec_free_frame(&encoder->sinkFrame);
595#endif
596 encoder->sinkFrame = NULL;
597 }
598
599 if (encoder->video) {
600#ifdef FFMPEG_USE_CODECPAR
601 avcodec_free_context(&encoder->video);
602#else
603 avcodec_close(encoder->video);
604 encoder->video = NULL;
605#endif
606 }
607
608 if (encoder->scaleContext) {
609 sws_freeContext(encoder->scaleContext);
610 encoder->scaleContext = NULL;
611 }
612
613 if (encoder->graph) {
614 avfilter_graph_free(&encoder->graph);
615 encoder->graph = NULL;
616 encoder->source = NULL;
617 encoder->sink = NULL;
618
619 int i;
620 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
621 encoder->filters[i] = NULL;
622 }
623 }
624
625 if (encoder->context) {
626 avformat_free_context(encoder->context);
627 encoder->context = NULL;
628 }
629}
630
631bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
632 return !!encoder->context;
633}
634
635void _ffmpegPostAudioFrame(struct mAVStream* stream, int16_t left, int16_t right) {
636 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
637 if (!encoder->context || !encoder->audioCodec) {
638 return;
639 }
640
641 if (encoder->absf && !left) {
642 // XXX: AVBSF doesn't like silence. Figure out why.
643 left = 1;
644 }
645
646 encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
647 encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;
648
649 ++encoder->currentAudioSample;
650
651 if (encoder->currentAudioSample * 4 < encoder->audioBufferSize) {
652 return;
653 }
654
655 int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
656 encoder->currentAudioSample = 0;
657#ifdef USE_LIBAVRESAMPLE
658 avresample_convert(encoder->resampleContext, 0, 0, 0,
659 (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);
660
661 if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
662 return;
663 }
664#if LIBAVCODEC_VERSION_MAJOR >= 55
665 av_frame_make_writable(encoder->audioFrame);
666#endif
667 int samples = avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);
668#else
669#if LIBAVCODEC_VERSION_MAJOR >= 55
670 av_frame_make_writable(encoder->audioFrame);
671#endif
672 if (swr_get_out_samples(encoder->resampleContext, 1) < encoder->audioFrame->nb_samples) {
673 swr_convert(encoder->resampleContext, NULL, 0, (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
674 return;
675 }
676 int samples = swr_convert(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize,
677 (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
678#endif
679
680 encoder->audioFrame->pts = encoder->currentAudioFrame;
681 encoder->currentAudioFrame += samples;
682
683 _ffmpegWriteAudioFrame(encoder, encoder->audioFrame);
684}
685
686bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame) {
687 AVPacket packet;
688 av_init_packet(&packet);
689 packet.data = 0;
690 packet.size = 0;
691
692 int gotData;
693#ifdef FFMPEG_USE_PACKETS
694 avcodec_send_frame(encoder->audio, audioFrame);
695 gotData = avcodec_receive_packet(encoder->audio, &packet);
696 gotData = (gotData == 0) && packet.size;
697#else
698 avcodec_encode_audio2(encoder->audio, &packet, audioFrame, &gotData);
699#endif
700 packet.pts = av_rescale_q(packet.pts, encoder->audio->time_base, encoder->audioStream->time_base);
701 packet.dts = packet.pts;
702
703 if (gotData) {
704 if (encoder->absf) {
705 AVPacket tempPacket;
706
707#ifdef FFMPEG_USE_NEW_BSF
708 int success = av_bsf_send_packet(encoder->absf, &packet);
709 if (success >= 0) {
710 success = av_bsf_receive_packet(encoder->absf, &tempPacket);
711 }
712#else
713 int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
714 &tempPacket.data, &tempPacket.size,
715 packet.data, packet.size, 0);
716#endif
717
718 if (success >= 0) {
719#if LIBAVUTIL_VERSION_MAJOR >= 53
720 tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
721#endif
722
723#ifdef FFMPEG_USE_PACKET_UNREF
724 av_packet_move_ref(&packet, &tempPacket);
725#else
726 av_free_packet(&packet);
727 packet = tempPacket;
728#endif
729
730 packet.stream_index = encoder->audioStream->index;
731 av_interleaved_write_frame(encoder->context, &packet);
732 }
733 } else {
734 packet.stream_index = encoder->audioStream->index;
735 av_interleaved_write_frame(encoder->context, &packet);
736 }
737 }
738#ifdef FFMPEG_USE_PACKET_UNREF
739 av_packet_unref(&packet);
740#else
741 av_free_packet(&packet);
742#endif
743 return gotData;
744}
745
746void _ffmpegPostVideoFrame(struct mAVStream* stream, const color_t* pixels, size_t stride) {
747 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
748 if (!encoder->context || !encoder->videoCodec) {
749 return;
750 }
751 encoder->skipResidue = (encoder->skipResidue + 1) % encoder->frameskip;
752 if (encoder->skipResidue) {
753 return;
754 }
755 stride *= BYTES_PER_PIXEL;
756
757#if LIBAVCODEC_VERSION_MAJOR >= 55
758 av_frame_make_writable(encoder->videoFrame);
759#endif
760 encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
761 ++encoder->currentVideoFrame;
762
763 sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, encoder->iheight, encoder->videoFrame->data, encoder->videoFrame->linesize);
764
765 if (encoder->graph) {
766 if (av_buffersrc_add_frame(encoder->source, encoder->videoFrame) < 0) {
767 return;
768 }
769 while (true) {
770 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
771 if (res < 0) {
772 break;
773 }
774 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
775 av_frame_unref(encoder->sinkFrame);
776 }
777 } else {
778 _ffmpegWriteVideoFrame(encoder, encoder->videoFrame);
779 }
780}
781
782bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame) {
783 AVPacket packet;
784
785 av_init_packet(&packet);
786 packet.data = 0;
787 packet.size = 0;
788
789 int gotData;
790#ifdef FFMPEG_USE_PACKETS
791 avcodec_send_frame(encoder->video, videoFrame);
792 gotData = avcodec_receive_packet(encoder->video, &packet) == 0;
793#else
794 avcodec_encode_video2(encoder->video, &packet, videoFrame, &gotData);
795#endif
796 if (gotData) {
797#ifndef FFMPEG_USE_PACKET_UNREF
798 if (encoder->video->coded_frame->key_frame) {
799 packet.flags |= AV_PKT_FLAG_KEY;
800 }
801#endif
802 packet.stream_index = encoder->videoStream->index;
803 av_interleaved_write_frame(encoder->context, &packet);
804 }
805#ifdef FFMPEG_USE_PACKET_UNREF
806 av_packet_unref(&packet);
807#else
808 av_free_packet(&packet);
809#endif
810
811 return gotData;
812}
813
814static void _ffmpegSetVideoDimensions(struct mAVStream* stream, unsigned width, unsigned height) {
815 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
816 if (!encoder->context || !encoder->videoCodec) {
817 return;
818 }
819 encoder->iwidth = width;
820 encoder->iheight = height;
821 if (encoder->scaleContext) {
822 sws_freeContext(encoder->scaleContext);
823 }
824 encoder->scaleContext = sws_getContext(encoder->iwidth, encoder->iheight, encoder->ipixFormat,
825 encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format,
826 SWS_POINT, 0, 0, 0);
827}
828
// mAVStream callback: forwards a frame rate change to FFmpegEncoderSetInputFrameRate.
static void _ffmpegSetVideoFrameRate(struct mAVStream* stream, unsigned numerator, unsigned denominator) {
	FFmpegEncoderSetInputFrameRate((struct FFmpegEncoder*) stream, numerator, denominator);
}
833
834void FFmpegEncoderSetInputFrameRate(struct FFmpegEncoder* encoder, unsigned numerator, unsigned denominator) {
835 encoder->frameCycles = numerator;
836 encoder->cycles = denominator;
837 if (encoder->video) {
838 encoder->video->time_base = (AVRational) { numerator, denominator };
839 }
840}