src/feature/ffmpeg/ffmpeg-encoder.c (view raw)
/* Copyright (c) 2013-2015 Jeffrey Pfau
 *
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include "ffmpeg-encoder.h"
7
8#include <mgba/core/core.h>
9#include <mgba/gba/interface.h>
10
11#include <libavcodec/version.h>
12#include <libavcodec/avcodec.h>
13
14#include <libavfilter/buffersink.h>
15#include <libavfilter/buffersrc.h>
16
17#include <libavutil/version.h>
18#if LIBAVUTIL_VERSION_MAJOR >= 53
19#include <libavutil/buffer.h>
20#endif
21#include <libavutil/imgutils.h>
22#include <libavutil/mathematics.h>
23#include <libavutil/opt.h>
24
25#ifdef USE_LIBAVRESAMPLE
26#include <libavresample/avresample.h>
27#else
28#include <libswresample/swresample.h>
29#endif
30#include <libswscale/swscale.h>
31
32static void _ffmpegPostVideoFrame(struct mAVStream*, const color_t* pixels, size_t stride);
33static void _ffmpegPostAudioFrame(struct mAVStream*, int16_t left, int16_t right);
34static void _ffmpegSetVideoDimensions(struct mAVStream*, unsigned width, unsigned height);
35static void _ffmpegSetVideoFrameRate(struct mAVStream*, unsigned numerator, unsigned denominator);
36
37static bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame);
38static bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame);
39
40enum {
41 PREFERRED_SAMPLE_RATE = 0x8000
42};
43
44void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
45#if LIBAVFORMAT_VERSION_INT < AV_VERSION_INT(58, 9, 100)
46 av_register_all();
47#endif
48
49 encoder->d.videoDimensionsChanged = _ffmpegSetVideoDimensions;
50 encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
51 encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
52 encoder->d.postAudioBuffer = 0;
53 encoder->d.videoFrameRateChanged = _ffmpegSetVideoFrameRate;
54
55 encoder->audioCodec = NULL;
56 encoder->videoCodec = NULL;
57 encoder->containerFormat = NULL;
58 FFmpegEncoderSetAudio(encoder, "flac", 0);
59 FFmpegEncoderSetVideo(encoder, "libx264", 0, 0);
60 FFmpegEncoderSetContainer(encoder, "matroska");
61 FFmpegEncoderSetDimensions(encoder, GBA_VIDEO_HORIZONTAL_PIXELS, GBA_VIDEO_VERTICAL_PIXELS);
62 encoder->iwidth = GBA_VIDEO_HORIZONTAL_PIXELS;
63 encoder->iheight = GBA_VIDEO_VERTICAL_PIXELS;
64 encoder->frameCycles = VIDEO_TOTAL_LENGTH;
65 encoder->cycles = GBA_ARM7TDMI_FREQUENCY;
66 encoder->frameskip = 1;
67 encoder->skipResidue = 0;
68 encoder->ipixFormat =
69#ifdef COLOR_16_BIT
70#ifdef COLOR_5_6_5
71 AV_PIX_FMT_RGB565;
72#else
73 AV_PIX_FMT_BGR555;
74#endif
75#else
76#ifndef USE_LIBAV
77 AV_PIX_FMT_0BGR32;
78#else
79 AV_PIX_FMT_BGR32;
80#endif
81#endif
82 encoder->resampleContext = NULL;
83 encoder->absf = NULL;
84 encoder->context = NULL;
85 encoder->scaleContext = NULL;
86 encoder->audio = NULL;
87 encoder->audioStream = NULL;
88 encoder->audioFrame = NULL;
89 encoder->audioBuffer = NULL;
90 encoder->postaudioBuffer = NULL;
91 encoder->video = NULL;
92 encoder->videoStream = NULL;
93 encoder->videoFrame = NULL;
94 encoder->graph = NULL;
95 encoder->source = NULL;
96 encoder->sink = NULL;
97 encoder->sinkFrame = NULL;
98
99 int i;
100 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
101 encoder->filters[i] = NULL;
102 }
103}
104
105bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
106 static const struct {
107 int format;
108 int priority;
109 } priorities[] = {
110 { AV_SAMPLE_FMT_S16, 0 },
111 { AV_SAMPLE_FMT_S16P, 1 },
112 { AV_SAMPLE_FMT_S32, 2 },
113 { AV_SAMPLE_FMT_S32P, 2 },
114 { AV_SAMPLE_FMT_FLT, 3 },
115 { AV_SAMPLE_FMT_FLTP, 3 },
116 { AV_SAMPLE_FMT_DBL, 4 },
117 { AV_SAMPLE_FMT_DBLP, 4 }
118 };
119
120 if (!acodec) {
121 encoder->audioCodec = 0;
122 return true;
123 }
124
125 AVCodec* codec = avcodec_find_encoder_by_name(acodec);
126 if (!codec) {
127 return false;
128 }
129
130 if (!codec->sample_fmts) {
131 return false;
132 }
133 size_t i;
134 size_t j;
135 int priority = INT_MAX;
136 encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
137 for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
138 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
139 if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
140 priority = priorities[j].priority;
141 encoder->sampleFormat = codec->sample_fmts[i];
142 }
143 }
144 }
145 if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
146 return false;
147 }
148 encoder->sampleRate = PREFERRED_SAMPLE_RATE;
149 if (codec->supported_samplerates) {
150 for (i = 0; codec->supported_samplerates[i]; ++i) {
151 if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
152 continue;
153 }
154 if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
155 encoder->sampleRate = codec->supported_samplerates[i];
156 }
157 }
158 } else if (codec->id == AV_CODEC_ID_AAC) {
159 // HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
160 encoder->sampleRate = 44100;
161 }
162 encoder->audioCodec = acodec;
163 encoder->audioBitrate = abr;
164 return true;
165}
166
167bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, unsigned vbr, int frameskip) {
168 static const struct {
169 enum AVPixelFormat format;
170 int priority;
171 } priorities[] = {
172 { AV_PIX_FMT_RGB555, 0 },
173 { AV_PIX_FMT_BGR555, 0 },
174 { AV_PIX_FMT_RGB565, 1 },
175 { AV_PIX_FMT_BGR565, 1 },
176 { AV_PIX_FMT_RGB24, 2 },
177 { AV_PIX_FMT_BGR24, 2 },
178#ifndef USE_LIBAV
179 { AV_PIX_FMT_BGR0, 3 },
180 { AV_PIX_FMT_RGB0, 3 },
181 { AV_PIX_FMT_0BGR, 3 },
182 { AV_PIX_FMT_0RGB, 3 },
183#endif
184 { AV_PIX_FMT_YUV422P, 4 },
185 { AV_PIX_FMT_YUV444P, 5 },
186 { AV_PIX_FMT_YUV420P, 6 },
187 { AV_PIX_FMT_PAL8, 7 },
188 };
189
190 if (!vcodec) {
191 encoder->videoCodec = 0;
192 return true;
193 }
194
195 AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
196 if (!codec) {
197 return false;
198 }
199
200 size_t i;
201 size_t j;
202 int priority = INT_MAX;
203 encoder->pixFormat = AV_PIX_FMT_NONE;
204 for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
205 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
206 if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
207 priority = priorities[j].priority;
208 encoder->pixFormat = codec->pix_fmts[i];
209 }
210 }
211 }
212 if (encoder->pixFormat == AV_PIX_FMT_NONE) {
213 return false;
214 }
215 encoder->videoCodec = vcodec;
216 encoder->videoBitrate = vbr;
217 encoder->frameskip = frameskip + 1;
218 return true;
219}
220
221bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
222 AVOutputFormat* oformat = av_guess_format(container, 0, 0);
223 if (!oformat) {
224 return false;
225 }
226 encoder->containerFormat = container;
227 return true;
228}
229
230void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
231 encoder->width = width > 0 ? width : GBA_VIDEO_HORIZONTAL_PIXELS;
232 encoder->height = height > 0 ? height : GBA_VIDEO_VERTICAL_PIXELS;
233}
234
235bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
236 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
237 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
238 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
239 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !oformat) {
240 return false;
241 }
242 if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
243 return false;
244 }
245 if (encoder->videoCodec && !avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
246 return false;
247 }
248 return true;
249}
250
251bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
252 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
253 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
254 if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !FFmpegEncoderVerifyContainer(encoder)) {
255 return false;
256 }
257
258 if (encoder->context) {
259 return false;
260 }
261
262 encoder->currentAudioSample = 0;
263 encoder->currentAudioFrame = 0;
264 encoder->currentVideoFrame = 0;
265 encoder->skipResidue = 0;
266
267 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
268#ifndef USE_LIBAV
269 avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
270#else
271 encoder->context = avformat_alloc_context();
272 strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename) - 1);
273 encoder->context->filename[sizeof(encoder->context->filename) - 1] = '\0';
274 encoder->context->oformat = oformat;
275#endif
276
277 if (acodec) {
278#ifdef FFMPEG_USE_CODECPAR
279 encoder->audioStream = avformat_new_stream(encoder->context, NULL);
280 encoder->audio = avcodec_alloc_context3(acodec);
281#else
282 encoder->audioStream = avformat_new_stream(encoder->context, acodec);
283 encoder->audio = encoder->audioStream->codec;
284#endif
285 encoder->audio->bit_rate = encoder->audioBitrate;
286 encoder->audio->channels = 2;
287 encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
288 encoder->audio->sample_rate = encoder->sampleRate;
289 encoder->audio->sample_fmt = encoder->sampleFormat;
290 AVDictionary* opts = 0;
291 av_dict_set(&opts, "strict", "-2", 0);
292 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
293#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
294 encoder->audio->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
295#else
296 encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
297#endif
298 }
299 int res = avcodec_open2(encoder->audio, acodec, &opts);
300 av_dict_free(&opts);
301 if (res < 0) {
302 FFmpegEncoderClose(encoder);
303 return false;
304 }
305#if LIBAVCODEC_VERSION_MAJOR >= 55
306 encoder->audioFrame = av_frame_alloc();
307#else
308 encoder->audioFrame = avcodec_alloc_frame();
309#endif
310 if (!encoder->audio->frame_size) {
311 encoder->audio->frame_size = 1;
312 }
313 encoder->audioFrame->nb_samples = encoder->audio->frame_size;
314 encoder->audioFrame->format = encoder->audio->sample_fmt;
315 encoder->audioFrame->pts = 0;
316#ifdef USE_LIBAVRESAMPLE
317 encoder->resampleContext = avresample_alloc_context();
318 av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
319 av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
320 av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
321 av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
322 av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
323 av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
324 avresample_open(encoder->resampleContext);
325#else
326 encoder->resampleContext = swr_alloc_set_opts(NULL, AV_CH_LAYOUT_STEREO, encoder->sampleFormat, encoder->sampleRate,
327 AV_CH_LAYOUT_STEREO, AV_SAMPLE_FMT_S16, PREFERRED_SAMPLE_RATE, 0, NULL);
328 swr_init(encoder->resampleContext);
329#endif
330 encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
331 encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
332 encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
333 encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
334 avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
335
336 if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
337 (strcasecmp(encoder->containerFormat, "mp4") ||
338 strcasecmp(encoder->containerFormat, "m4v") ||
339 strcasecmp(encoder->containerFormat, "mov"))) {
340 // MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
341#ifdef FFMPEG_USE_NEW_BSF
342 av_bsf_alloc(av_bsf_get_by_name("aac_adtstoasc"), &encoder->absf);
343 avcodec_parameters_from_context(encoder->absf->par_in, encoder->audio);
344 av_bsf_init(encoder->absf);
345#else
346 encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
347#endif
348 }
349#ifdef FFMPEG_USE_CODECPAR
350 avcodec_parameters_from_context(encoder->audioStream->codecpar, encoder->audio);
351#endif
352 }
353
354 if (vcodec) {
355#ifdef FFMPEG_USE_CODECPAR
356 encoder->videoStream = avformat_new_stream(encoder->context, NULL);
357 encoder->video = avcodec_alloc_context3(vcodec);
358#else
359 encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
360 encoder->video = encoder->videoStream->codec;
361#endif
362 encoder->video->bit_rate = encoder->videoBitrate;
363 encoder->video->width = encoder->width;
364 encoder->video->height = encoder->height;
365 encoder->video->time_base = (AVRational) { encoder->frameCycles * encoder->frameskip, encoder->cycles };
366 encoder->video->framerate = (AVRational) { encoder->cycles, encoder->frameCycles * encoder->frameskip };
367 encoder->video->pix_fmt = encoder->pixFormat;
368 encoder->video->gop_size = 60;
369 encoder->video->max_b_frames = 3;
370 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
371#ifdef AV_CODEC_FLAG_GLOBAL_HEADER
372 encoder->video->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
373#else
374 encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
375#endif
376 }
377
378 if (encoder->video->codec->id == AV_CODEC_ID_H264 &&
379 (strcasecmp(encoder->containerFormat, "mp4") ||
380 strcasecmp(encoder->containerFormat, "m4v") ||
381 strcasecmp(encoder->containerFormat, "mov"))) {
382 // QuickTime and a few other things require YUV420
383 encoder->video->pix_fmt = AV_PIX_FMT_YUV420P;
384 }
385
386 if (strcmp(vcodec->name, "libx264") == 0) {
387 // Try to adaptively figure out when you can use a slower encoder
388 if (encoder->width * encoder->height > 1000000) {
389 av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
390 } else if (encoder->width * encoder->height > 500000) {
391 av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
392 } else {
393 av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
394 }
395 if (encoder->videoBitrate == 0) {
396 av_opt_set(encoder->video->priv_data, "crf", "0", 0);
397 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
398 }
399 }
400 if (strcmp(vcodec->name, "libvpx-vp9") == 0 && encoder->videoBitrate == 0) {
401 av_opt_set(encoder->video->priv_data, "lossless", "1", 0);
402 encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
403 }
404
405 if (encoder->pixFormat == AV_PIX_FMT_PAL8) {
406 encoder->graph = avfilter_graph_alloc();
407
408 const struct AVFilter* source = avfilter_get_by_name("buffer");
409 const struct AVFilter* sink = avfilter_get_by_name("buffersink");
410 const struct AVFilter* split = avfilter_get_by_name("split");
411 const struct AVFilter* palettegen = avfilter_get_by_name("palettegen");
412 const struct AVFilter* paletteuse = avfilter_get_by_name("paletteuse");
413
414 if (!source || !sink || !split || !palettegen || !paletteuse || !encoder->graph) {
415 FFmpegEncoderClose(encoder);
416 return false;
417 }
418
419 char args[256];
420 snprintf(args, sizeof(args), "video_size=%dx%d:pix_fmt=%d:time_base=%d/%d",
421 encoder->video->width, encoder->video->height, encoder->ipixFormat,
422 encoder->video->time_base.num, encoder->video->time_base.den);
423
424 int res = 0;
425 res |= avfilter_graph_create_filter(&encoder->source, source, NULL, args, NULL, encoder->graph);
426 res |= avfilter_graph_create_filter(&encoder->sink, sink, NULL, NULL, NULL, encoder->graph);
427 res |= avfilter_graph_create_filter(&encoder->filters[0], split, NULL, NULL, NULL, encoder->graph);
428 res |= avfilter_graph_create_filter(&encoder->filters[1], palettegen, NULL, "reserve_transparent=off", NULL, encoder->graph);
429 res |= avfilter_graph_create_filter(&encoder->filters[2], paletteuse, NULL, "dither=none", NULL, encoder->graph);
430 if (res < 0) {
431 FFmpegEncoderClose(encoder);
432 return false;
433 }
434
435 res = 0;
436 res |= avfilter_link(encoder->source, 0, encoder->filters[0], 0);
437 res |= avfilter_link(encoder->filters[0], 0, encoder->filters[1], 0);
438 res |= avfilter_link(encoder->filters[0], 1, encoder->filters[2], 0);
439 res |= avfilter_link(encoder->filters[1], 0, encoder->filters[2], 1);
440 res |= avfilter_link(encoder->filters[2], 0, encoder->sink, 0);
441 if (res < 0 || avfilter_graph_config(encoder->graph, NULL) < 0) {
442 FFmpegEncoderClose(encoder);
443 return false;
444 }
445
446#if LIBAVCODEC_VERSION_MAJOR >= 55
447 encoder->sinkFrame = av_frame_alloc();
448#else
449 encoder->sinkFrame = avcodec_alloc_frame();
450#endif
451 }
452
453 if (avcodec_open2(encoder->video, vcodec, 0) < 0) {
454 FFmpegEncoderClose(encoder);
455 return false;
456 }
457#if LIBAVCODEC_VERSION_MAJOR >= 55
458 encoder->videoFrame = av_frame_alloc();
459#else
460 encoder->videoFrame = avcodec_alloc_frame();
461#endif
462 encoder->videoFrame->format = encoder->video->pix_fmt != AV_PIX_FMT_PAL8 ? encoder->video->pix_fmt : encoder->ipixFormat;
463 encoder->videoFrame->width = encoder->video->width;
464 encoder->videoFrame->height = encoder->video->height;
465 encoder->videoFrame->pts = 0;
466 _ffmpegSetVideoDimensions(&encoder->d, encoder->iwidth, encoder->iheight);
467 av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format, 32);
468#ifdef FFMPEG_USE_CODECPAR
469 avcodec_parameters_from_context(encoder->videoStream->codecpar, encoder->video);
470#endif
471 }
472
473 if (avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE) < 0 || avformat_write_header(encoder->context, 0) < 0) {
474 FFmpegEncoderClose(encoder);
475 return false;
476 }
477 return true;
478}
479
480void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
481 if (encoder->audio) {
482 while (true) {
483 if (!_ffmpegWriteAudioFrame(encoder, NULL)) {
484 break;
485 }
486 }
487 }
488 if (encoder->video) {
489 if (encoder->graph) {
490 if (av_buffersrc_add_frame(encoder->source, NULL) >= 0) {
491 while (true) {
492 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
493 if (res < 0) {
494 break;
495 }
496 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
497 av_frame_unref(encoder->sinkFrame);
498 }
499 }
500 }
501 while (true) {
502 if (!_ffmpegWriteVideoFrame(encoder, NULL)) {
503 break;
504 }
505 }
506 }
507
508 if (encoder->context && encoder->context->pb) {
509 av_write_trailer(encoder->context);
510 avio_close(encoder->context->pb);
511 }
512
513 if (encoder->postaudioBuffer) {
514 av_free(encoder->postaudioBuffer);
515 encoder->postaudioBuffer = NULL;
516 }
517 if (encoder->audioBuffer) {
518 av_free(encoder->audioBuffer);
519 encoder->audioBuffer = NULL;
520 }
521
522 if (encoder->audioFrame) {
523#if LIBAVCODEC_VERSION_MAJOR >= 55
524 av_frame_free(&encoder->audioFrame);
525#else
526 avcodec_free_frame(&encoder->audioFrame);
527#endif
528 }
529 if (encoder->audio) {
530 avcodec_close(encoder->audio);
531 encoder->audio = NULL;
532 }
533
534 if (encoder->resampleContext) {
535#ifdef USE_LIBAVRESAMPLE
536 avresample_close(encoder->resampleContext);
537 encoder->resampleContext = NULL;
538#else
539 swr_free(&encoder->resampleContext);
540#endif
541 }
542
543 if (encoder->absf) {
544#ifdef FFMPEG_USE_NEW_BSF
545 av_bsf_free(&encoder->absf);
546#else
547 av_bitstream_filter_close(encoder->absf);
548 encoder->absf = NULL;
549#endif
550 }
551
552 if (encoder->videoFrame) {
553#if LIBAVCODEC_VERSION_MAJOR >= 55
554 av_frame_free(&encoder->videoFrame);
555#else
556 avcodec_free_frame(&encoder->videoFrame);
557#endif
558 }
559
560 if (encoder->sinkFrame) {
561#if LIBAVCODEC_VERSION_MAJOR >= 55
562 av_frame_free(&encoder->sinkFrame);
563#else
564 avcodec_free_frame(&encoder->sinkFrame);
565#endif
566 encoder->sinkFrame = NULL;
567 }
568
569 if (encoder->video) {
570 avcodec_close(encoder->video);
571 encoder->video = NULL;
572 }
573
574 if (encoder->scaleContext) {
575 sws_freeContext(encoder->scaleContext);
576 encoder->scaleContext = NULL;
577 }
578
579 if (encoder->graph) {
580 avfilter_graph_free(&encoder->graph);
581 encoder->graph = NULL;
582 encoder->source = NULL;
583 encoder->sink = NULL;
584
585 int i;
586 for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
587 encoder->filters[i] = NULL;
588 }
589 }
590
591 if (encoder->context) {
592 avformat_free_context(encoder->context);
593 encoder->context = NULL;
594 }
595}
596
597bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
598 return !!encoder->context;
599}
600
601void _ffmpegPostAudioFrame(struct mAVStream* stream, int16_t left, int16_t right) {
602 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
603 if (!encoder->context || !encoder->audioCodec) {
604 return;
605 }
606
607 if (encoder->absf && !left) {
608 // XXX: AVBSF doesn't like silence. Figure out why.
609 left = 1;
610 }
611
612 encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
613 encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;
614
615 ++encoder->currentAudioSample;
616
617 if (encoder->currentAudioSample * 4 < encoder->audioBufferSize) {
618 return;
619 }
620
621 int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
622 encoder->currentAudioSample = 0;
623#ifdef USE_LIBAVRESAMPLE
624 avresample_convert(encoder->resampleContext, 0, 0, 0,
625 (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);
626
627 if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
628 return;
629 }
630#if LIBAVCODEC_VERSION_MAJOR >= 55
631 av_frame_make_writable(encoder->audioFrame);
632#endif
633 int samples = avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);
634#else
635#if LIBAVCODEC_VERSION_MAJOR >= 55
636 av_frame_make_writable(encoder->audioFrame);
637#endif
638 if (swr_get_out_samples(encoder->resampleContext, 1) < encoder->audioFrame->nb_samples) {
639 swr_convert(encoder->resampleContext, NULL, 0, (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
640 return;
641 }
642 int samples = swr_convert(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize,
643 (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
644#endif
645
646 encoder->audioFrame->pts = encoder->currentAudioFrame;
647 encoder->currentAudioFrame += samples;
648
649 _ffmpegWriteAudioFrame(encoder, encoder->audioFrame);
650}
651
652bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame) {
653 AVPacket packet;
654 av_init_packet(&packet);
655 packet.data = 0;
656 packet.size = 0;
657
658 int gotData;
659#ifdef FFMPEG_USE_PACKETS
660 avcodec_send_frame(encoder->audio, audioFrame);
661 gotData = avcodec_receive_packet(encoder->audio, &packet);
662 gotData = (gotData == 0) && packet.size;
663#else
664 avcodec_encode_audio2(encoder->audio, &packet, audioFrame, &gotData);
665#endif
666 packet.pts = av_rescale_q(packet.pts, encoder->audio->time_base, encoder->audioStream->time_base);
667 packet.dts = packet.pts;
668
669 if (gotData) {
670 if (encoder->absf) {
671 AVPacket tempPacket;
672
673#ifdef FFMPEG_USE_NEW_BSF
674 int success = av_bsf_send_packet(encoder->absf, &packet);
675 if (success >= 0) {
676 success = av_bsf_receive_packet(encoder->absf, &tempPacket);
677 }
678#else
679 int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
680 &tempPacket.data, &tempPacket.size,
681 packet.data, packet.size, 0);
682#endif
683
684 if (success >= 0) {
685#if LIBAVUTIL_VERSION_MAJOR >= 53
686 tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
687#endif
688
689#ifdef FFMPEG_USE_PACKET_UNREF
690 av_packet_move_ref(&packet, &tempPacket);
691#else
692 av_free_packet(&packet);
693 packet = tempPacket;
694#endif
695
696 packet.stream_index = encoder->audioStream->index;
697 av_interleaved_write_frame(encoder->context, &packet);
698 }
699 } else {
700 packet.stream_index = encoder->audioStream->index;
701 av_interleaved_write_frame(encoder->context, &packet);
702 }
703 }
704#ifdef FFMPEG_USE_PACKET_UNREF
705 av_packet_unref(&packet);
706#else
707 av_free_packet(&packet);
708#endif
709 return gotData;
710}
711
712void _ffmpegPostVideoFrame(struct mAVStream* stream, const color_t* pixels, size_t stride) {
713 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
714 if (!encoder->context || !encoder->videoCodec) {
715 return;
716 }
717 encoder->skipResidue = (encoder->skipResidue + 1) % encoder->frameskip;
718 if (encoder->skipResidue) {
719 return;
720 }
721 stride *= BYTES_PER_PIXEL;
722
723#if LIBAVCODEC_VERSION_MAJOR >= 55
724 av_frame_make_writable(encoder->videoFrame);
725#endif
726 encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
727 ++encoder->currentVideoFrame;
728
729 sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, encoder->iheight, encoder->videoFrame->data, encoder->videoFrame->linesize);
730
731 if (encoder->graph) {
732 if (av_buffersrc_add_frame(encoder->source, encoder->videoFrame) < 0) {
733 return;
734 }
735 while (true) {
736 int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
737 if (res < 0) {
738 break;
739 }
740 _ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
741 av_frame_unref(encoder->sinkFrame);
742 }
743 } else {
744 _ffmpegWriteVideoFrame(encoder, encoder->videoFrame);
745 }
746}
747
748bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame) {
749 AVPacket packet;
750
751 av_init_packet(&packet);
752 packet.data = 0;
753 packet.size = 0;
754
755 int gotData;
756#ifdef FFMPEG_USE_PACKETS
757 avcodec_send_frame(encoder->video, videoFrame);
758 gotData = avcodec_receive_packet(encoder->video, &packet) == 0;
759#else
760 avcodec_encode_video2(encoder->video, &packet, videoFrame, &gotData);
761#endif
762 if (gotData) {
763#ifndef FFMPEG_USE_PACKET_UNREF
764 if (encoder->video->coded_frame->key_frame) {
765 packet.flags |= AV_PKT_FLAG_KEY;
766 }
767#endif
768 packet.stream_index = encoder->videoStream->index;
769 av_interleaved_write_frame(encoder->context, &packet);
770 }
771#ifdef FFMPEG_USE_PACKET_UNREF
772 av_packet_unref(&packet);
773#else
774 av_free_packet(&packet);
775#endif
776
777 return gotData;
778}
779
780static void _ffmpegSetVideoDimensions(struct mAVStream* stream, unsigned width, unsigned height) {
781 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
782 if (!encoder->context || !encoder->videoCodec) {
783 return;
784 }
785 encoder->iwidth = width;
786 encoder->iheight = height;
787 if (encoder->scaleContext) {
788 sws_freeContext(encoder->scaleContext);
789 }
790 encoder->scaleContext = sws_getContext(encoder->iwidth, encoder->iheight, encoder->ipixFormat,
791 encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format,
792 SWS_POINT, 0, 0, 0);
793}
794
/* mAVStream callback: forwards a frame rate change to FFmpegEncoderSetInputFrameRate(). */
static void _ffmpegSetVideoFrameRate(struct mAVStream* stream, unsigned numerator, unsigned denominator) {
	FFmpegEncoderSetInputFrameRate((struct FFmpegEncoder*) stream, numerator, denominator);
}
799
800void FFmpegEncoderSetInputFrameRate(struct FFmpegEncoder* encoder, unsigned numerator, unsigned denominator) {
801 encoder->frameCycles = numerator;
802 encoder->cycles = denominator;
803 if (encoder->video) {
804 encoder->video->time_base = (AVRational) { numerator, denominator };
805 }
806}