src/feature/ffmpeg/ffmpeg-encoder.c (view raw)
1/* Copyright (c) 2013-2015 Jeffrey Pfau
2 *
3 * This Source Code Form is subject to the terms of the Mozilla Public
4 * License, v. 2.0. If a copy of the MPL was not distributed with this
5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include "ffmpeg-encoder.h"
7
8#include <mgba/core/core.h>
9#include <mgba/internal/gba/video.h>
10
11#include <libavcodec/version.h>
12#include <libavcodec/avcodec.h>
13
14#include <libavutil/version.h>
15#if LIBAVUTIL_VERSION_MAJOR >= 53
16#include <libavutil/buffer.h>
17#endif
18#include <libavutil/imgutils.h>
19#include <libavutil/mathematics.h>
20#include <libavutil/opt.h>
21
22#include <libavresample/avresample.h>
23#include <libswscale/swscale.h>
24
// mAVStream callbacks; FFmpegEncoderInit installs them on the encoder's stream
// interface and they are defined later in this file.
static void _ffmpegPostVideoFrame(struct mAVStream*, const color_t* pixels, size_t stride);
static void _ffmpegPostAudioFrame(struct mAVStream*, int16_t left, int16_t right);
static void _ffmpegSetVideoDimensions(struct mAVStream*, unsigned width, unsigned height);
28
enum {
	// 32768 Hz: the input rate given to the resampler and the default output
	// rate when the codec does not force a different one
	PREFERRED_SAMPLE_RATE = 0x8000
};
32
33void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
34 av_register_all();
35
36 encoder->d.videoDimensionsChanged = _ffmpegSetVideoDimensions;
37 encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
38 encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
39 encoder->d.postAudioBuffer = 0;
40
41 encoder->audioCodec = 0;
42 encoder->videoCodec = 0;
43 encoder->containerFormat = 0;
44 FFmpegEncoderSetAudio(encoder, "flac", 0);
45 FFmpegEncoderSetVideo(encoder, "png", 0);
46 FFmpegEncoderSetContainer(encoder, "matroska");
47 FFmpegEncoderSetDimensions(encoder, VIDEO_HORIZONTAL_PIXELS, VIDEO_VERTICAL_PIXELS);
48 encoder->iwidth = VIDEO_HORIZONTAL_PIXELS;
49 encoder->iheight = VIDEO_VERTICAL_PIXELS;
50 encoder->resampleContext = 0;
51 encoder->absf = 0;
52 encoder->context = 0;
53 encoder->scaleContext = NULL;
54}
55
56bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
57 static const struct {
58 int format;
59 int priority;
60 } priorities[] = {
61 { AV_SAMPLE_FMT_S16, 0 },
62 { AV_SAMPLE_FMT_S16P, 1 },
63 { AV_SAMPLE_FMT_S32, 2 },
64 { AV_SAMPLE_FMT_S32P, 2 },
65 { AV_SAMPLE_FMT_FLT, 3 },
66 { AV_SAMPLE_FMT_FLTP, 3 },
67 { AV_SAMPLE_FMT_DBL, 4 },
68 { AV_SAMPLE_FMT_DBLP, 4 }
69 };
70
71 if (!acodec) {
72 encoder->audioCodec = 0;
73 return true;
74 }
75
76 AVCodec* codec = avcodec_find_encoder_by_name(acodec);
77 if (!codec) {
78 return false;
79 }
80
81 if (!codec->sample_fmts) {
82 return false;
83 }
84 size_t i;
85 size_t j;
86 int priority = INT_MAX;
87 encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
88 for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
89 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
90 if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
91 priority = priorities[j].priority;
92 encoder->sampleFormat = codec->sample_fmts[i];
93 }
94 }
95 }
96 if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
97 return false;
98 }
99 encoder->sampleRate = PREFERRED_SAMPLE_RATE;
100 if (codec->supported_samplerates) {
101 for (i = 0; codec->supported_samplerates[i]; ++i) {
102 if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
103 continue;
104 }
105 if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
106 encoder->sampleRate = codec->supported_samplerates[i];
107 }
108 }
109 } else if (codec->id == AV_CODEC_ID_AAC) {
110 // HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
111 encoder->sampleRate = 44100;
112 }
113 encoder->audioCodec = acodec;
114 encoder->audioBitrate = abr;
115 return true;
116}
117
118bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, unsigned vbr) {
119 static const struct {
120 enum AVPixelFormat format;
121 int priority;
122 } priorities[] = {
123 { AV_PIX_FMT_RGB555, 0 },
124 { AV_PIX_FMT_BGR555, 0 },
125 { AV_PIX_FMT_RGB565, 1 },
126 { AV_PIX_FMT_BGR565, 1 },
127 { AV_PIX_FMT_RGB24, 2 },
128 { AV_PIX_FMT_BGR24, 2 },
129#ifndef USE_LIBAV
130 { AV_PIX_FMT_BGR0, 3 },
131 { AV_PIX_FMT_RGB0, 3 },
132 { AV_PIX_FMT_0BGR, 3 },
133 { AV_PIX_FMT_0RGB, 3 },
134#endif
135 { AV_PIX_FMT_YUV422P, 4 },
136 { AV_PIX_FMT_YUV444P, 5 },
137 { AV_PIX_FMT_YUV420P, 6 }
138 };
139 AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
140 if (!codec) {
141 return false;
142 }
143
144 size_t i;
145 size_t j;
146 int priority = INT_MAX;
147 encoder->pixFormat = AV_PIX_FMT_NONE;
148 for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
149 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
150 if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
151 priority = priorities[j].priority;
152 encoder->pixFormat = codec->pix_fmts[i];
153 }
154 }
155 }
156 if (encoder->pixFormat == AV_PIX_FMT_NONE) {
157 return false;
158 }
159 encoder->videoCodec = vcodec;
160 encoder->videoBitrate = vbr;
161 return true;
162}
163
164bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
165 AVOutputFormat* oformat = av_guess_format(container, 0, 0);
166 if (!oformat) {
167 return false;
168 }
169 encoder->containerFormat = container;
170 return true;
171}
172
173void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
174 encoder->width = width > 0 ? width : VIDEO_HORIZONTAL_PIXELS;
175 encoder->height = height > 0 ? height : VIDEO_VERTICAL_PIXELS;
176}
177
178bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
179 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
180 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
181 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
182 if ((encoder->audioCodec && !acodec) || !vcodec || !oformat) {
183 return false;
184 }
185 if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
186 return false;
187 }
188 if (!avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
189 return false;
190 }
191 return true;
192}
193
194bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
195 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
196 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
197 if ((encoder->audioCodec && !acodec) || !vcodec || !FFmpegEncoderVerifyContainer(encoder)) {
198 return false;
199 }
200
201 encoder->currentAudioSample = 0;
202 encoder->currentAudioFrame = 0;
203 encoder->currentVideoFrame = 0;
204 encoder->nextAudioPts = 0;
205
206 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
207#ifndef USE_LIBAV
208 avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
209#else
210 encoder->context = avformat_alloc_context();
211 strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename) - 1);
212 encoder->context->filename[sizeof(encoder->context->filename) - 1] = '\0';
213 encoder->context->oformat = oformat;
214#endif
215
216 if (acodec) {
217#ifdef FFMPEG_USE_CODECPAR
218 encoder->audioStream = avformat_new_stream(encoder->context, NULL);
219 encoder->audio = avcodec_alloc_context3(acodec);
220#else
221 encoder->audioStream = avformat_new_stream(encoder->context, acodec);
222 encoder->audio = encoder->audioStream->codec;
223#endif
224 encoder->audio->bit_rate = encoder->audioBitrate;
225 encoder->audio->channels = 2;
226 encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
227 encoder->audio->sample_rate = encoder->sampleRate;
228 encoder->audio->sample_fmt = encoder->sampleFormat;
229 AVDictionary* opts = 0;
230 av_dict_set(&opts, "strict", "-2", 0);
231 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
232 encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
233 }
234 avcodec_open2(encoder->audio, acodec, &opts);
235 av_dict_free(&opts);
236#if LIBAVCODEC_VERSION_MAJOR >= 55
237 encoder->audioFrame = av_frame_alloc();
238#else
239 encoder->audioFrame = avcodec_alloc_frame();
240#endif
241 if (!encoder->audio->frame_size) {
242 encoder->audio->frame_size = 1;
243 }
244 encoder->audioFrame->nb_samples = encoder->audio->frame_size;
245 encoder->audioFrame->format = encoder->audio->sample_fmt;
246 encoder->audioFrame->pts = 0;
247 encoder->resampleContext = avresample_alloc_context();
248 av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
249 av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
250 av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
251 av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
252 av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
253 av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
254 avresample_open(encoder->resampleContext);
255 encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
256 encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
257 encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
258 encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
259 avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
260
261 if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
262 (strcasecmp(encoder->containerFormat, "mp4") ||
263 strcasecmp(encoder->containerFormat, "m4v") ||
264 strcasecmp(encoder->containerFormat, "mov"))) {
265 // MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
266#ifdef FFMPEG_USE_NEW_BSF
267 av_bsf_alloc(av_bsf_get_by_name("aac_adtstoasc"), &encoder->absf);
268 avcodec_parameters_from_context(encoder->absf->par_in, encoder->audio);
269 av_bsf_init(encoder->absf);
270#else
271 encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
272#endif
273 }
274#ifdef FFMPEG_USE_CODECPAR
275 avcodec_parameters_from_context(encoder->audioStream->codecpar, encoder->audio);
276#endif
277 }
278
279#ifdef FFMPEG_USE_CODECPAR
280 encoder->videoStream = avformat_new_stream(encoder->context, NULL);
281 encoder->video = avcodec_alloc_context3(vcodec);
282#else
283 encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
284 encoder->video = encoder->videoStream->codec;
285#endif
286 encoder->video->bit_rate = encoder->videoBitrate;
287 encoder->video->width = encoder->width;
288 encoder->video->height = encoder->height;
289 encoder->video->time_base = (AVRational) { VIDEO_TOTAL_LENGTH, GBA_ARM7TDMI_FREQUENCY };
290 encoder->video->pix_fmt = encoder->pixFormat;
291 encoder->video->gop_size = 60;
292 encoder->video->max_b_frames = 3;
293 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
294 encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
295 }
296 if (strcmp(vcodec->name, "libx264") == 0) {
297 // Try to adaptively figure out when you can use a slower encoder
298 if (encoder->width * encoder->height > 1000000) {
299 av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
300 } else if (encoder->width * encoder->height > 500000) {
301 av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
302 } else {
303 av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
304 }
305 av_opt_set(encoder->video->priv_data, "tune", "zerolatency", 0);
306 }
307 avcodec_open2(encoder->video, vcodec, 0);
308#if LIBAVCODEC_VERSION_MAJOR >= 55
309 encoder->videoFrame = av_frame_alloc();
310#else
311 encoder->videoFrame = avcodec_alloc_frame();
312#endif
313 encoder->videoFrame->format = encoder->video->pix_fmt;
314 encoder->videoFrame->width = encoder->video->width;
315 encoder->videoFrame->height = encoder->video->height;
316 encoder->videoFrame->pts = 0;
317 _ffmpegSetVideoDimensions(&encoder->d, encoder->iwidth, encoder->iheight);
318 av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->video->width, encoder->video->height, encoder->video->pix_fmt, 32);
319#ifdef FFMPEG_USE_CODECPAR
320 avcodec_parameters_from_context(encoder->videoStream->codecpar, encoder->video);
321#endif
322
323 if (avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE) < 0) {
324 return false;
325 }
326 return avformat_write_header(encoder->context, 0) >= 0;
327}
328
329void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
330 if (!encoder->context) {
331 return;
332 }
333 av_write_trailer(encoder->context);
334 avio_close(encoder->context->pb);
335
336 if (encoder->audioCodec) {
337 av_free(encoder->postaudioBuffer);
338 if (encoder->audioBuffer) {
339 av_free(encoder->audioBuffer);
340 }
341#if LIBAVCODEC_VERSION_MAJOR >= 55
342 av_frame_free(&encoder->audioFrame);
343#else
344 avcodec_free_frame(&encoder->audioFrame);
345#endif
346 avcodec_close(encoder->audio);
347
348 if (encoder->resampleContext) {
349 avresample_close(encoder->resampleContext);
350 }
351
352 if (encoder->absf) {
353#ifdef FFMPEG_USE_NEW_BSF
354 av_bsf_free(&encoder->absf);
355#else
356 av_bitstream_filter_close(encoder->absf);
357 encoder->absf = 0;
358#endif
359 }
360 }
361
362#if LIBAVCODEC_VERSION_MAJOR >= 55
363 av_frame_free(&encoder->videoFrame);
364#else
365 avcodec_free_frame(&encoder->videoFrame);
366#endif
367 avcodec_close(encoder->video);
368
369 sws_freeContext(encoder->scaleContext);
370 encoder->scaleContext = NULL;
371
372 avformat_free_context(encoder->context);
373 encoder->context = 0;
374}
375
376bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
377 return !!encoder->context;
378}
379
/* mAVStream audio callback: accepts one stereo sample pair.
 *
 * The pair is appended to the staging buffer. Once that buffer is full it is
 * pushed through the resampler; when the resampler then holds at least one
 * codec frame, that frame is encoded and the resulting packet (after the
 * optional bitstream filter) is written to the container. Does nothing when
 * no recording is open or no audio codec is selected.
 */
void _ffmpegPostAudioFrame(struct mAVStream* stream, int16_t left, int16_t right) {
	// NOTE(review): the cast presumably relies on the mAVStream `d` being the
	// first member of struct FFmpegEncoder — confirm against the header
	struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
	if (!encoder->context || !encoder->audioCodec) {
		return;
	}

	if (encoder->absf && !left) {
		// XXX: AVBSF doesn't like silence. Figure out why.
		left = 1;
	}

	// Staging buffer is interleaved: left at even indices, right at odd
	encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
	encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;

	++encoder->currentAudioSample;

	// audioBufferSize is in bytes and each stereo pair occupies 4 of them;
	// keep collecting until the buffer is full
	if (encoder->currentAudioSample * 4 < encoder->audioBufferSize) {
		return;
	}

	// Bytes per stereo sample in the codec's sample format
	int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
	// No output buffer is supplied, so the converted samples stay queued
	// inside the resampler until avresample_read below
	avresample_convert(encoder->resampleContext, 0, 0, 0,
	                   (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);

	encoder->currentAudioSample = 0;
	// Wait until the resampler holds a full codec frame
	if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
		return;
	}
#if LIBAVCODEC_VERSION_MAJOR >= 55
	av_frame_make_writable(encoder->audioFrame);
#endif
	int samples = avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);

	// currentAudioFrame counts samples already submitted; convert that count
	// from the codec time base to the stream time base for the timestamp
	encoder->audioFrame->pts = av_rescale_q(encoder->currentAudioFrame, encoder->audio->time_base, encoder->audioStream->time_base);
	encoder->currentAudioFrame += samples;

	AVPacket packet;
	av_init_packet(&packet);
	packet.data = 0;
	packet.size = 0;
	packet.pts = encoder->audioFrame->pts;

	// Non-zero when the encoder produced a packet for this call
	int gotData;
#ifdef FFMPEG_USE_PACKETS
	avcodec_send_frame(encoder->audio, encoder->audioFrame);
	gotData = avcodec_receive_packet(encoder->audio, &packet);
	gotData = (gotData == 0) && packet.size;
#else
	avcodec_encode_audio2(encoder->audio, &packet, encoder->audioFrame, &gotData);
#endif
	if (gotData) {
		if (encoder->absf) {
			// NOTE(review): tempPacket is handed to the filter without being
			// initialized; in the legacy branch only its data/size are filled
			// in before the whole struct is copied over `packet` — confirm
			// the remaining fields are safe to use
			AVPacket tempPacket;

#ifdef FFMPEG_USE_NEW_BSF
			int success = av_bsf_send_packet(encoder->absf, &packet);
			if (success >= 0) {
				success = av_bsf_receive_packet(encoder->absf, &tempPacket);
			}
#else
			int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
			                                         &tempPacket.data, &tempPacket.size,
			                                         packet.data, packet.size, 0);
#endif

			if (success >= 0) {
#if LIBAVUTIL_VERSION_MAJOR >= 53
				// Wrap the filtered data in a buffer so that releasing the
				// packet frees it.
				// NOTE(review): this replaces whatever `buf` the filter set
				// and assumes tempPacket.data is separately allocated — verify
				// for both filter APIs
				tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
#endif

#ifdef FFMPEG_USE_PACKET_UNREF
				av_packet_move_ref(&packet, &tempPacket);
#else
				av_free_packet(&packet);
				packet = tempPacket;
#endif

				packet.stream_index = encoder->audioStream->index;
				av_interleaved_write_frame(encoder->context, &packet);
			}
		} else {
			packet.stream_index = encoder->audioStream->index;
			av_interleaved_write_frame(encoder->context, &packet);
		}
	}
	// Release whatever `packet` still refers to, whether or not it was written
#ifdef FFMPEG_USE_PACKET_UNREF
	av_packet_unref(&packet);
#else
	av_free_packet(&packet);
#endif
}
471
472void _ffmpegPostVideoFrame(struct mAVStream* stream, const color_t* pixels, size_t stride) {
473 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
474 if (!encoder->context) {
475 return;
476 }
477 stride *= BYTES_PER_PIXEL;
478
479 AVPacket packet;
480
481 av_init_packet(&packet);
482 packet.data = 0;
483 packet.size = 0;
484#if LIBAVCODEC_VERSION_MAJOR >= 55
485 av_frame_make_writable(encoder->videoFrame);
486#endif
487 encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
488 packet.pts = encoder->videoFrame->pts;
489 ++encoder->currentVideoFrame;
490
491 sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, encoder->iheight, encoder->videoFrame->data, encoder->videoFrame->linesize);
492
493 int gotData;
494#ifdef FFMPEG_USE_PACKETS
495 avcodec_send_frame(encoder->video, encoder->videoFrame);
496 gotData = avcodec_receive_packet(encoder->video, &packet) == 0;
497#else
498 avcodec_encode_video2(encoder->video, &packet, encoder->videoFrame, &gotData);
499#endif
500 if (gotData) {
501#ifndef FFMPEG_USE_PACKET_UNREF
502 if (encoder->video->coded_frame->key_frame) {
503 packet.flags |= AV_PKT_FLAG_KEY;
504 }
505#endif
506 packet.stream_index = encoder->videoStream->index;
507 av_interleaved_write_frame(encoder->context, &packet);
508 }
509#ifdef FFMPEG_USE_PACKET_UNREF
510 av_packet_unref(&packet);
511#else
512 av_free_packet(&packet);
513#endif
514}
515
516static void _ffmpegSetVideoDimensions(struct mAVStream* stream, unsigned width, unsigned height) {
517 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
518 encoder->iwidth = width;
519 encoder->iheight = height;
520 if (encoder->scaleContext) {
521 sws_freeContext(encoder->scaleContext);
522 }
523 encoder->scaleContext = sws_getContext(encoder->iwidth, encoder->iheight,
524#ifdef COLOR_16_BIT
525#ifdef COLOR_5_6_5
526 AV_PIX_FMT_RGB565,
527#else
528 AV_PIX_FMT_BGR555,
529#endif
530#else
531#ifndef USE_LIBAV
532 AV_PIX_FMT_0BGR32,
533#else
534 AV_PIX_FMT_BGR32,
535#endif
536#endif
537 encoder->videoFrame->width, encoder->videoFrame->height, encoder->video->pix_fmt,
538 SWS_POINT, 0, 0, 0);
539}