src/platform/ffmpeg/ffmpeg-encoder.c (view raw)
1/* Copyright (c) 2013-2015 Jeffrey Pfau
2 *
3 * This Source Code Form is subject to the terms of the Mozilla Public
4 * License, v. 2.0. If a copy of the MPL was not distributed with this
5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include "ffmpeg-encoder.h"
7
8#include "gba/video.h"
9
10#include <libavcodec/version.h>
11#include <libavcodec/avcodec.h>
12
13#include <libavutil/version.h>
14#if LIBAVUTIL_VERSION_MAJOR >= 53
15#include <libavutil/buffer.h>
16#endif
17#include <libavutil/imgutils.h>
18#include <libavutil/mathematics.h>
19#include <libavutil/opt.h>
20
21#include <libavresample/avresample.h>
22#include <libswscale/swscale.h>
23
/* Stream callbacks installed on the encoder by FFmpegEncoderInit; defined at the end of this file. */
static void _ffmpegPostVideoFrame(struct GBAAVStream* stream, struct GBAVideoRenderer* renderer);
static void _ffmpegPostAudioFrame(struct GBAAVStream* stream, int16_t left, int16_t right);
26
/* Sample rate, in Hz, of the audio handed to the encoder (0x8000 == 32768). */
enum { PREFERRED_SAMPLE_RATE = 0x8000 };
30
31void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
32 av_register_all();
33
34 encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
35 encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
36 encoder->d.postAudioBuffer = 0;
37
38 encoder->audioCodec = 0;
39 encoder->videoCodec = 0;
40 encoder->containerFormat = 0;
41 FFmpegEncoderSetAudio(encoder, "flac", 0);
42 FFmpegEncoderSetVideo(encoder, "png", 0);
43 FFmpegEncoderSetContainer(encoder, "matroska");
44 FFmpegEncoderSetDimensions(encoder, VIDEO_HORIZONTAL_PIXELS, VIDEO_VERTICAL_PIXELS);
45 encoder->resampleContext = 0;
46 encoder->absf = 0;
47 encoder->context = 0;
48}
49
50bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
51 static const struct {
52 int format;
53 int priority;
54 } priorities[] = {
55 { AV_SAMPLE_FMT_S16, 0 },
56 { AV_SAMPLE_FMT_S16P, 1 },
57 { AV_SAMPLE_FMT_S32, 2 },
58 { AV_SAMPLE_FMT_S32P, 2 },
59 { AV_SAMPLE_FMT_FLT, 3 },
60 { AV_SAMPLE_FMT_FLTP, 3 },
61 { AV_SAMPLE_FMT_DBL, 4 },
62 { AV_SAMPLE_FMT_DBLP, 4 }
63 };
64
65 if (!acodec) {
66 encoder->audioCodec = 0;
67 return true;
68 }
69
70 AVCodec* codec = avcodec_find_encoder_by_name(acodec);
71 if (!codec) {
72 return false;
73 }
74
75 if (!codec->sample_fmts) {
76 return false;
77 }
78 size_t i;
79 size_t j;
80 int priority = INT_MAX;
81 encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
82 for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
83 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
84 if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
85 priority = priorities[j].priority;
86 encoder->sampleFormat = codec->sample_fmts[i];
87 }
88 }
89 }
90 if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
91 return false;
92 }
93 encoder->sampleRate = PREFERRED_SAMPLE_RATE;
94 if (codec->supported_samplerates) {
95 for (i = 0; codec->supported_samplerates[i]; ++i) {
96 if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
97 continue;
98 }
99 if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
100 encoder->sampleRate = codec->supported_samplerates[i];
101 }
102 }
103 } else if (codec->id == AV_CODEC_ID_AAC) {
104 // HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
105 encoder->sampleRate = 44100;
106 }
107 encoder->audioCodec = acodec;
108 encoder->audioBitrate = abr;
109 return true;
110}
111
112bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, unsigned vbr) {
113 static const struct {
114 enum AVPixelFormat format;
115 int priority;
116 } priorities[] = {
117 { AV_PIX_FMT_RGB555, 0 },
118 { AV_PIX_FMT_BGR555, 0 },
119 { AV_PIX_FMT_RGB565, 1 },
120 { AV_PIX_FMT_BGR565, 1 },
121 { AV_PIX_FMT_RGB24, 2 },
122 { AV_PIX_FMT_BGR24, 2 },
123#ifndef USE_LIBAV
124 { AV_PIX_FMT_BGR0, 3 },
125 { AV_PIX_FMT_RGB0, 3 },
126 { AV_PIX_FMT_0BGR, 3 },
127 { AV_PIX_FMT_0RGB, 3 },
128#endif
129 { AV_PIX_FMT_YUV422P, 4 },
130 { AV_PIX_FMT_YUV444P, 5 },
131 { AV_PIX_FMT_YUV420P, 6 }
132 };
133 AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
134 if (!codec) {
135 return false;
136 }
137
138 size_t i;
139 size_t j;
140 int priority = INT_MAX;
141 encoder->pixFormat = AV_PIX_FMT_NONE;
142 for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
143 for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
144 if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
145 priority = priorities[j].priority;
146 encoder->pixFormat = codec->pix_fmts[i];
147 }
148 }
149 }
150 if (encoder->pixFormat == AV_PIX_FMT_NONE) {
151 return false;
152 }
153 encoder->videoCodec = vcodec;
154 encoder->videoBitrate = vbr;
155 return true;
156}
157
158bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
159 AVOutputFormat* oformat = av_guess_format(container, 0, 0);
160 if (!oformat) {
161 return false;
162 }
163 encoder->containerFormat = container;
164 return true;
165}
166
167void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
168 encoder->width = width > 0 ? width : VIDEO_HORIZONTAL_PIXELS;
169 encoder->height = height > 0 ? height : VIDEO_VERTICAL_PIXELS;
170}
171
172bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
173 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
174 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
175 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
176 if ((encoder->audioCodec && !acodec) || !vcodec || !oformat) {
177 return false;
178 }
179 if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
180 return false;
181 }
182 if (!avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
183 return false;
184 }
185 return true;
186}
187
188bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
189 AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
190 AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
191 if ((encoder->audioCodec && !acodec) || !vcodec || !FFmpegEncoderVerifyContainer(encoder)) {
192 return false;
193 }
194
195 encoder->currentAudioSample = 0;
196 encoder->currentAudioFrame = 0;
197 encoder->currentVideoFrame = 0;
198 encoder->nextAudioPts = 0;
199
200 AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
201#ifndef USE_LIBAV
202 avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
203#else
204 encoder->context = avformat_alloc_context();
205 strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename));
206 encoder->context->oformat = oformat;
207#endif
208
209 if (acodec) {
210 encoder->audioStream = avformat_new_stream(encoder->context, acodec);
211 encoder->audio = encoder->audioStream->codec;
212 encoder->audio->bit_rate = encoder->audioBitrate;
213 encoder->audio->channels = 2;
214 encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
215 encoder->audio->sample_rate = encoder->sampleRate;
216 encoder->audio->sample_fmt = encoder->sampleFormat;
217 AVDictionary* opts = 0;
218 av_dict_set(&opts, "strict", "-2", 0);
219 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
220 encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
221 }
222 avcodec_open2(encoder->audio, acodec, &opts);
223 av_dict_free(&opts);
224#if LIBAVCODEC_VERSION_MAJOR >= 55
225 encoder->audioFrame = av_frame_alloc();
226#else
227 encoder->audioFrame = avcodec_alloc_frame();
228#endif
229 if (!encoder->audio->frame_size) {
230 encoder->audio->frame_size = 1;
231 }
232 encoder->audioFrame->nb_samples = encoder->audio->frame_size;
233 encoder->audioFrame->format = encoder->audio->sample_fmt;
234 encoder->audioFrame->pts = 0;
235 encoder->resampleContext = avresample_alloc_context();
236 av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
237 av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
238 av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
239 av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
240 av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
241 av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
242 avresample_open(encoder->resampleContext);
243 encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
244 encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
245 encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
246 encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
247 avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
248
249 if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
250 (strcasecmp(encoder->containerFormat, "mp4") ||
251 strcasecmp(encoder->containerFormat, "m4v") ||
252 strcasecmp(encoder->containerFormat, "mov"))) {
253 // MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
254 encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
255 }
256 }
257
258 encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
259 encoder->video = encoder->videoStream->codec;
260 encoder->video->bit_rate = encoder->videoBitrate;
261 encoder->video->width = encoder->width;
262 encoder->video->height = encoder->height;
263 encoder->video->time_base = (AVRational) { VIDEO_TOTAL_LENGTH, GBA_ARM7TDMI_FREQUENCY };
264 encoder->video->pix_fmt = encoder->pixFormat;
265 encoder->video->gop_size = 60;
266 encoder->video->max_b_frames = 3;
267 if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
268 encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
269 }
270 if (strcmp(vcodec->name, "libx264") == 0) {
271 // Try to adaptively figure out when you can use a slower encoder
272 if (encoder->width * encoder->height > 1000000) {
273 av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
274 } else if (encoder->width * encoder->height > 500000) {
275 av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
276 } else {
277 av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
278 }
279 av_opt_set(encoder->video->priv_data, "tune", "zerolatency", 0);
280 }
281 avcodec_open2(encoder->video, vcodec, 0);
282#if LIBAVCODEC_VERSION_MAJOR >= 55
283 encoder->videoFrame = av_frame_alloc();
284#else
285 encoder->videoFrame = avcodec_alloc_frame();
286#endif
287 encoder->videoFrame->format = encoder->video->pix_fmt;
288 encoder->videoFrame->width = encoder->video->width;
289 encoder->videoFrame->height = encoder->video->height;
290 encoder->videoFrame->pts = 0;
291 encoder->scaleContext = sws_getContext(VIDEO_HORIZONTAL_PIXELS, VIDEO_VERTICAL_PIXELS,
292#ifdef COLOR_16_BIT
293#ifdef COLOR_5_6_5
294 AV_PIX_FMT_RGB565,
295#else
296 AV_PIX_FMT_BGR555,
297#endif
298#else
299#ifndef USE_LIBAV
300 AV_PIX_FMT_0BGR32,
301#else
302 AV_PIX_FMT_BGR32,
303#endif
304#endif
305 encoder->videoFrame->width, encoder->videoFrame->height, encoder->video->pix_fmt,
306 SWS_POINT, 0, 0, 0);
307 av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->video->width, encoder->video->height, encoder->video->pix_fmt, 32);
308
309 avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE);
310 avformat_write_header(encoder->context, 0);
311
312 return true;
313}
314
315void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
316 if (!encoder->context) {
317 return;
318 }
319 av_write_trailer(encoder->context);
320 avio_close(encoder->context->pb);
321
322 if (encoder->audioCodec) {
323 av_free(encoder->postaudioBuffer);
324 if (encoder->audioBuffer) {
325 av_free(encoder->audioBuffer);
326 }
327#if LIBAVCODEC_VERSION_MAJOR >= 55
328 av_frame_free(&encoder->audioFrame);
329#else
330 avcodec_free_frame(&encoder->audioFrame);
331#endif
332 avcodec_close(encoder->audio);
333
334 if (encoder->resampleContext) {
335 avresample_close(encoder->resampleContext);
336 }
337
338 if (encoder->absf) {
339 av_bitstream_filter_close(encoder->absf);
340 encoder->absf = 0;
341 }
342 }
343
344#if LIBAVCODEC_VERSION_MAJOR >= 55
345 av_frame_free(&encoder->videoFrame);
346#else
347 avcodec_free_frame(&encoder->videoFrame);
348#endif
349 avcodec_close(encoder->video);
350
351 sws_freeContext(encoder->scaleContext);
352
353 avformat_free_context(encoder->context);
354 encoder->context = 0;
355}
356
357bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
358 return !!encoder->context;
359}
360
361void _ffmpegPostAudioFrame(struct GBAAVStream* stream, int16_t left, int16_t right) {
362 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
363 if (!encoder->context || !encoder->audioCodec) {
364 return;
365 }
366
367 encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
368 encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;
369
370 ++encoder->currentAudioFrame;
371 ++encoder->currentAudioSample;
372
373 if ((encoder->currentAudioSample * 4) < encoder->audioBufferSize) {
374 return;
375 }
376 encoder->currentAudioSample = 0;
377
378 int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
379 avresample_convert(encoder->resampleContext,
380 0, 0, 0,
381 (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);
382 if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
383 return;
384 }
385#if LIBAVCODEC_VERSION_MAJOR >= 55
386 av_frame_make_writable(encoder->audioFrame);
387#endif
388 avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);
389
390 AVRational timeBase = { 1, PREFERRED_SAMPLE_RATE };
391 encoder->audioFrame->pts = encoder->nextAudioPts;
392 encoder->nextAudioPts = av_rescale_q(encoder->currentAudioFrame, timeBase, encoder->audioStream->time_base);
393
394 AVPacket packet;
395 av_init_packet(&packet);
396 packet.data = 0;
397 packet.size = 0;
398 int gotData;
399 avcodec_encode_audio2(encoder->audio, &packet, encoder->audioFrame, &gotData);
400 if (gotData) {
401 if (encoder->absf) {
402 AVPacket tempPacket = packet;
403 int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
404 &tempPacket.data, &tempPacket.size,
405 packet.data, packet.size, 0);
406 if (success > 0) {
407#if LIBAVUTIL_VERSION_MAJOR >= 53
408 tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
409#endif
410 av_free_packet(&packet);
411 }
412 packet = tempPacket;
413 }
414 packet.stream_index = encoder->audioStream->index;
415 av_interleaved_write_frame(encoder->context, &packet);
416 }
417 av_free_packet(&packet);
418}
419
420void _ffmpegPostVideoFrame(struct GBAAVStream* stream, struct GBAVideoRenderer* renderer) {
421 struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
422 if (!encoder->context) {
423 return;
424 }
425 uint8_t* pixels;
426 unsigned stride;
427 renderer->getPixels(renderer, &stride, (void**) &pixels);
428 stride *= BYTES_PER_PIXEL;
429
430 AVPacket packet;
431
432 av_init_packet(&packet);
433 packet.data = 0;
434 packet.size = 0;
435#if LIBAVCODEC_VERSION_MAJOR >= 55
436 av_frame_make_writable(encoder->videoFrame);
437#endif
438 encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
439 ++encoder->currentVideoFrame;
440
441 sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, VIDEO_VERTICAL_PIXELS, encoder->videoFrame->data, encoder->videoFrame->linesize);
442
443 int gotData;
444 avcodec_encode_video2(encoder->video, &packet, encoder->videoFrame, &gotData);
445 if (gotData) {
446 if (encoder->videoStream->codec->coded_frame->key_frame) {
447 packet.flags |= AV_PKT_FLAG_KEY;
448 }
449 packet.stream_index = encoder->videoStream->index;
450 av_interleaved_write_frame(encoder->context, &packet);
451 }
452 av_free_packet(&packet);
453}