1 /* Copyright (c) 2013-2015 Jeffrey Pfau
2  *
3  * This Source Code Form is subject to the terms of the Mozilla Public
4  * License, v. 2.0. If a copy of the MPL was not distributed with this
5  * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6 #include "ffmpeg-encoder.h"
7 
8 #include <mgba/core/core.h>
9 #include <mgba/gba/interface.h>
10 #include <mgba/internal/gba/gba.h>
11 #include <mgba-util/math.h>
12 
13 #include <libavcodec/version.h>
14 #include <libavcodec/avcodec.h>
15 
16 #include <libavfilter/buffersink.h>
17 #include <libavfilter/buffersrc.h>
18 
19 #include <libavutil/version.h>
20 #if LIBAVUTIL_VERSION_MAJOR >= 53
21 #include <libavutil/buffer.h>
22 #endif
23 #include <libavutil/imgutils.h>
24 #include <libavutil/mathematics.h>
25 #include <libavutil/opt.h>
26 
27 #ifdef USE_LIBAVRESAMPLE
28 #include <libavresample/avresample.h>
29 #else
30 #include <libswresample/swresample.h>
31 #endif
32 #include <libswscale/swscale.h>
33 
34 static void _ffmpegPostVideoFrame(struct mAVStream*, const color_t* pixels, size_t stride);
35 static void _ffmpegPostAudioFrame(struct mAVStream*, int16_t left, int16_t right);
36 static void _ffmpegSetVideoDimensions(struct mAVStream*, unsigned width, unsigned height);
37 
38 static bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame);
39 static bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame);
40 
41 enum {
42 	PREFERRED_SAMPLE_RATE = 0x8000
43 };
44 
FFmpegEncoderInit(struct FFmpegEncoder * encoder)45 void FFmpegEncoderInit(struct FFmpegEncoder* encoder) {
46 #if LIBAVFORMAT_VERSION_INT < AV_VERSION_INT(58, 9, 100)
47 	av_register_all();
48 #endif
49 
50 	encoder->d.videoDimensionsChanged = _ffmpegSetVideoDimensions;
51 	encoder->d.postVideoFrame = _ffmpegPostVideoFrame;
52 	encoder->d.postAudioFrame = _ffmpegPostAudioFrame;
53 	encoder->d.postAudioBuffer = 0;
54 
55 	encoder->audioCodec = NULL;
56 	encoder->videoCodec = NULL;
57 	encoder->containerFormat = NULL;
58 	FFmpegEncoderSetAudio(encoder, "flac", 0);
59 	FFmpegEncoderSetVideo(encoder, "libx264", 0, 0);
60 	FFmpegEncoderSetContainer(encoder, "matroska");
61 	FFmpegEncoderSetDimensions(encoder, GBA_VIDEO_HORIZONTAL_PIXELS, GBA_VIDEO_VERTICAL_PIXELS);
62 	encoder->iwidth = GBA_VIDEO_HORIZONTAL_PIXELS;
63 	encoder->iheight = GBA_VIDEO_VERTICAL_PIXELS;
64 	encoder->frameskip = 1;
65 	encoder->skipResidue = 0;
66 	encoder->loop = false;
67 	encoder->ipixFormat =
68 #ifdef COLOR_16_BIT
69 #ifdef COLOR_5_6_5
70 	    AV_PIX_FMT_RGB565;
71 #else
72 	    AV_PIX_FMT_BGR555;
73 #endif
74 #else
75 #ifndef USE_LIBAV
76 	    AV_PIX_FMT_0BGR32;
77 #else
78 	    AV_PIX_FMT_BGR32;
79 #endif
80 #endif
81 	encoder->resampleContext = NULL;
82 	encoder->absf = NULL;
83 	encoder->context = NULL;
84 	encoder->scaleContext = NULL;
85 	encoder->audio = NULL;
86 	encoder->audioStream = NULL;
87 	encoder->audioFrame = NULL;
88 	encoder->audioBuffer = NULL;
89 	encoder->postaudioBuffer = NULL;
90 	encoder->video = NULL;
91 	encoder->videoStream = NULL;
92 	encoder->videoFrame = NULL;
93 	encoder->graph = NULL;
94 	encoder->source = NULL;
95 	encoder->sink = NULL;
96 	encoder->sinkFrame = NULL;
97 	FFmpegEncoderSetInputFrameRate(encoder, VIDEO_TOTAL_LENGTH, GBA_ARM7TDMI_FREQUENCY);
98 
99 	int i;
100 	for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
101 		encoder->filters[i] = NULL;
102 	}
103 }
104 
FFmpegEncoderSetAudio(struct FFmpegEncoder * encoder,const char * acodec,unsigned abr)105 bool FFmpegEncoderSetAudio(struct FFmpegEncoder* encoder, const char* acodec, unsigned abr) {
106 	static const struct {
107 		int format;
108 		int priority;
109 	} priorities[] = {
110 		{ AV_SAMPLE_FMT_S16, 0 },
111 		{ AV_SAMPLE_FMT_S16P, 1 },
112 		{ AV_SAMPLE_FMT_S32, 2 },
113 		{ AV_SAMPLE_FMT_S32P, 2 },
114 		{ AV_SAMPLE_FMT_FLT, 3 },
115 		{ AV_SAMPLE_FMT_FLTP, 3 },
116 		{ AV_SAMPLE_FMT_DBL, 4 },
117 		{ AV_SAMPLE_FMT_DBLP, 4 }
118 	};
119 
120 	if (!acodec) {
121 		encoder->audioCodec = 0;
122 		return true;
123 	}
124 
125 	AVCodec* codec = avcodec_find_encoder_by_name(acodec);
126 	if (!codec) {
127 		return false;
128 	}
129 
130 	if (!codec->sample_fmts) {
131 		return false;
132 	}
133 	size_t i;
134 	size_t j;
135 	int priority = INT_MAX;
136 	encoder->sampleFormat = AV_SAMPLE_FMT_NONE;
137 	for (i = 0; codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
138 		for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
139 			if (codec->sample_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
140 				priority = priorities[j].priority;
141 				encoder->sampleFormat = codec->sample_fmts[i];
142 			}
143 		}
144 	}
145 	if (encoder->sampleFormat == AV_SAMPLE_FMT_NONE) {
146 		return false;
147 	}
148 	encoder->sampleRate = PREFERRED_SAMPLE_RATE;
149 	if (codec->supported_samplerates) {
150 		for (i = 0; codec->supported_samplerates[i]; ++i) {
151 			if (codec->supported_samplerates[i] < PREFERRED_SAMPLE_RATE) {
152 				continue;
153 			}
154 			if (encoder->sampleRate == PREFERRED_SAMPLE_RATE || encoder->sampleRate > codec->supported_samplerates[i]) {
155 				encoder->sampleRate = codec->supported_samplerates[i];
156 			}
157 		}
158 	} else if (codec->id == AV_CODEC_ID_AAC) {
159 		// HACK: AAC doesn't support 32768Hz (it rounds to 32000), but libfaac doesn't tell us that
160 		encoder->sampleRate = 44100;
161 	}
162 	encoder->audioCodec = acodec;
163 	encoder->audioBitrate = abr;
164 	return true;
165 }
166 
FFmpegEncoderSetVideo(struct FFmpegEncoder * encoder,const char * vcodec,int vbr,int frameskip)167 bool FFmpegEncoderSetVideo(struct FFmpegEncoder* encoder, const char* vcodec, int vbr, int frameskip) {
168 	static const struct {
169 		enum AVPixelFormat format;
170 		int priority;
171 	} priorities[] = {
172 		{ AV_PIX_FMT_RGB555, 0 },
173 		{ AV_PIX_FMT_BGR555, 0 },
174 		{ AV_PIX_FMT_RGB565, 1 },
175 		{ AV_PIX_FMT_BGR565, 1 },
176 		{ AV_PIX_FMT_RGB24, 2 },
177 		{ AV_PIX_FMT_BGR24, 2 },
178 #ifndef USE_LIBAV
179 		{ AV_PIX_FMT_BGR0, 3 },
180 		{ AV_PIX_FMT_RGB0, 3 },
181 		{ AV_PIX_FMT_0BGR, 3 },
182 		{ AV_PIX_FMT_0RGB, 3 },
183 #endif
184 		{ AV_PIX_FMT_RGB32, 4},
185 		{ AV_PIX_FMT_BGR32, 4},
186 		{ AV_PIX_FMT_YUV444P, 5 },
187 		{ AV_PIX_FMT_YUV422P, 6 },
188 		{ AV_PIX_FMT_YUV420P, 7 },
189 		{ AV_PIX_FMT_PAL8, 8 },
190 	};
191 
192 	if (!vcodec) {
193 		encoder->videoCodec = 0;
194 		return true;
195 	}
196 
197 	AVCodec* codec = avcodec_find_encoder_by_name(vcodec);
198 	if (!codec) {
199 		return false;
200 	}
201 
202 	size_t i;
203 	size_t j;
204 	int priority = INT_MAX;
205 	encoder->pixFormat = AV_PIX_FMT_NONE;
206 	for (i = 0; codec->pix_fmts[i] != AV_PIX_FMT_NONE; ++i) {
207 		for (j = 0; j < sizeof(priorities) / sizeof(*priorities); ++j) {
208 			if (codec->pix_fmts[i] == priorities[j].format && priority > priorities[j].priority) {
209 				priority = priorities[j].priority;
210 				encoder->pixFormat = codec->pix_fmts[i];
211 			}
212 		}
213 	}
214 	if (encoder->pixFormat == AV_PIX_FMT_NONE) {
215 		return false;
216 	}
217 	if (vbr < 0 && !av_opt_find(&codec->priv_class, "crf", NULL, 0, 0)) {
218 		return false;
219 	}
220 	encoder->videoCodec = vcodec;
221 	encoder->videoBitrate = vbr;
222 	encoder->frameskip = frameskip + 1;
223 	return true;
224 }
225 
FFmpegEncoderSetContainer(struct FFmpegEncoder * encoder,const char * container)226 bool FFmpegEncoderSetContainer(struct FFmpegEncoder* encoder, const char* container) {
227 	AVOutputFormat* oformat = av_guess_format(container, 0, 0);
228 	if (!oformat) {
229 		return false;
230 	}
231 	encoder->containerFormat = container;
232 	return true;
233 }
234 
FFmpegEncoderSetDimensions(struct FFmpegEncoder * encoder,int width,int height)235 void FFmpegEncoderSetDimensions(struct FFmpegEncoder* encoder, int width, int height) {
236 	encoder->width = width > 0 ? width : GBA_VIDEO_HORIZONTAL_PIXELS;
237 	encoder->height = height > 0 ? height : GBA_VIDEO_VERTICAL_PIXELS;
238 }
239 
FFmpegEncoderSetLooping(struct FFmpegEncoder * encoder,bool loop)240 void FFmpegEncoderSetLooping(struct FFmpegEncoder* encoder, bool loop) {
241 	encoder->loop = loop;
242 }
243 
FFmpegEncoderVerifyContainer(struct FFmpegEncoder * encoder)244 bool FFmpegEncoderVerifyContainer(struct FFmpegEncoder* encoder) {
245 	AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
246 	AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
247 	AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
248 	if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !oformat || (!acodec && !vcodec)) {
249 		return false;
250 	}
251 	if (encoder->audioCodec && !avformat_query_codec(oformat, acodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
252 		return false;
253 	}
254 	if (encoder->videoCodec && !avformat_query_codec(oformat, vcodec->id, FF_COMPLIANCE_EXPERIMENTAL)) {
255 		return false;
256 	}
257 	return true;
258 }
259 
FFmpegEncoderOpen(struct FFmpegEncoder * encoder,const char * outfile)260 bool FFmpegEncoderOpen(struct FFmpegEncoder* encoder, const char* outfile) {
261 	AVCodec* acodec = avcodec_find_encoder_by_name(encoder->audioCodec);
262 	AVCodec* vcodec = avcodec_find_encoder_by_name(encoder->videoCodec);
263 	if ((encoder->audioCodec && !acodec) || (encoder->videoCodec && !vcodec) || !FFmpegEncoderVerifyContainer(encoder)) {
264 		return false;
265 	}
266 
267 	if (encoder->context) {
268 		return false;
269 	}
270 
271 	encoder->currentAudioSample = 0;
272 	encoder->currentAudioFrame = 0;
273 	encoder->currentVideoFrame = 0;
274 	encoder->skipResidue = 0;
275 
276 	AVOutputFormat* oformat = av_guess_format(encoder->containerFormat, 0, 0);
277 #ifndef USE_LIBAV
278 	avformat_alloc_output_context2(&encoder->context, oformat, 0, outfile);
279 #else
280 	encoder->context = avformat_alloc_context();
281 	strncpy(encoder->context->filename, outfile, sizeof(encoder->context->filename) - 1);
282 	encoder->context->filename[sizeof(encoder->context->filename) - 1] = '\0';
283 	encoder->context->oformat = oformat;
284 #endif
285 
286 	if (acodec) {
287 #ifdef FFMPEG_USE_CODECPAR
288 		encoder->audioStream = avformat_new_stream(encoder->context, NULL);
289 		encoder->audio = avcodec_alloc_context3(acodec);
290 #else
291 		encoder->audioStream = avformat_new_stream(encoder->context, acodec);
292 		encoder->audio = encoder->audioStream->codec;
293 #endif
294 		encoder->audio->bit_rate = encoder->audioBitrate;
295 		encoder->audio->channels = 2;
296 		encoder->audio->channel_layout = AV_CH_LAYOUT_STEREO;
297 		encoder->audio->sample_rate = encoder->sampleRate;
298 		encoder->audio->sample_fmt = encoder->sampleFormat;
299 		AVDictionary* opts = 0;
300 		av_dict_set(&opts, "strict", "-2", 0);
301 		if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
302 #ifdef AV_CODEC_FLAG_GLOBAL_HEADER
303 			encoder->audio->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
304 #else
305 			encoder->audio->flags |= CODEC_FLAG_GLOBAL_HEADER;
306 #endif
307 		}
308 		int res = avcodec_open2(encoder->audio, acodec, &opts);
309 		av_dict_free(&opts);
310 		if (res < 0) {
311 			FFmpegEncoderClose(encoder);
312 			return false;
313 		}
314 #if LIBAVCODEC_VERSION_MAJOR >= 55
315 		encoder->audioFrame = av_frame_alloc();
316 #else
317 		encoder->audioFrame = avcodec_alloc_frame();
318 #endif
319 		if (!encoder->audio->frame_size) {
320 			encoder->audio->frame_size = 1;
321 		}
322 		encoder->audioFrame->nb_samples = encoder->audio->frame_size;
323 		encoder->audioFrame->format = encoder->audio->sample_fmt;
324 		encoder->audioFrame->pts = 0;
325 #ifdef USE_LIBAVRESAMPLE
326 		encoder->resampleContext = avresample_alloc_context();
327 		av_opt_set_int(encoder->resampleContext, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
328 		av_opt_set_int(encoder->resampleContext, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
329 		av_opt_set_int(encoder->resampleContext, "in_sample_rate", PREFERRED_SAMPLE_RATE, 0);
330 		av_opt_set_int(encoder->resampleContext, "out_sample_rate", encoder->sampleRate, 0);
331 		av_opt_set_int(encoder->resampleContext, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
332 		av_opt_set_int(encoder->resampleContext, "out_sample_fmt", encoder->sampleFormat, 0);
333 		avresample_open(encoder->resampleContext);
334 #else
335 		encoder->resampleContext = swr_alloc_set_opts(NULL, AV_CH_LAYOUT_STEREO, encoder->sampleFormat, encoder->sampleRate,
336 		                                              AV_CH_LAYOUT_STEREO, AV_SAMPLE_FMT_S16, PREFERRED_SAMPLE_RATE, 0, NULL);
337 		swr_init(encoder->resampleContext);
338 #endif
339 		encoder->audioBufferSize = (encoder->audioFrame->nb_samples * PREFERRED_SAMPLE_RATE / encoder->sampleRate) * 4;
340 		encoder->audioBuffer = av_malloc(encoder->audioBufferSize);
341 		encoder->postaudioBufferSize = av_samples_get_buffer_size(0, encoder->audio->channels, encoder->audio->frame_size, encoder->audio->sample_fmt, 0);
342 		encoder->postaudioBuffer = av_malloc(encoder->postaudioBufferSize);
343 		avcodec_fill_audio_frame(encoder->audioFrame, encoder->audio->channels, encoder->audio->sample_fmt, (const uint8_t*) encoder->postaudioBuffer, encoder->postaudioBufferSize, 0);
344 
345 		if (encoder->audio->codec->id == AV_CODEC_ID_AAC &&
346 		    (strcasecmp(encoder->containerFormat, "mp4") ||
347 		        strcasecmp(encoder->containerFormat, "m4v") ||
348 		        strcasecmp(encoder->containerFormat, "mov"))) {
349 			// MP4 container doesn't support the raw ADTS AAC format that the encoder spits out
350 #ifdef FFMPEG_USE_NEW_BSF
351 			av_bsf_alloc(av_bsf_get_by_name("aac_adtstoasc"), &encoder->absf);
352 			avcodec_parameters_from_context(encoder->absf->par_in, encoder->audio);
353 			av_bsf_init(encoder->absf);
354 #else
355 			encoder->absf = av_bitstream_filter_init("aac_adtstoasc");
356 #endif
357 		}
358 #ifdef FFMPEG_USE_CODECPAR
359 		avcodec_parameters_from_context(encoder->audioStream->codecpar, encoder->audio);
360 #endif
361 	}
362 
363 	if (vcodec) {
364 #ifdef FFMPEG_USE_CODECPAR
365 		encoder->videoStream = avformat_new_stream(encoder->context, NULL);
366 		encoder->video = avcodec_alloc_context3(vcodec);
367 #else
368 		encoder->videoStream = avformat_new_stream(encoder->context, vcodec);
369 		encoder->video = encoder->videoStream->codec;
370 #endif
371 		encoder->video->bit_rate = encoder->videoBitrate;
372 		encoder->video->width = encoder->width;
373 		encoder->video->height = encoder->height;
374 		encoder->video->time_base = (AVRational) { encoder->frameCycles * encoder->frameskip, encoder->cycles };
375 		encoder->video->framerate = (AVRational) { encoder->cycles, encoder->frameCycles * encoder->frameskip };
376 		encoder->videoStream->time_base = encoder->video->time_base;
377 		encoder->videoStream->avg_frame_rate = encoder->video->framerate;
378 		encoder->video->pix_fmt = encoder->pixFormat;
379 		encoder->video->gop_size = 60;
380 		encoder->video->max_b_frames = 3;
381 		if (encoder->context->oformat->flags & AVFMT_GLOBALHEADER) {
382 #ifdef AV_CODEC_FLAG_GLOBAL_HEADER
383 			encoder->video->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
384 #else
385 			encoder->video->flags |= CODEC_FLAG_GLOBAL_HEADER;
386 #endif
387 		}
388 
389 		if (encoder->video->codec->id == AV_CODEC_ID_H264 &&
390 		    (strcasecmp(encoder->containerFormat, "mp4") ||
391 		        strcasecmp(encoder->containerFormat, "m4v") ||
392 		        strcasecmp(encoder->containerFormat, "mov"))) {
393 			// QuickTime and a few other things require YUV420
394 			encoder->video->pix_fmt = AV_PIX_FMT_YUV420P;
395 		}
396 		if (encoder->video->codec->id == AV_CODEC_ID_FFV1) {
397 #if LIBAVCODEC_VERSION_MAJOR >= 57
398 			av_opt_set(encoder->video->priv_data, "coder", "range_tab", 0);
399 			av_opt_set_int(encoder->video->priv_data, "context", 1, 0);
400 #endif
401 			encoder->video->gop_size = 128;
402 			encoder->video->level = 3;
403 		}
404 
405 		if (encoder->video->codec->id == AV_CODEC_ID_PNG) {
406 			encoder->video->compression_level = 8;
407 		}
408 #if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(58, 48, 100)
409 		if (encoder->video->codec->id == AV_CODEC_ID_ZMBV) {
410 			encoder->video->compression_level = 5;
411 			encoder->video->pix_fmt = AV_PIX_FMT_BGR0;
412 		}
413 #endif
414 		if (strcmp(vcodec->name, "libx264") == 0 || strcmp(vcodec->name, "libx264rgb") == 0) {
415 			// Try to adaptively figure out when you can use a slower encoder
416 			if (encoder->width * encoder->height > 1000000) {
417 				av_opt_set(encoder->video->priv_data, "preset", "superfast", 0);
418 			} else if (encoder->width * encoder->height > 500000) {
419 				av_opt_set(encoder->video->priv_data, "preset", "veryfast", 0);
420 			} else {
421 				av_opt_set(encoder->video->priv_data, "preset", "faster", 0);
422 			}
423 			av_opt_set(encoder->video->priv_data, "tune", "zerolatency", 0);
424 			if (encoder->videoBitrate == 0) {
425 				av_opt_set(encoder->video->priv_data, "qp", "0", 0);
426 				if (strcmp(vcodec->name, "libx264") == 0) {
427 					encoder->video->pix_fmt = AV_PIX_FMT_YUV444P;
428 				}
429 			} else if (encoder->videoBitrate < 0) {
430 				av_opt_set_int(encoder->video->priv_data, "crf", -encoder->videoBitrate, 0);
431 			}
432 		} else if (encoder->videoBitrate < 0) {
433 			if (strcmp(vcodec->name, "libvpx") == 0 || strcmp(vcodec->name, "libvpx-vp9") == 0 || strcmp(vcodec->name, "libx265") == 0) {
434 				av_opt_set_int(encoder->video->priv_data, "crf", -encoder->videoBitrate, 0);
435 			} else {
436 				FFmpegEncoderClose(encoder);
437 				return false;
438 			}
439 		}
440 		if (strncmp(vcodec->name, "libvpx", 6) == 0) {
441 			av_opt_set_int(encoder->video->priv_data, "cpu-used", 2, 0);
442 			av_opt_set(encoder->video->priv_data, "deadline", "realtime", 0);
443 		}
444 		if (strcmp(vcodec->name, "libvpx-vp9") == 0 && encoder->videoBitrate == 0) {
445 			av_opt_set_int(encoder->video->priv_data, "lossless", 1, 0);
446 			av_opt_set_int(encoder->video->priv_data, "crf", 0, 0);
447 			encoder->video->gop_size = 120;
448 			encoder->video->pix_fmt = AV_PIX_FMT_GBRP;
449 		}
450 		if (strcmp(vcodec->name, "libwebp_anim") == 0 && encoder->videoBitrate == 0) {
451 			av_opt_set(encoder->video->priv_data, "lossless", "1", 0);
452 			encoder->video->pix_fmt = AV_PIX_FMT_RGB32;
453 		}
454 
455 		if (encoder->pixFormat == AV_PIX_FMT_PAL8) {
456 			encoder->graph = avfilter_graph_alloc();
457 
458 			const struct AVFilter* source = avfilter_get_by_name("buffer");
459 			const struct AVFilter* sink = avfilter_get_by_name("buffersink");
460 			const struct AVFilter* split = avfilter_get_by_name("split");
461 			const struct AVFilter* palettegen = avfilter_get_by_name("palettegen");
462 			const struct AVFilter* paletteuse = avfilter_get_by_name("paletteuse");
463 
464 			if (!source || !sink || !split || !palettegen || !paletteuse || !encoder->graph) {
465 				FFmpegEncoderClose(encoder);
466 				return false;
467 			}
468 
469 			char args[256];
470 			snprintf(args, sizeof(args), "video_size=%dx%d:pix_fmt=%d:time_base=%d/%d",
471 			         encoder->video->width, encoder->video->height, encoder->ipixFormat,
472 			         encoder->video->time_base.num, encoder->video->time_base.den);
473 
474 			int res = 0;
475 			res |= avfilter_graph_create_filter(&encoder->source, source, NULL, args, NULL, encoder->graph);
476 			res |= avfilter_graph_create_filter(&encoder->sink, sink, NULL, NULL, NULL, encoder->graph);
477 			res |= avfilter_graph_create_filter(&encoder->filters[0], split, NULL, NULL, NULL, encoder->graph);
478 			res |= avfilter_graph_create_filter(&encoder->filters[1], palettegen, NULL, "reserve_transparent=off", NULL, encoder->graph);
479 			res |= avfilter_graph_create_filter(&encoder->filters[2], paletteuse, NULL, "dither=none", NULL, encoder->graph);
480 			if (res < 0) {
481 				FFmpegEncoderClose(encoder);
482 				return false;
483 			}
484 
485 			res = 0;
486 			res |= avfilter_link(encoder->source, 0, encoder->filters[0], 0);
487 			res |= avfilter_link(encoder->filters[0], 0, encoder->filters[1], 0);
488 			res |= avfilter_link(encoder->filters[0], 1, encoder->filters[2], 0);
489 			res |= avfilter_link(encoder->filters[1], 0, encoder->filters[2], 1);
490 			res |= avfilter_link(encoder->filters[2], 0, encoder->sink, 0);
491 			if (res < 0 || avfilter_graph_config(encoder->graph, NULL) < 0) {
492 				FFmpegEncoderClose(encoder);
493 				return false;
494 			}
495 
496 #if LIBAVCODEC_VERSION_MAJOR >= 55
497 			encoder->sinkFrame = av_frame_alloc();
498 #else
499 			encoder->sinkFrame = avcodec_alloc_frame();
500 #endif
501 		}
502 		AVDictionary* opts = 0;
503 		av_dict_set(&opts, "strict", "-2", 0);
504 		int res = avcodec_open2(encoder->video, vcodec, &opts);
505 		av_dict_free(&opts);
506 		if (res < 0) {
507 			FFmpegEncoderClose(encoder);
508 			return false;
509 		}
510 #if LIBAVCODEC_VERSION_MAJOR >= 55
511 		encoder->videoFrame = av_frame_alloc();
512 #else
513 		encoder->videoFrame = avcodec_alloc_frame();
514 #endif
515 		encoder->videoFrame->format = encoder->video->pix_fmt != AV_PIX_FMT_PAL8 ? encoder->video->pix_fmt : encoder->ipixFormat;
516 		encoder->videoFrame->width = encoder->video->width;
517 		encoder->videoFrame->height = encoder->video->height;
518 		encoder->videoFrame->pts = 0;
519 		_ffmpegSetVideoDimensions(&encoder->d, encoder->iwidth, encoder->iheight);
520 		av_image_alloc(encoder->videoFrame->data, encoder->videoFrame->linesize, encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format, 32);
521 #ifdef FFMPEG_USE_CODECPAR
522 		avcodec_parameters_from_context(encoder->videoStream->codecpar, encoder->video);
523 #endif
524 	}
525 
526 	if (strcmp(encoder->containerFormat, "gif") == 0) {
527 		av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "-1", 0);
528 	} else if (strcmp(encoder->containerFormat, "apng") == 0) {
529 		av_opt_set(encoder->context->priv_data, "plays", encoder->loop ? "0" : "1", 0);
530 	} else if (strcmp(encoder->containerFormat, "webp") == 0) {
531 		av_opt_set(encoder->context->priv_data, "loop", encoder->loop ? "0" : "1", 0);
532 	}
533 
534 	AVDictionary* opts = 0;
535 	av_dict_set(&opts, "strict", "-2", 0);
536 	bool res = avio_open(&encoder->context->pb, outfile, AVIO_FLAG_WRITE) < 0 || avformat_write_header(encoder->context, &opts) < 0;
537 	av_dict_free(&opts);
538 	if (res) {
539 		FFmpegEncoderClose(encoder);
540 		return false;
541 	}
542 	return true;
543 }
544 
FFmpegEncoderClose(struct FFmpegEncoder * encoder)545 void FFmpegEncoderClose(struct FFmpegEncoder* encoder) {
546 	if (encoder->audio) {
547 		while (true) {
548 			if (!_ffmpegWriteAudioFrame(encoder, NULL)) {
549 				break;
550 			}
551 		}
552 	}
553 	if (encoder->video) {
554 		if (encoder->graph) {
555 			if (av_buffersrc_add_frame(encoder->source, NULL) >= 0) {
556 				while (true) {
557 					int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
558 					if (res < 0) {
559 						break;
560 					}
561 					_ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
562 					av_frame_unref(encoder->sinkFrame);
563 				}
564 			}
565 		}
566 		while (true) {
567 			if (!_ffmpegWriteVideoFrame(encoder, NULL)) {
568 				break;
569 			}
570 		}
571 	}
572 
573 	if (encoder->context && encoder->context->pb) {
574 		av_write_trailer(encoder->context);
575 		avio_close(encoder->context->pb);
576 	}
577 
578 	if (encoder->postaudioBuffer) {
579 		av_free(encoder->postaudioBuffer);
580 		encoder->postaudioBuffer = NULL;
581 	}
582 	if (encoder->audioBuffer) {
583 		av_free(encoder->audioBuffer);
584 		encoder->audioBuffer = NULL;
585 	}
586 
587 	if (encoder->audioFrame) {
588 #if LIBAVCODEC_VERSION_MAJOR >= 55
589 		av_frame_free(&encoder->audioFrame);
590 #else
591 		avcodec_free_frame(&encoder->audioFrame);
592 #endif
593 	}
594 	if (encoder->audio) {
595 #ifdef FFMPEG_USE_CODECPAR
596 		avcodec_free_context(&encoder->audio);
597 #else
598 		avcodec_close(encoder->audio);
599 		encoder->audio = NULL;
600 #endif
601 	}
602 
603 	if (encoder->resampleContext) {
604 #ifdef USE_LIBAVRESAMPLE
605 		avresample_close(encoder->resampleContext);
606 		encoder->resampleContext = NULL;
607 #else
608 		swr_free(&encoder->resampleContext);
609 #endif
610 	}
611 
612 	if (encoder->absf) {
613 #ifdef FFMPEG_USE_NEW_BSF
614 		av_bsf_free(&encoder->absf);
615 #else
616 		av_bitstream_filter_close(encoder->absf);
617 		encoder->absf = NULL;
618 #endif
619 	}
620 
621 	if (encoder->videoFrame) {
622 		av_freep(encoder->videoFrame->data);
623 #if LIBAVCODEC_VERSION_MAJOR >= 55
624 		av_frame_free(&encoder->videoFrame);
625 #else
626 		avcodec_free_frame(&encoder->videoFrame);
627 #endif
628 	}
629 
630 	if (encoder->sinkFrame) {
631 #if LIBAVCODEC_VERSION_MAJOR >= 55
632 		av_frame_free(&encoder->sinkFrame);
633 #else
634 		avcodec_free_frame(&encoder->sinkFrame);
635 #endif
636 		encoder->sinkFrame = NULL;
637 	}
638 
639 	if (encoder->video) {
640 #ifdef FFMPEG_USE_CODECPAR
641 		avcodec_free_context(&encoder->video);
642 #else
643 		avcodec_close(encoder->video);
644 		encoder->video = NULL;
645 #endif
646 	}
647 
648 	if (encoder->scaleContext) {
649 		sws_freeContext(encoder->scaleContext);
650 		encoder->scaleContext = NULL;
651 	}
652 
653 	if (encoder->graph) {
654 		avfilter_graph_free(&encoder->graph);
655 		encoder->graph = NULL;
656 		encoder->source = NULL;
657 		encoder->sink = NULL;
658 
659 		int i;
660 		for (i = 0; i < FFMPEG_FILTERS_MAX; ++i) {
661 			encoder->filters[i] = NULL;
662 		}
663 	}
664 
665 	if (encoder->context) {
666 		avformat_free_context(encoder->context);
667 		encoder->context = NULL;
668 	}
669 }
670 
FFmpegEncoderIsOpen(struct FFmpegEncoder * encoder)671 bool FFmpegEncoderIsOpen(struct FFmpegEncoder* encoder) {
672 	return !!encoder->context;
673 }
674 
_ffmpegPostAudioFrame(struct mAVStream * stream,int16_t left,int16_t right)675 void _ffmpegPostAudioFrame(struct mAVStream* stream, int16_t left, int16_t right) {
676 	struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
677 	if (!encoder->context || !encoder->audioCodec) {
678 		return;
679 	}
680 
681 	if (encoder->absf && !left) {
682 		// XXX: AVBSF doesn't like silence. Figure out why.
683 		left = 1;
684 	}
685 
686 	encoder->audioBuffer[encoder->currentAudioSample * 2] = left;
687 	encoder->audioBuffer[encoder->currentAudioSample * 2 + 1] = right;
688 
689 	++encoder->currentAudioSample;
690 
691 	if (encoder->currentAudioSample * 4 < encoder->audioBufferSize) {
692 		return;
693 	}
694 
695 	int channelSize = 2 * av_get_bytes_per_sample(encoder->audio->sample_fmt);
696 	encoder->currentAudioSample = 0;
697 #ifdef USE_LIBAVRESAMPLE
698 	avresample_convert(encoder->resampleContext, 0, 0, 0,
699 	                   (uint8_t**) &encoder->audioBuffer, 0, encoder->audioBufferSize / 4);
700 
701 	if (avresample_available(encoder->resampleContext) < encoder->audioFrame->nb_samples) {
702 		return;
703 	}
704 #if LIBAVCODEC_VERSION_MAJOR >= 55
705 	av_frame_make_writable(encoder->audioFrame);
706 #endif
707 	int samples = avresample_read(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize);
708 #else
709 #if LIBAVCODEC_VERSION_MAJOR >= 55
710 	av_frame_make_writable(encoder->audioFrame);
711 #endif
712 	if (swr_get_out_samples(encoder->resampleContext, 1) < encoder->audioFrame->nb_samples) {
713 		swr_convert(encoder->resampleContext, NULL, 0, (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
714 		return;
715 	}
716 	int samples = swr_convert(encoder->resampleContext, encoder->audioFrame->data, encoder->postaudioBufferSize / channelSize,
717 	                          (const uint8_t**) &encoder->audioBuffer, encoder->audioBufferSize / 4);
718 #endif
719 
720 	encoder->audioFrame->pts = encoder->currentAudioFrame;
721 	encoder->currentAudioFrame += samples;
722 
723 	_ffmpegWriteAudioFrame(encoder, encoder->audioFrame);
724 }
725 
_ffmpegWriteAudioFrame(struct FFmpegEncoder * encoder,struct AVFrame * audioFrame)726 bool _ffmpegWriteAudioFrame(struct FFmpegEncoder* encoder, struct AVFrame* audioFrame) {
727 	AVPacket packet;
728 	av_init_packet(&packet);
729 	packet.data = 0;
730 	packet.size = 0;
731 
732 	int gotData;
733 #ifdef FFMPEG_USE_PACKETS
734 	avcodec_send_frame(encoder->audio, audioFrame);
735 	gotData = avcodec_receive_packet(encoder->audio, &packet);
736 	gotData = (gotData == 0) && packet.size;
737 #else
738 	avcodec_encode_audio2(encoder->audio, &packet, audioFrame, &gotData);
739 #endif
740 	packet.pts = av_rescale_q(packet.pts, encoder->audio->time_base, encoder->audioStream->time_base);
741 	packet.dts = packet.pts;
742 
743 	if (gotData) {
744 		if (encoder->absf) {
745 			AVPacket tempPacket;
746 
747 #ifdef FFMPEG_USE_NEW_BSF
748 			int success = av_bsf_send_packet(encoder->absf, &packet);
749 			if (success >= 0) {
750 				success = av_bsf_receive_packet(encoder->absf, &tempPacket);
751 			}
752 #else
753 			int success = av_bitstream_filter_filter(encoder->absf, encoder->audio, 0,
754 			    &tempPacket.data, &tempPacket.size,
755 			    packet.data, packet.size, 0);
756 #endif
757 
758 			if (success >= 0) {
759 #if LIBAVUTIL_VERSION_MAJOR >= 53
760 				tempPacket.buf = av_buffer_create(tempPacket.data, tempPacket.size, av_buffer_default_free, 0, 0);
761 #endif
762 
763 #ifdef FFMPEG_USE_PACKET_UNREF
764 				av_packet_move_ref(&packet, &tempPacket);
765 #else
766 				av_free_packet(&packet);
767 				packet = tempPacket;
768 #endif
769 
770 				packet.stream_index = encoder->audioStream->index;
771 				av_interleaved_write_frame(encoder->context, &packet);
772 			}
773 		} else {
774 			packet.stream_index = encoder->audioStream->index;
775 			av_interleaved_write_frame(encoder->context, &packet);
776 		}
777 	}
778 #ifdef FFMPEG_USE_PACKET_UNREF
779 	av_packet_unref(&packet);
780 #else
781 	av_free_packet(&packet);
782 #endif
783 	return gotData;
784 }
785 
_ffmpegPostVideoFrame(struct mAVStream * stream,const color_t * pixels,size_t stride)786 void _ffmpegPostVideoFrame(struct mAVStream* stream, const color_t* pixels, size_t stride) {
787 	struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
788 	if (!encoder->context || !encoder->videoCodec) {
789 		return;
790 	}
791 	encoder->skipResidue = (encoder->skipResidue + 1) % encoder->frameskip;
792 	if (encoder->skipResidue) {
793 		return;
794 	}
795 	stride *= BYTES_PER_PIXEL;
796 
797 #if LIBAVCODEC_VERSION_MAJOR >= 55
798 	av_frame_make_writable(encoder->videoFrame);
799 #endif
800 	if (encoder->video->codec->id == AV_CODEC_ID_WEBP) {
801 		// TODO: Figure out why WebP is rescaling internally (should video frames not be rescaled externally?)
802 		encoder->videoFrame->pts = encoder->currentVideoFrame;
803 	} else {
804 		encoder->videoFrame->pts = av_rescale_q(encoder->currentVideoFrame, encoder->video->time_base, encoder->videoStream->time_base);
805 	}
806 	++encoder->currentVideoFrame;
807 
808 	sws_scale(encoder->scaleContext, (const uint8_t* const*) &pixels, (const int*) &stride, 0, encoder->iheight, encoder->videoFrame->data, encoder->videoFrame->linesize);
809 
810 	if (encoder->graph) {
811 		if (av_buffersrc_add_frame(encoder->source, encoder->videoFrame) < 0) {
812 			return;
813 		}
814 		while (true) {
815 			int res = av_buffersink_get_frame(encoder->sink, encoder->sinkFrame);
816 			if (res < 0) {
817 				break;
818 			}
819 			_ffmpegWriteVideoFrame(encoder, encoder->sinkFrame);
820 			av_frame_unref(encoder->sinkFrame);
821 		}
822 	} else {
823 		_ffmpegWriteVideoFrame(encoder, encoder->videoFrame);
824 	}
825 }
826 
_ffmpegWriteVideoFrame(struct FFmpegEncoder * encoder,struct AVFrame * videoFrame)827 bool _ffmpegWriteVideoFrame(struct FFmpegEncoder* encoder, struct AVFrame* videoFrame) {
828 	AVPacket packet;
829 
830 	av_init_packet(&packet);
831 	packet.data = 0;
832 	packet.size = 0;
833 
834 	int gotData;
835 #ifdef FFMPEG_USE_PACKETS
836 	avcodec_send_frame(encoder->video, videoFrame);
837 	gotData = avcodec_receive_packet(encoder->video, &packet) == 0;
838 #else
839 	avcodec_encode_video2(encoder->video, &packet, videoFrame, &gotData);
840 #endif
841 	if (gotData) {
842 #ifndef FFMPEG_USE_PACKET_UNREF
843 		if (encoder->video->coded_frame->key_frame) {
844 			packet.flags |= AV_PKT_FLAG_KEY;
845 		}
846 #endif
847 		packet.stream_index = encoder->videoStream->index;
848 		av_interleaved_write_frame(encoder->context, &packet);
849 	}
850 #ifdef FFMPEG_USE_PACKET_UNREF
851 	av_packet_unref(&packet);
852 #else
853 	av_free_packet(&packet);
854 #endif
855 
856 	return gotData;
857 }
858 
_ffmpegSetVideoDimensions(struct mAVStream * stream,unsigned width,unsigned height)859 static void _ffmpegSetVideoDimensions(struct mAVStream* stream, unsigned width, unsigned height) {
860 	struct FFmpegEncoder* encoder = (struct FFmpegEncoder*) stream;
861 	if (!encoder->context || !encoder->videoCodec) {
862 		return;
863 	}
864 	encoder->iwidth = width;
865 	encoder->iheight = height;
866 	if (encoder->scaleContext) {
867 		sws_freeContext(encoder->scaleContext);
868 	}
869 	encoder->scaleContext = sws_getContext(encoder->iwidth, encoder->iheight, encoder->ipixFormat,
870 	    encoder->videoFrame->width, encoder->videoFrame->height, encoder->videoFrame->format,
871 	    SWS_POINT, 0, 0, 0);
872 }
873 
FFmpegEncoderSetInputFrameRate(struct FFmpegEncoder * encoder,int numerator,int denominator)874 void FFmpegEncoderSetInputFrameRate(struct FFmpegEncoder* encoder, int numerator, int denominator) {
875 	reduceFraction(&numerator, &denominator);
876 	encoder->frameCycles = numerator;
877 	encoder->cycles = denominator;
878 	if (encoder->video) {
879 		encoder->video->framerate = (AVRational) { denominator, numerator * encoder->frameskip };
880 	}
881 }
882