1 /* GStreamer AAC encoder plugin
2  * Copyright (C) 2011 Kan Hu <kan.hu@linaro.org>
3  *
4  * This library is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Library General Public
6  * License as published by the Free Software Foundation; either
7  * version 2 of the License, or (at your option) any later version.
8  *
9  * This library is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12  * Library General Public License for more details.
13  *
14  * You should have received a copy of the GNU Library General Public
15  * License along with this library; if not, write to the
16  * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
17  * Boston, MA 02110-1301, USA.
18  */
19 
20 /**
21  * SECTION:element-voaacenc
22  * @title: voaacenc
23  *
24  * AAC audio encoder based on vo-aacenc library
25  * <ulink url="http://sourceforge.net/projects/opencore-amr/files/vo-aacenc/">vo-aacenc library source file</ulink>.
26  *
27  * ## Example launch line
28  * |[
29  * gst-launch-1.0 filesrc location=abc.wav ! wavparse ! audioresample ! audioconvert ! voaacenc ! filesink location=abc.aac
30  * ]|
31  *
32  */
33 
34 #ifdef HAVE_CONFIG_H
35 #include "config.h"
36 #endif
37 
38 #include <string.h>
39 
40 #include <gst/pbutils/codec-utils.h>
41 
42 #include "gstvoaacenc.h"
43 
/* Default value of the "bitrate" property, in bits per second */
#define VOAAC_ENC_DEFAULT_BITRATE       (128000)
/* Output format used until negotiation decides: 0 is RAW, non-zero is ADTS */
#define VOAAC_ENC_DEFAULT_OUTPUTFORMAT  (0)
/* Value of the "mpegversion" field placed on the source caps */
#define VOAAC_ENC_MPEGVERSION           (4)
/* Size in bytes of the codec_data blob attached to raw output caps */
#define VOAAC_ENC_CODECDATA_LEN         (2)
/* Width of one input sample in bits (the sink pad only accepts S16) */
#define VOAAC_ENC_BITS_PER_SAMPLE       (16)
49 
/* GObject property ids; PROP_0 is a placeholder that is never installed */
enum
{
  PROP_0 = 0,
  PROP_BITRATE = 1
};
55 
/* Comma separated list of sample rates, spliced into both pad template
 * caps strings below. */
#define SAMPLE_RATES \
    " 8000, " "11025, " "12000, " "16000, " \
    "22050, " "24000, " "32000, " "44100, " \
    "48000, " "64000, " "88200, " "96000"
68 
69 /* voaacenc only supports 1 or 2 channels */
70 static GstStaticPadTemplate sink_template = GST_STATIC_PAD_TEMPLATE ("sink",
71     GST_PAD_SINK,
72     GST_PAD_ALWAYS,
73     GST_STATIC_CAPS ("audio/x-raw, "
74         "format = (string) " GST_AUDIO_NE (S16) ", "
75         "layout = (string) interleaved, "
76         "rate = (int) { " SAMPLE_RATES " }, " "channels = (int) 1;"
77         "audio/x-raw, "
78         "format = (string) " GST_AUDIO_NE (S16) ", "
79         "layout = (string) interleaved, "
80         "rate = (int) { " SAMPLE_RATES " }, " "channels = (int) 2, "
81         "channel-mask=(bitmask)0x3")
82     );
83 
84 static GstStaticPadTemplate src_template = GST_STATIC_PAD_TEMPLATE ("src",
85     GST_PAD_SRC,
86     GST_PAD_ALWAYS,
87     GST_STATIC_CAPS ("audio/mpeg, "
88         "mpegversion = (int) 4, "
89         "rate = (int) { " SAMPLE_RATES " }, "
90         "channels = (int) [1, 2], "
91         "stream-format = (string) { adts, raw }, " "base-profile = (string) lc")
92     );
93 
94 GST_DEBUG_CATEGORY_STATIC (gst_voaacenc_debug);
95 #define GST_CAT_DEFAULT gst_voaacenc_debug
96 
97 static gboolean voaacenc_core_init (GstVoAacEnc * voaacenc);
98 static gboolean voaacenc_core_set_parameter (GstVoAacEnc * voaacenc);
99 static void voaacenc_core_uninit (GstVoAacEnc * voaacenc);
100 
101 static gboolean gst_voaacenc_start (GstAudioEncoder * enc);
102 static gboolean gst_voaacenc_stop (GstAudioEncoder * enc);
103 static gboolean gst_voaacenc_set_format (GstAudioEncoder * enc,
104     GstAudioInfo * info);
105 static GstFlowReturn gst_voaacenc_handle_frame (GstAudioEncoder * enc,
106     GstBuffer * in_buf);
107 
108 G_DEFINE_TYPE (GstVoAacEnc, gst_voaacenc, GST_TYPE_AUDIO_ENCODER);
109 
110 static void
gst_voaacenc_set_property(GObject * object,guint prop_id,const GValue * value,GParamSpec * pspec)111 gst_voaacenc_set_property (GObject * object, guint prop_id,
112     const GValue * value, GParamSpec * pspec)
113 {
114   GstVoAacEnc *self = GST_VOAACENC (object);
115 
116   switch (prop_id) {
117     case PROP_BITRATE:
118       self->bitrate = g_value_get_int (value);
119       break;
120     default:
121       G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
122       break;
123   }
124   return;
125 }
126 
127 static void
gst_voaacenc_get_property(GObject * object,guint prop_id,GValue * value,GParamSpec * pspec)128 gst_voaacenc_get_property (GObject * object, guint prop_id,
129     GValue * value, GParamSpec * pspec)
130 {
131   GstVoAacEnc *self = GST_VOAACENC (object);
132 
133   switch (prop_id) {
134     case PROP_BITRATE:
135       g_value_set_int (value, self->bitrate);
136       break;
137     default:
138       G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
139       break;
140   }
141   return;
142 }
143 
144 static void
gst_voaacenc_class_init(GstVoAacEncClass * klass)145 gst_voaacenc_class_init (GstVoAacEncClass * klass)
146 {
147   GObjectClass *object_class = G_OBJECT_CLASS (klass);
148   GstElementClass *element_class = GST_ELEMENT_CLASS (klass);
149   GstAudioEncoderClass *base_class = GST_AUDIO_ENCODER_CLASS (klass);
150 
151   object_class->set_property = GST_DEBUG_FUNCPTR (gst_voaacenc_set_property);
152   object_class->get_property = GST_DEBUG_FUNCPTR (gst_voaacenc_get_property);
153 
154   base_class->start = GST_DEBUG_FUNCPTR (gst_voaacenc_start);
155   base_class->stop = GST_DEBUG_FUNCPTR (gst_voaacenc_stop);
156   base_class->set_format = GST_DEBUG_FUNCPTR (gst_voaacenc_set_format);
157   base_class->handle_frame = GST_DEBUG_FUNCPTR (gst_voaacenc_handle_frame);
158 
159   g_object_class_install_property (object_class, PROP_BITRATE,
160       g_param_spec_int ("bitrate",
161           "Bitrate",
162           "Target Audio Bitrate (bits per second)",
163           0, 320000, VOAAC_ENC_DEFAULT_BITRATE,
164           G_PARAM_READWRITE | G_PARAM_STATIC_STRINGS));
165 
166   gst_element_class_add_static_pad_template (element_class, &sink_template);
167   gst_element_class_add_static_pad_template (element_class, &src_template);
168 
169   gst_element_class_set_static_metadata (element_class, "AAC audio encoder",
170       "Codec/Encoder/Audio", "AAC audio encoder", "Kan Hu <kan.hu@linaro.org>");
171 
172   GST_DEBUG_CATEGORY_INIT (gst_voaacenc_debug, "voaacenc", 0, "voaac encoder");
173 }
174 
175 static void
gst_voaacenc_init(GstVoAacEnc * voaacenc)176 gst_voaacenc_init (GstVoAacEnc * voaacenc)
177 {
178   GST_PAD_SET_ACCEPT_TEMPLATE (GST_AUDIO_ENCODER_SINK_PAD (voaacenc));
179   voaacenc->bitrate = VOAAC_ENC_DEFAULT_BITRATE;
180   voaacenc->output_format = VOAAC_ENC_DEFAULT_OUTPUTFORMAT;
181 
182   /* init rest */
183   voaacenc->handle = NULL;
184 }
185 
186 static gboolean
gst_voaacenc_start(GstAudioEncoder * enc)187 gst_voaacenc_start (GstAudioEncoder * enc)
188 {
189   GstVoAacEnc *voaacenc = GST_VOAACENC (enc);
190 
191   GST_DEBUG_OBJECT (enc, "start");
192 
193   if (voaacenc_core_init (voaacenc) == FALSE)
194     return FALSE;
195 
196   voaacenc->rate = 0;
197   voaacenc->channels = 0;
198 
199   return TRUE;
200 }
201 
202 static gboolean
gst_voaacenc_stop(GstAudioEncoder * enc)203 gst_voaacenc_stop (GstAudioEncoder * enc)
204 {
205   GstVoAacEnc *voaacenc = GST_VOAACENC (enc);
206 
207   GST_DEBUG_OBJECT (enc, "stop");
208   voaacenc_core_uninit (voaacenc);
209 
210   return TRUE;
211 }
212 
213 #define VOAAC_ENC_MAX_CHANNELS 6
214 /* describe the channels position */
215 static const GstAudioChannelPosition
216     aac_channel_positions[][VOAAC_ENC_MAX_CHANNELS] = {
217   {                             /* 1 ch: Mono */
218       GST_AUDIO_CHANNEL_POSITION_MONO},
219   {                             /* 2 ch: front left + front right (front stereo) */
220         GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
221       GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT},
222   {                             /* 3 ch: front center + front stereo */
223         GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
224         GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
225       GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT},
226   {                             /* 4 ch: front center + front stereo + back center */
227         GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
228         GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
229         GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
230       GST_AUDIO_CHANNEL_POSITION_REAR_CENTER},
231   {                             /* 5 ch: front center + front stereo + back stereo */
232         GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
233         GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
234         GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
235         GST_AUDIO_CHANNEL_POSITION_REAR_LEFT,
236       GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT},
237   {                             /* 6ch: front center + front stereo + back stereo + LFE */
238         GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER,
239         GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT,
240         GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT,
241         GST_AUDIO_CHANNEL_POSITION_REAR_LEFT,
242         GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT,
243       GST_AUDIO_CHANNEL_POSITION_LFE1}
244 };
245 
246 /* check downstream caps to configure format */
247 static void
gst_voaacenc_negotiate(GstVoAacEnc * voaacenc)248 gst_voaacenc_negotiate (GstVoAacEnc * voaacenc)
249 {
250   GstCaps *caps;
251 
252   caps = gst_pad_get_allowed_caps (GST_AUDIO_ENCODER_SRC_PAD (voaacenc));
253 
254   GST_DEBUG_OBJECT (voaacenc, "allowed caps: %" GST_PTR_FORMAT, caps);
255 
256   if (caps && gst_caps_get_size (caps) > 0) {
257     GstStructure *s = gst_caps_get_structure (caps, 0);
258     const gchar *str = NULL;
259 
260     if ((str = gst_structure_get_string (s, "stream-format"))) {
261       if (strcmp (str, "adts") == 0) {
262         GST_DEBUG_OBJECT (voaacenc, "use ADTS format for output");
263         voaacenc->output_format = 1;
264       } else if (strcmp (str, "raw") == 0) {
265         GST_DEBUG_OBJECT (voaacenc, "use RAW format for output");
266         voaacenc->output_format = 0;
267       } else {
268         GST_DEBUG_OBJECT (voaacenc, "unknown stream-format: %s", str);
269         voaacenc->output_format = VOAAC_ENC_DEFAULT_OUTPUTFORMAT;
270       }
271     }
272   }
273 
274   if (caps)
275     gst_caps_unref (caps);
276 }
277 
278 static gint
gst_voaacenc_get_rate_index(gint rate)279 gst_voaacenc_get_rate_index (gint rate)
280 {
281   static const gint rate_table[] = {
282     96000, 88200, 64000, 48000, 44100, 32000,
283     24000, 22050, 16000, 12000, 11025, 8000
284   };
285   gint i;
286   for (i = 0; i < G_N_ELEMENTS (rate_table); ++i) {
287     if (rate == rate_table[i]) {
288       return i;
289     }
290   }
291   return -1;
292 }
293 
294 static GstCaps *
gst_voaacenc_create_source_pad_caps(GstVoAacEnc * voaacenc)295 gst_voaacenc_create_source_pad_caps (GstVoAacEnc * voaacenc)
296 {
297   GstCaps *caps = NULL;
298   gint index;
299   GstBuffer *codec_data;
300   GstMapInfo map;
301 
302   if ((index = gst_voaacenc_get_rate_index (voaacenc->rate)) >= 0) {
303     codec_data = gst_buffer_new_and_alloc (VOAAC_ENC_CODECDATA_LEN);
304     gst_buffer_map (codec_data, &map, GST_MAP_WRITE);
305     /* LC profile only */
306     map.data[0] = ((0x02 << 3) | (index >> 1));
307     map.data[1] = ((index & 0x01) << 7) | (voaacenc->channels << 3);
308 
309     caps = gst_caps_new_simple ("audio/mpeg",
310         "mpegversion", G_TYPE_INT, VOAAC_ENC_MPEGVERSION,
311         "channels", G_TYPE_INT, voaacenc->channels,
312         "rate", G_TYPE_INT, voaacenc->rate, NULL);
313 
314     gst_codec_utils_aac_caps_set_level_and_profile (caps, map.data,
315         VOAAC_ENC_CODECDATA_LEN);
316     gst_buffer_unmap (codec_data, &map);
317 
318     if (!voaacenc->output_format) {
319       gst_caps_set_simple (caps,
320           "stream-format", G_TYPE_STRING, "raw",
321           "codec_data", GST_TYPE_BUFFER, codec_data, NULL);
322     } else {
323       gst_caps_set_simple (caps,
324           "stream-format", G_TYPE_STRING, "adts",
325           "framed", G_TYPE_BOOLEAN, TRUE, NULL);
326     }
327     gst_buffer_unref (codec_data);
328   }
329 
330   return caps;
331 }
332 
333 static gboolean
gst_voaacenc_set_format(GstAudioEncoder * benc,GstAudioInfo * info)334 gst_voaacenc_set_format (GstAudioEncoder * benc, GstAudioInfo * info)
335 {
336   gboolean ret = FALSE;
337   GstVoAacEnc *voaacenc;
338   GstCaps *src_caps;
339 
340   voaacenc = GST_VOAACENC (benc);
341 
342   /* get channel count */
343   voaacenc->channels = GST_AUDIO_INFO_CHANNELS (info);
344   voaacenc->rate = GST_AUDIO_INFO_RATE (info);
345 
346   /* precalc buffer size as it's constant now */
347   voaacenc->inbuf_size = voaacenc->channels * 2 * 1024;
348 
349   gst_voaacenc_negotiate (voaacenc);
350 
351   /* create reverse caps */
352   src_caps = gst_voaacenc_create_source_pad_caps (voaacenc);
353 
354   if (src_caps) {
355     gst_audio_encoder_set_output_format (GST_AUDIO_ENCODER (voaacenc),
356         src_caps);
357     gst_caps_unref (src_caps);
358     ret = voaacenc_core_set_parameter (voaacenc);
359   }
360 
361   /* report needs to base class */
362   gst_audio_encoder_set_frame_samples_min (benc, 1024);
363   gst_audio_encoder_set_frame_samples_max (benc, 1024);
364   gst_audio_encoder_set_frame_max (benc, 1);
365 
366   return ret;
367 }
368 
369 static GstFlowReturn
gst_voaacenc_handle_frame(GstAudioEncoder * benc,GstBuffer * buf)370 gst_voaacenc_handle_frame (GstAudioEncoder * benc, GstBuffer * buf)
371 {
372   GstVoAacEnc *voaacenc;
373   GstFlowReturn ret = GST_FLOW_OK;
374   GstBuffer *out;
375   VO_AUDIO_OUTPUTINFO output_info = { {0} };
376   VO_CODECBUFFER input = { 0 };
377   VO_CODECBUFFER output = { 0 };
378   GstMapInfo map, omap;
379   GstAudioInfo *info = gst_audio_encoder_get_audio_info (benc);
380 
381   voaacenc = GST_VOAACENC (benc);
382 
383   g_return_val_if_fail (voaacenc->handle, GST_FLOW_NOT_NEGOTIATED);
384 
385   /* we don't deal with squeezing remnants, so simply discard those */
386   if (G_UNLIKELY (buf == NULL)) {
387     GST_DEBUG_OBJECT (benc, "no data");
388     goto exit;
389   }
390 
391   if (memcmp (info->position, aac_channel_positions[info->channels - 1],
392           sizeof (GstAudioChannelPosition) * info->channels) != 0) {
393     buf = gst_buffer_make_writable (buf);
394     gst_audio_buffer_reorder_channels (buf, info->finfo->format,
395         info->channels, info->position,
396         aac_channel_positions[info->channels - 1]);
397   }
398 
399   gst_buffer_map (buf, &map, GST_MAP_READ);
400 
401   if (G_UNLIKELY (map.size < voaacenc->inbuf_size)) {
402     gst_buffer_unmap (buf, &map);
403     GST_DEBUG_OBJECT (voaacenc, "discarding trailing data %d", (gint) map.size);
404     ret = gst_audio_encoder_finish_frame (benc, NULL, -1);
405     goto exit;
406   }
407 
408   /* max size */
409   out = gst_buffer_new_and_alloc (voaacenc->inbuf_size);
410   gst_buffer_map (out, &omap, GST_MAP_WRITE);
411 
412   output.Buffer = omap.data;
413   output.Length = voaacenc->inbuf_size;
414 
415   g_assert (map.size == voaacenc->inbuf_size);
416   input.Buffer = map.data;
417   input.Length = voaacenc->inbuf_size;
418   voaacenc->codec_api.SetInputData (voaacenc->handle, &input);
419 
420   /* encode */
421   if (voaacenc->codec_api.GetOutputData (voaacenc->handle, &output,
422           &output_info) != VO_ERR_NONE) {
423     gst_buffer_unmap (buf, &map);
424     gst_buffer_unmap (out, &omap);
425     gst_buffer_unref (out);
426     goto encode_failed;
427   }
428 
429   GST_LOG_OBJECT (voaacenc, "encoded to %lu bytes", output.Length);
430   gst_buffer_unmap (buf, &map);
431   gst_buffer_unmap (out, &omap);
432   gst_buffer_resize (out, 0, output.Length);
433 
434   ret = gst_audio_encoder_finish_frame (benc, out, 1024);
435 
436 exit:
437   return ret;
438 
439   /* ERRORS */
440 encode_failed:
441   {
442     GST_ELEMENT_ERROR (voaacenc, STREAM, ENCODE, (NULL), ("encode failed"));
443     ret = GST_FLOW_ERROR;
444     goto exit;
445   }
446 }
447 
448 static VO_U32
voaacenc_core_mem_alloc(VO_S32 uID,VO_MEM_INFO * pMemInfo)449 voaacenc_core_mem_alloc (VO_S32 uID, VO_MEM_INFO * pMemInfo)
450 {
451   if (!pMemInfo)
452     return VO_ERR_INVALID_ARG;
453 
454   pMemInfo->VBuffer = g_malloc (pMemInfo->Size);
455   return 0;
456 }
457 
458 static VO_U32
voaacenc_core_mem_free(VO_S32 uID,VO_PTR pMem)459 voaacenc_core_mem_free (VO_S32 uID, VO_PTR pMem)
460 {
461   g_free (pMem);
462   return 0;
463 }
464 
465 static VO_U32
voaacenc_core_mem_set(VO_S32 uID,VO_PTR pBuff,VO_U8 uValue,VO_U32 uSize)466 voaacenc_core_mem_set (VO_S32 uID, VO_PTR pBuff, VO_U8 uValue, VO_U32 uSize)
467 {
468   memset (pBuff, uValue, uSize);
469   return 0;
470 }
471 
472 static VO_U32
voaacenc_core_mem_copy(VO_S32 uID,VO_PTR pDest,VO_PTR pSource,VO_U32 uSize)473 voaacenc_core_mem_copy (VO_S32 uID, VO_PTR pDest, VO_PTR pSource, VO_U32 uSize)
474 {
475   memcpy (pDest, pSource, uSize);
476   return 0;
477 }
478 
479 static VO_U32
voaacenc_core_mem_check(VO_S32 uID,VO_PTR pBuffer,VO_U32 uSize)480 voaacenc_core_mem_check (VO_S32 uID, VO_PTR pBuffer, VO_U32 uSize)
481 {
482   return 0;
483 }
484 
485 static gboolean
voaacenc_core_init(GstVoAacEnc * voaacenc)486 voaacenc_core_init (GstVoAacEnc * voaacenc)
487 {
488   VO_CODEC_INIT_USERDATA user_data = { 0 };
489   voGetAACEncAPI (&voaacenc->codec_api);
490 
491   voaacenc->mem_operator.Alloc = voaacenc_core_mem_alloc;
492   voaacenc->mem_operator.Copy = voaacenc_core_mem_copy;
493   voaacenc->mem_operator.Free = voaacenc_core_mem_free;
494   voaacenc->mem_operator.Set = voaacenc_core_mem_set;
495   voaacenc->mem_operator.Check = voaacenc_core_mem_check;
496   user_data.memflag = VO_IMF_USERMEMOPERATOR;
497   user_data.memData = &voaacenc->mem_operator;
498   voaacenc->codec_api.Init (&voaacenc->handle, VO_AUDIO_CodingAAC, &user_data);
499 
500   if (voaacenc->handle == NULL) {
501     return FALSE;
502   }
503   return TRUE;
504 
505 }
506 
507 static gboolean
voaacenc_core_set_parameter(GstVoAacEnc * voaacenc)508 voaacenc_core_set_parameter (GstVoAacEnc * voaacenc)
509 {
510   AACENC_PARAM params = { 0 };
511   guint32 ret;
512 
513   params.sampleRate = voaacenc->rate;
514   params.bitRate = voaacenc->bitrate;
515   params.nChannels = voaacenc->channels;
516   if (voaacenc->output_format) {
517     params.adtsUsed = 1;
518   } else {
519     params.adtsUsed = 0;
520   }
521 
522   ret =
523       voaacenc->codec_api.SetParam (voaacenc->handle, VO_PID_AAC_ENCPARAM,
524       &params);
525   if (ret != VO_ERR_NONE) {
526     GST_ERROR_OBJECT (voaacenc, "Failed to set encoder parameters");
527     return FALSE;
528   }
529   return TRUE;
530 }
531 
532 static void
voaacenc_core_uninit(GstVoAacEnc * voaacenc)533 voaacenc_core_uninit (GstVoAacEnc * voaacenc)
534 {
535   if (voaacenc->handle) {
536     voaacenc->codec_api.Uninit (voaacenc->handle);
537     voaacenc->handle = NULL;
538   }
539 }
540