1 /* Quicktime muxer plugin for GStreamer
2  * Copyright (C) 2008 Thiago Sousa Santos <thiagoss@embedded.ufcg.edu.br>
3  * Copyright (C) 2008 Mark Nauwelaerts <mnauw@users.sf.net>
4  *
5  * This library is free software; you can redistribute it and/or
6  * modify it under the terms of the GNU Library General Public
7  * License as published by the Free Software Foundation; either
8  * version 2 of the License, or (at your option) any later version.
9  *
10  * This library is distributed in the hope that it will be useful,
11  * but WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13  * Library General Public License for more details.
14  *
15  * You should have received a copy of the GNU Library General Public
16  * License along with this library; if not, write to the
17  * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
18  * Boston, MA 02110-1301, USA.
19  */
20 /*
21  * Unless otherwise indicated, Source Code is licensed under MIT license.
22  * See further explanation attached in License Statement (distributed in the file
23  * LICENSE).
24  *
25  * Permission is hereby granted, free of charge, to any person obtaining a copy of
26  * this software and associated documentation files (the "Software"), to deal in
27  * the Software without restriction, including without limitation the rights to
28  * use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
29  * of the Software, and to permit persons to whom the Software is furnished to do
30  * so, subject to the following conditions:
31  *
32  * The above copyright notice and this permission notice shall be included in all
33  * copies or substantial portions of the Software.
34  *
35  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
36  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
37  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
38  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
39  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
40  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
41  * SOFTWARE.
42  */
43 
44 #include "gstqtmuxmap.h"
45 #include "fourcc.h"
46 
47 /* static info related to various format */
48 
49 #define COMMON_VIDEO_CAPS \
50   "width = (int) [ 16, MAX ], " \
51   "height = (int) [ 16, MAX ]"
52 
53 #define COMMON_VIDEO_CAPS_NO_FRAMERATE \
54   "width = (int) [ 16, MAX ], " \
55   "height = (int) [ 16, MAX ] "
56 
57 #define H263_CAPS \
58   "video/x-h263, " \
59   COMMON_VIDEO_CAPS
60 
61 #define H264_CAPS \
62   "video/x-h264, " \
63   "stream-format = (string) avc, " \
64   "alignment = (string) au, " \
65   COMMON_VIDEO_CAPS
66 
67 #define H265_CAPS \
68   "video/x-h265, " \
69   "stream-format = (string) { hvc1, hev1 }, " \
70   "alignment = (string) au, " \
71   COMMON_VIDEO_CAPS
72 
73 #define MPEG4V_CAPS \
74   "video/mpeg, " \
75   "mpegversion = (int) 4, "\
76   "systemstream = (boolean) false, " \
77   COMMON_VIDEO_CAPS "; " \
78   "video/x-divx, " \
79   "divxversion = (int) 5, "\
80   COMMON_VIDEO_CAPS
81 
82 #define PRORES_CAPS \
83   "video/x-prores, " \
84   "variant = (string) {standard, lt, hq, proxy, 4444, 4444xq}, " \
85   COMMON_VIDEO_CAPS
86 
87 #define CINEFORM_CAPS \
88   "video/x-cineform, " \
89   COMMON_VIDEO_CAPS
90 
91 #define SVQ_CAPS \
92   "video/x-svq, " \
93   "svqversion = (int) 3, " \
94   COMMON_VIDEO_CAPS
95 
96 #define COMMON_AUDIO_CAPS(c, r) \
97   "channels = (int) [ 1, " G_STRINGIFY (c) " ], " \
98   "rate = (int) [ 1, " G_STRINGIFY (r) " ]"
99 
100 #define PCM_CAPS \
101   "audio/x-raw, " \
102   "format = (string) { S16LE, S16BE, S8, U8 }, " \
103   "layout = (string) interleaved, " \
104   COMMON_AUDIO_CAPS (2, MAX)
105 
106 #define PCM_CAPS_FULL \
107   "audio/x-raw, " \
108   "format = (string) { S32LE, S32BE, S24LE, S24BE, S16LE, S16BE, S8, U8 }, " \
109   "layout = (string) interleaved, " \
110   COMMON_AUDIO_CAPS (2, MAX)
111 
112 #define PCM_CAPS_UNPOSITIONED \
113   "audio/x-raw, " \
114   "format = (string) { S32LE, S32BE, S24LE, S24BE, S16LE, S16BE, S8, U8 }, " \
115   "layout = (string) interleaved, " \
116   "channel-mask = (bitmask) 0, " \
117   COMMON_AUDIO_CAPS (16, MAX)
118 
119 #define MP3_CAPS \
120   "audio/mpeg, " \
121   "mpegversion = (int) 1, " \
122   "layer = (int) 3, " \
123   COMMON_AUDIO_CAPS (2, MAX)
124 
125 #define MP123_CAPS \
126   "audio/mpeg, " \
127   "mpegversion = (int) 1, " \
128   "layer = (int) [1, 3], " \
129   COMMON_AUDIO_CAPS (2, MAX)
130 
131 #define AAC_CAPS \
132   "audio/mpeg, " \
133   "mpegversion = (int) 4, " \
134   "stream-format = (string) raw, " \
135   COMMON_AUDIO_CAPS (8, MAX)
136 
137 #define AC3_CAPS \
138   "audio/x-ac3, " \
139   COMMON_AUDIO_CAPS (6, MAX)
140 
141 #define AMR_CAPS \
142   "audio/AMR, " \
143   "rate = (int) 8000, " \
144   "channels = [ 1, 2 ]; " \
145   "audio/AMR-WB, " \
146   "rate = (int) 16000, " \
147   "channels = [ 1, 2 ] "
148 
149 #define ADPCM_CAPS  \
150   "audio/x-adpcm, " \
151   "layout = (string)dvi, " \
152   "block_align = (int)[64, 8096], " \
153   COMMON_AUDIO_CAPS(2, MAX)
154 
155 #define ALAC_CAPS \
156   "audio/x-alac, " \
157   COMMON_AUDIO_CAPS(2, MAX)
158 
159 #define OPUS_CAPS \
160   "audio/x-opus, " \
161   "channel-mapping-family = (int) [0, 255], " \
162   COMMON_AUDIO_CAPS(8, MAX)
163 
164 
165 #define TEXT_UTF8 \
166   "text/x-raw, " \
167   "format=(string)utf8"
168 
169 #define CEA608_CAPS \
170   "closedcaption/x-cea-608, format=(string)s334-1a"
171 #define CEA708_CAPS \
172   "closedcaption/x-cea-708, format=(string)cdp"
173 
174 /* FIXME 0.11 - take a look at bugs #580005 and #340375 */
175 GstQTMuxFormatProp gst_qt_mux_format_list[] = {
176   /* original QuickTime format; see Apple site (e.g. qtff.pdf) */
177   {
178         GST_QT_MUX_FORMAT_QT,
179         GST_RANK_PRIMARY,
180         "qtmux",
181         "QuickTime",
182         "GstQTMux",
183         GST_STATIC_CAPS ("video/quicktime, variant = (string) apple; "
184             "video/quicktime"),
185         GST_STATIC_CAPS ("video/x-raw, "
186             "format = (string) { RGB, UYVY, v210 }, "
187             COMMON_VIDEO_CAPS "; "
188             MPEG4V_CAPS "; "
189             PRORES_CAPS "; "
190             CINEFORM_CAPS "; "
191             H263_CAPS "; "
192             H264_CAPS "; "
193             H265_CAPS "; "
194             SVQ_CAPS "; "
195             "video/x-dv, "
196             "systemstream = (boolean) false, "
197             COMMON_VIDEO_CAPS "; "
198             "image/jpeg, "
199             COMMON_VIDEO_CAPS_NO_FRAMERATE "; "
200             "image/png, "
201             COMMON_VIDEO_CAPS_NO_FRAMERATE "; "
202             "video/x-vp8, "
203             COMMON_VIDEO_CAPS "; "
204             "video/x-vp9, "
205             COMMON_VIDEO_CAPS "; "
206             "video/x-dirac, "
207             COMMON_VIDEO_CAPS "; " "video/x-qt-part, " COMMON_VIDEO_CAPS "; "
208             "video/x-av1, " COMMON_VIDEO_CAPS),
209         GST_STATIC_CAPS (PCM_CAPS_FULL "; "
210             PCM_CAPS_UNPOSITIONED " ; "
211             MP123_CAPS " ; "
212             AAC_CAPS " ; "
213             AC3_CAPS " ; "
214             ADPCM_CAPS " ; "
215             "audio/x-alaw, " COMMON_AUDIO_CAPS (2, MAX) "; "
216             "audio/x-mulaw, " COMMON_AUDIO_CAPS (2, MAX) "; "
217             AMR_CAPS " ; " ALAC_CAPS " ; " OPUS_CAPS),
218         GST_STATIC_CAPS (TEXT_UTF8),
219       GST_STATIC_CAPS (CEA608_CAPS "; " CEA708_CAPS)}
220   ,
221   /* ISO 14496-14: mp42 as ISO base media extension
222    * (supersedes original ISO 144996-1 mp41) */
223   {
224         GST_QT_MUX_FORMAT_MP4,
225         GST_RANK_PRIMARY,
226         "mp4mux",
227         "MP4",
228         "GstMP4Mux",
229         GST_STATIC_CAPS ("video/quicktime, variant = (string) iso"),
230         GST_STATIC_CAPS (MPEG4V_CAPS "; " H264_CAPS ";" H265_CAPS ";"
231             "video/x-mp4-part," COMMON_VIDEO_CAPS "; "
232             "video/x-av1, " COMMON_VIDEO_CAPS),
233         GST_STATIC_CAPS (MP123_CAPS "; "
234             AAC_CAPS " ; " AC3_CAPS " ; " ALAC_CAPS " ; " OPUS_CAPS),
235         GST_STATIC_CAPS (TEXT_UTF8),
236       GST_STATIC_CAPS_NONE}
237   ,
238   /* Microsoft Smooth Streaming fmp4/isml */
239   /* TODO add WMV/WMA support */
240   {
241         GST_QT_MUX_FORMAT_ISML,
242         GST_RANK_PRIMARY,
243         "ismlmux",
244         "ISML",
245         "GstISMLMux",
246         GST_STATIC_CAPS ("video/quicktime, variant = (string) iso-fragmented"),
247         GST_STATIC_CAPS (MPEG4V_CAPS "; " H264_CAPS),
248         GST_STATIC_CAPS (MP3_CAPS "; " AAC_CAPS),
249         GST_STATIC_CAPS_NONE,
250       GST_STATIC_CAPS_NONE}
251   ,
252   /* 3GPP Technical Specification 26.244 V7.3.0
253    * (extended in 3GPP2 File Formats for Multimedia Services) */
254   {
255         GST_QT_MUX_FORMAT_3GP,
256         GST_RANK_PRIMARY,
257         "3gppmux",
258         "3GPP",
259         "Gst3GPPMux",
260         GST_STATIC_CAPS ("video/quicktime, variant = (string) 3gpp"),
261         GST_STATIC_CAPS (H263_CAPS "; " MPEG4V_CAPS "; " H264_CAPS),
262         GST_STATIC_CAPS (AMR_CAPS "; " MP3_CAPS "; " AAC_CAPS "; " AC3_CAPS),
263         GST_STATIC_CAPS (TEXT_UTF8),
264       GST_STATIC_CAPS_NONE}
265   ,
266   /* ISO 15444-3: Motion-JPEG-2000 (also ISO base media extension) */
267   {
268         GST_QT_MUX_FORMAT_MJ2,
269         GST_RANK_PRIMARY,
270         "mj2mux",
271         "MJ2",
272         "GstMJ2Mux",
273         GST_STATIC_CAPS ("video/mj2"),
274         GST_STATIC_CAPS ("image/x-j2c, " COMMON_VIDEO_CAPS "; "
275             "image/x-jpc, " COMMON_VIDEO_CAPS),
276         GST_STATIC_CAPS (PCM_CAPS),
277         GST_STATIC_CAPS_NONE,
278       GST_STATIC_CAPS_NONE}
279   ,
280   {
281         GST_QT_MUX_FORMAT_NONE,
282       }
283 };
284 
285 /* pretty static, but may turn out needed a few times */
286 AtomsTreeFlavor
gst_qt_mux_map_format_to_flavor(GstQTMuxFormat format)287 gst_qt_mux_map_format_to_flavor (GstQTMuxFormat format)
288 {
289   if (format == GST_QT_MUX_FORMAT_QT)
290     return ATOMS_TREE_FLAVOR_MOV;
291   else if (format == GST_QT_MUX_FORMAT_3GP)
292     return ATOMS_TREE_FLAVOR_3GP;
293   else if (format == GST_QT_MUX_FORMAT_ISML)
294     return ATOMS_TREE_FLAVOR_ISML;
295   else
296     return ATOMS_TREE_FLAVOR_ISOM;
297 }
298 
299 static void
gst_qt_mux_map_check_tracks(AtomMOOV * moov,gint * _video,gint * _audio,gboolean * _has_h264)300 gst_qt_mux_map_check_tracks (AtomMOOV * moov, gint * _video, gint * _audio,
301     gboolean * _has_h264)
302 {
303   GList *it;
304   gint video = 0, audio = 0;
305   gboolean has_h264 = FALSE;
306 
307   for (it = moov->traks; it != NULL; it = g_list_next (it)) {
308     AtomTRAK *track = it->data;
309 
310     if (track->is_video) {
311       video++;
312       if (track->is_h264)
313         has_h264 = TRUE;
314     } else
315       audio++;
316   }
317 
318   if (_video)
319     *_video = video;
320   if (_audio)
321     *_audio = audio;
322   if (_has_h264)
323     *_has_h264 = has_h264;
324 }
325 
326 /* pretty static, but possibly dynamic format info */
327 
328 /* notes:
329  * - avc1 brand is not used, since the specific extensions indicated by it
330  *   are not used (e.g. sample groupings, etc)
331  * - TODO: maybe even more 3GPP brand fine-tuning ??
332  *   (but that might need ftyp rewriting at the end) */
333 void
gst_qt_mux_map_format_to_header(GstQTMuxFormat format,GstBuffer ** _prefix,guint32 * _major,guint32 * _version,GList ** _compatible,AtomMOOV * moov,GstClockTime longest_chunk,gboolean faststart)334 gst_qt_mux_map_format_to_header (GstQTMuxFormat format, GstBuffer ** _prefix,
335     guint32 * _major, guint32 * _version, GList ** _compatible, AtomMOOV * moov,
336     GstClockTime longest_chunk, gboolean faststart)
337 {
338   static const guint32 qt_brands[] = { 0 };
339   static const guint32 mp4_brands[] =
340       { FOURCC_mp41, FOURCC_isom, FOURCC_iso2, 0 };
341   static const guint32 isml_brands[] = { FOURCC_iso2, 0 };
342   static const guint32 gpp_brands[] = { FOURCC_isom, FOURCC_iso2, 0 };
343   static const guint32 mjp2_brands[] = { FOURCC_isom, FOURCC_iso2, 0 };
344   static const guint8 mjp2_prefix[] =
345       { 0, 0, 0, 12, 'j', 'P', ' ', ' ', 0x0D, 0x0A, 0x87, 0x0A };
346   const guint32 *comp = NULL;
347   guint32 major = 0, version = 0;
348   GstBuffer *prefix = NULL;
349   GList *result = NULL;
350 
351   g_return_if_fail (_prefix != NULL);
352   g_return_if_fail (_major != NULL);
353   g_return_if_fail (_version != NULL);
354   g_return_if_fail (_compatible != NULL);
355 
356   switch (format) {
357     case GST_QT_MUX_FORMAT_QT:
358       major = FOURCC_qt__;
359       comp = qt_brands;
360       version = 0x20050300;
361       break;
362     case GST_QT_MUX_FORMAT_MP4:
363       major = FOURCC_mp42;
364       comp = mp4_brands;
365       break;
366     case GST_QT_MUX_FORMAT_ISML:
367       major = FOURCC_isml;
368       comp = isml_brands;
369       break;
370     case GST_QT_MUX_FORMAT_3GP:
371     {
372       gint video, audio;
373       gboolean has_h264;
374 
375       gst_qt_mux_map_check_tracks (moov, &video, &audio, &has_h264);
376       /* only track restriction really matters for Basic Profile */
377       if (video <= 1 && audio <= 1) {
378         /* it seems only newer spec knows about H264 */
379         major = has_h264 ? FOURCC_3gp6 : FOURCC_3gp4;
380         version = has_h264 ? 0x100 : 0x200;
381       } else {
382         major = FOURCC_3gg6;
383         version = 0x100;
384       }
385       comp = gpp_brands;
386 
387       /*
388        * We assume that we have chunks in dts order
389        */
390       if (faststart && longest_chunk <= GST_SECOND) {
391         /* add progressive download profile */
392         result = g_list_append (result, GUINT_TO_POINTER (FOURCC_3gr6));
393       }
394       break;
395     }
396     case GST_QT_MUX_FORMAT_MJ2:
397     {
398       major = FOURCC_mjp2;
399       comp = mjp2_brands;
400       version = 0;
401       prefix = gst_buffer_new_and_alloc (sizeof (mjp2_prefix));
402       gst_buffer_fill (prefix, 0, mjp2_prefix, sizeof (mjp2_prefix));
403       break;
404     }
405     default:
406       g_assert_not_reached ();
407       break;
408   }
409 
410   /* convert list to list, hm */
411   while (comp && *comp != 0) {
412     /* order matters over efficiency */
413     result = g_list_append (result, GUINT_TO_POINTER (*comp));
414     comp++;
415   }
416 
417   *_major = major;
418   *_version = version;
419   *_prefix = prefix;
420   *_compatible = result;
421 
422   /* TODO 3GPP may include mp42 as compatible if applicable */
423   /* TODO 3GPP major brand 3gp7 if at most 1 video and audio track */
424 }
425