1 /*****************************************************************************
2 * ttml.c : TTML subtitles demux
3 *****************************************************************************
4 * Copyright (C) 2015-2017 VLC authors and VideoLAN
6 * Authors: Hugo Beauzée-Luyssen <hugo@beauzee.fr>
7 * Sushma Reddy <sushma.reddy@research.iiit.ac.in>
9 * This program is free software; you can redistribute it and/or modify it
10 * under the terms of the GNU Lesser General Public License as published by
11 * the Free Software Foundation; either version 2.1 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU Lesser General Public License for more details.
19 * You should have received a copy of the GNU Lesser General Public License
20 * along with this program; if not, write to the Free Software Foundation,
21 * Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
22 *****************************************************************************/
28 #include <vlc_common.h>
29 #include <vlc_demux.h>
31 #include <vlc_strings.h>
32 #include <vlc_memstream.h>
33 #include <vlc_es_out.h>
34 #include <vlc_charset.h> /* FromCharset */
40 #include "../codec/ttml/ttml.h"
42 //#define TTML_DEMUX_DEBUG
47 xml_reader_t
* p_reader
;
49 vlc_tick_t i_next_demux_time
;
53 tt_node_t
*p_rootnode
;
55 tt_timings_t temporal_extent
;
58 * All timings are stored unique and ordered.
59 * Since each one is the begin or end time of a sub sequence,
60 * we use them as 'points of change' for output filtering.
/*
 * tt_genTiming: renders a tt_time_t as a newly allocated clock-time string.
 *
 * h, m and s are derived from t.base, f from t.base % CLOCK_FREQ.
 * The three visible asprintf() calls produce one of these layouts:
 *   "HH:MM:SS.<fraction>"  (zero-padding string + f)
 *   "HH:MM:SS:<frames>"    (t.frames, padded to two digits)
 *   "HH:MM:SS"
 *
 * Returns the asprintf()-allocated string, or NULL when asprintf()
 * reported a failure (i_ret < 0).
 *
 * NOTE(review): this copy of the function has gaps (see the embedded
 * numbering); the conditions selecting each layout, the declarations of
 * i_ret/psz and the handling of an invalid time are not visible here.
 */
70 static char *tt_genTiming( tt_time_t t
)
72 if( !tt_time_Valid( &t
) )
/* sub-second remainder of the time base */
74 unsigned f
= t
.base
% CLOCK_FREQ
;
76 unsigned h
= t
.base
/ 3600;
77 unsigned m
= t
.base
% 3600 / 60;
78 unsigned s
= t
.base
% 60;
/* &lz[6] is the terminating NUL of "000000", i.e. an empty padding string */
84 const char *lz
= "000000";
85 const char *psz_lz
= &lz
[6];
86 /* add leading zeroes */
/* NOTE(review): the body of this loop is not visible in this copy */
87 for( unsigned i
=10*f
; i
<CLOCK_FREQ
; i
*= 10 )
89 /* strip trailing zeroes */
/* empty-bodied loop: divides f by 10 while it is non-zero and ends in 0 */
90 for( ; f
> 0 && (f
% 10) == 0; f
/= 10 );
91 i_ret
= asprintf( &psz
, "%02u:%02u:%02u.%s%u",
96 i_ret
= asprintf( &psz
, "%02u:%02u:%02u:%s%u",
97 h
, m
, s
, t
.frames
< 10 ? "0" : "", t
.frames
);
101 i_ret
= asprintf( &psz
, "%02u:%02u:%02u",
/* a negative asprintf() result is mapped to a NULL return */
105 return i_ret
< 0 ? NULL
: psz
;
/*
 * tt_node_AttributesToText: writes the attributes of p_node to p_stream.
 *
 * Walks every bucket (and every chained entry) of the node's attribute
 * dictionary. The keys "begin", "end", "dur" and "timeContainer" are
 * tested for explicitly; the existing comments say duration and
 * sequential timing info are removed. For the attributes that are kept,
 * p_value is read as a string and emitted as ` key="value"`.
 *
 * When the node's begin / end timings are valid they are written as
 * ` begin="..."` / ` end="..."` using the string built by tt_genTiming().
 *
 * NOTE(review): lines are missing from this copy; the statements inside the
 * timing-key branches, the use of b_timed_node and the action taken when
 * psz_value is NULL are not visible here.
 */
108 static void tt_node_AttributesToText( struct vlc_memstream
*p_stream
, const tt_node_t
* p_node
)
110 bool b_timed_node
= false;
111 const vlc_dictionary_t
* p_attr_dict
= &p_node
->attr_dict
;
/* outer loop: one iteration per dictionary bucket */
112 for( int i
= 0; i
< p_attr_dict
->i_size
; ++i
)
/* inner loop: follow the p_next chain of entries in that bucket */
114 for ( vlc_dictionary_entry_t
* p_entry
= p_attr_dict
->p_entries
[i
];
115 p_entry
!= NULL
; p_entry
= p_entry
->p_next
)
117 const char *psz_value
= NULL
;
119 if( !strcmp(p_entry
->psz_key
, "begin") ||
120 !strcmp(p_entry
->psz_key
, "end") ||
121 !strcmp(p_entry
->psz_key
, "dur") )
124 /* will remove duration */
127 else if( !strcmp(p_entry
->psz_key
, "timeContainer") )
129 /* also remove sequential timings info (all abs now) */
134 psz_value
= (char const*)p_entry
->p_value
;
137 if( psz_value
== NULL
)
140 vlc_memstream_printf( p_stream
, " %s=\"%s\"",
141 p_entry
->psz_key
, psz_value
);
147 if( tt_time_Valid( &p_node
->timings
.begin
) )
/* NOTE(review): tt_genTiming() returns NULL when asprintf() fails; no NULL
 * check is visible before psz is handed to "%s" - confirm and guard */
149 char *psz
= tt_genTiming( p_node
->timings
.begin
);
150 vlc_memstream_printf( p_stream
, " begin=\"%s\"", psz
);
154 if( tt_time_Valid( &p_node
->timings
.end
) )
/* NOTE(review): same unchecked NULL possibility as for "begin" above */
156 char *psz
= tt_genTiming( p_node
->timings
.end
);
157 vlc_memstream_printf( p_stream
, " end=\"%s\"", psz
);
/*
 * tt_node_ToText: serializes p_basenode (recursively) into p_stream as markup.
 *
 * Element nodes (i_type == TT_NODE_TYPE_ELEMENT):
 *   - when playbacktime is valid, the node's timings are tested with
 *     tt_timings_Contains() (presumably to skip nodes not active at that
 *     time - the statement guarded by this test is not visible here);
 *   - "<" + node name is written, followed by the attributes;
 *   - a node with children gets ">", each child serialized through a
 *     recursive call with the same playbacktime, then "</name>";
 *   - the "/>" form is also written (presumably for childless nodes; the
 *     else line is not visible).
 * Other nodes are read as tt_textnode_t and their psz_text is written with
 * vlc_memstream_puts().
 */
163 static void tt_node_ToText( struct vlc_memstream
*p_stream
, const tt_basenode_t
*p_basenode
,
164 const tt_time_t
*playbacktime
)
166 if( p_basenode
->i_type
== TT_NODE_TYPE_ELEMENT
)
168 const tt_node_t
*p_node
= (const tt_node_t
*) p_basenode
;
170 if( tt_time_Valid( playbacktime
) &&
171 !tt_timings_Contains( &p_node
->timings
, playbacktime
) )
174 vlc_memstream_putc( p_stream
, '<' );
175 vlc_memstream_puts( p_stream
, p_node
->psz_node_name
);
177 tt_node_AttributesToText( p_stream
, p_node
);
179 if( tt_node_HasChild( p_node
) )
181 vlc_memstream_putc( p_stream
, '>' );
/* debug builds only: embed the node's begin/end times as an XML comment */
183 #ifdef TTML_DEMUX_DEBUG
184 vlc_memstream_printf( p_stream
, "<!-- starts %ld ends %ld -->",
185 tt_time_Convert( &p_node
->timings
.begin
),
186 tt_time_Convert( &p_node
->timings
.end
) );
/* walk the sibling list of children */
189 for( const tt_basenode_t
*p_child
= p_node
->p_child
;
190 p_child
; p_child
= p_child
->p_next
)
192 tt_node_ToText( p_stream
, p_child
, playbacktime
);
195 vlc_memstream_printf( p_stream
, "</%s>", p_node
->psz_node_name
);
198 vlc_memstream_puts( p_stream
, "/>" );
/* non-element node: handled as a text node */
202 const tt_textnode_t
*p_textnode
= (const tt_textnode_t
*) p_basenode
;
203 vlc_memstream_puts( p_stream
, p_textnode
->psz_text
);
/*
 * Control: demuxer control callback (installed as pf_control by tt_OpenDemux).
 *
 * Handling visible in this copy:
 *   - DEMUX_SET_NEXT_DEMUX_TIME: stores the given time in i_next_demux_time
 *     and sets b_slave.
 *   - DEMUX_GET_LENGTH: last entry of the times array minus
 *     temporal_extent.begin, converted with tt_time_Convert().
 *   - DEMUX_GET_POSITION: i_next_demux_time divided by (last time + 500 ms).
 *   - DEMUX_SET_POSITION: scales the last time by the requested fraction,
 *     looks up the matching index with tt_timings_FindLowerIndex(), stores it
 *     in times.i_current and sets b_first_time.
 *   - DEMUX_CAN_PAUSE / DEMUX_SET_PAUSE_STATE / DEMUX_CAN_CONTROL_PACE:
 *     forwarded to demux_vaControlHelper().
 *
 * NOTE(review): lines are missing from this copy - the switch statement,
 * the first case labels, the declarations of pf, f, i64 and b, and every
 * return/break are not visible, so return values are not documented here.
 */
207 static int Control( demux_t
* p_demux
, int i_query
, va_list args
)
209 demux_sys_t
*p_sys
= p_demux
->p_sys
;
/* NOTE(review): case label not visible; answers a bool query with true */
217 *va_arg( args
, bool * ) = true;
/* NOTE(review): case label not visible; reports i_next_demux_time */
220 *va_arg( args
, vlc_tick_t
* ) = p_sys
->i_next_demux_time
;
/* NOTE(review): case label not visible; repositions times.i_current from a
 * vlc_tick_t argument (offset by VLC_TICK_0) - presumably a set-time query */
223 if( p_sys
->times
.i_count
)
225 tt_time_t t
= tt_time_Create( va_arg( args
, vlc_tick_t
) - VLC_TICK_0
);
226 size_t i_index
= tt_timings_FindLowerIndex( p_sys
->times
.p_array
,
227 p_sys
->times
.i_count
, t
, &b
);
228 p_sys
->times
.i_current
= i_index
;
229 p_sys
->b_first_time
= true;
233 case DEMUX_SET_NEXT_DEMUX_TIME
:
234 p_sys
->i_next_demux_time
= va_arg( args
, vlc_tick_t
);
235 p_sys
->b_slave
= true;
237 case DEMUX_GET_LENGTH
:
238 if( p_sys
->times
.i_count
)
/* length = last stored time minus the start of the temporal extent */
240 tt_time_t t
= tt_time_Sub( p_sys
->times
.p_array
[p_sys
->times
.i_count
- 1],
241 p_sys
->temporal_extent
.begin
);
242 *va_arg( args
, vlc_tick_t
* ) = tt_time_Convert( &t
);
246 case DEMUX_GET_POSITION
:
247 pf
= va_arg( args
, double * );
248 if( p_sys
->times
.i_current
>= p_sys
->times
.i_count
)
252 else if( p_sys
->times
.i_count
> 0 )
254 i64
= tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_count
- 1] );
/* the 500 ms added to the denominator keeps it non-zero when i64 is 0 */
255 *pf
= (double) p_sys
->i_next_demux_time
/ (i64
+ VLC_TICK_FROM_MS(500));
262 case DEMUX_SET_POSITION
:
263 f
= va_arg( args
, double );
264 if( p_sys
->times
.i_count
)
266 i64
= f
* tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_count
- 1] );
267 tt_time_t t
= tt_time_Create( i64
);
268 size_t i_index
= tt_timings_FindLowerIndex( p_sys
->times
.p_array
,
269 p_sys
->times
.i_count
, t
, &b
);
270 p_sys
->times
.i_current
= i_index
;
271 p_sys
->b_first_time
= true;
275 case DEMUX_CAN_PAUSE
:
276 case DEMUX_SET_PAUSE_STATE
:
277 case DEMUX_CAN_CONTROL_PACE
:
278 return demux_vaControlHelper( p_demux
->s
, 0, -1, 0, 1, i_query
, args
);
/* NOTE(review): the bodies of the remaining cases are not visible here */
280 case DEMUX_GET_PTS_DELAY
:
283 case DEMUX_GET_ATTACHMENTS
:
284 case DEMUX_GET_TITLE_INFO
:
285 case DEMUX_HAS_UNSUPPORTED_META
:
286 case DEMUX_CAN_RECORD
:
/*
 * ReadTTML: pulls nodes from p_sys->p_reader and builds the node tree
 * rooted at p_sys->p_rootnode.
 *
 * Visible steps:
 *   - each node is fetched with xml_ReaderNextNode(); a type
 *     <= XML_READER_NONE is tested for separately;
 *   - on a start element, the name is compared against "tt" and the root
 *     must not already exist; the root is then created with tt_node_New()
 *     and its content read with tt_nodes_Read();
 *   - on an end element, the name is compared against the root node's name;
 *   - finally a NULL root is tested for.
 *
 * NOTE(review): the loop/switch lines and every return statement are
 * missing from this copy, so the outcome of each test is not visible here.
 * Callers compare the result against VLC_SUCCESS (see tt_OpenDemux).
 */
294 static int ReadTTML( demux_t
* p_demux
)
296 demux_sys_t
* p_sys
= p_demux
->p_sys
;
297 const char* psz_node_name
;
301 int i_type
= xml_ReaderNextNode( p_sys
->p_reader
, &psz_node_name
);
/* NOTE(review): no use of b_empty is visible in this copy */
302 bool b_empty
= xml_ReaderIsEmptyElement( p_sys
->p_reader
);
304 if( i_type
<= XML_READER_NONE
)
312 case XML_READER_STARTELEM
:
313 if( tt_node_NameCompare( psz_node_name
, "tt" ) ||
314 p_sys
->p_rootnode
!= NULL
)
/* root node is created without a parent (NULL second argument) */
317 p_sys
->p_rootnode
= tt_node_New( p_sys
->p_reader
, NULL
, psz_node_name
);
320 if( !p_sys
->p_rootnode
||
321 tt_nodes_Read( p_sys
->p_reader
, p_sys
->p_rootnode
) != VLC_SUCCESS
)
325 case XML_READER_ENDELEM
:
326 if( !p_sys
->p_rootnode
||
327 tt_node_NameCompare( psz_node_name
, p_sys
->p_rootnode
->psz_node_name
) )
334 if( p_sys
->p_rootnode
== NULL
)
/*
 * Demux: demux callback (installed as pf_demux by tt_OpenDemux).
 *
 * While there is a next entry in the times array and the current entry is
 * not later than i_next_demux_time:
 *   - the current entry is the playback time, the next entry minus one tick
 *     is the playback end time;
 *   - when not in slave mode and b_first_time is set, the PCR is set to the
 *     playback time and the flag is cleared;
 *   - the node tree is serialized for the current time into a memstream,
 *     wrapped in a block (block_heap_Alloc), stamped with pts and length,
 *     and sent to the ES;
 *   - times.i_current is advanced.
 * When not in slave mode, the PCR is set to i_next_demux_time, which is then
 * advanced by 125 ms.
 *
 * Returns VLC_DEMUXER_EGENERIC when the memstream cannot be opened,
 * VLC_DEMUXER_EOF once no further time pair remains, otherwise
 * VLC_DEMUXER_SUCCESS.
 *
 * NOTE(review): lines are missing from this copy (braces and the statements
 * numbered 370-372 after the block allocation, among others); whether
 * p_block is checked for NULL before use is not visible here.
 */
340 static int Demux( demux_t
* p_demux
)
342 demux_sys_t
* p_sys
= p_demux
->p_sys
;
344 /* Last one must be an end time */
345 while( p_sys
->times
.i_current
+ 1 < p_sys
->times
.i_count
&&
346 tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_current
] ) <= p_sys
->i_next_demux_time
)
348 const vlc_tick_t i_playbacktime
=
349 tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_current
] );
/* end time is one tick before the next point of change */
350 const vlc_tick_t i_playbackendtime
=
351 tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_current
+ 1] ) - 1;
353 if ( !p_sys
->b_slave
&& p_sys
->b_first_time
)
355 es_out_SetPCR( p_demux
->out
, VLC_TICK_0
+ i_playbacktime
);
356 p_sys
->b_first_time
= false;
359 struct vlc_memstream stream
;
361 if( vlc_memstream_open( &stream
) )
362 return VLC_DEMUXER_EGENERIC
;
/* serialize the whole tree as seen at the current point of change */
364 tt_node_ToText( &stream
, (tt_basenode_t
*) p_sys
->p_rootnode
,
365 &p_sys
->times
.p_array
[p_sys
->times
.i_current
] );
367 if( vlc_memstream_close( &stream
) == VLC_SUCCESS
)
/* the memstream buffer is handed to the block */
369 block_t
* p_block
= block_heap_Alloc( stream
.ptr
, stream
.length
);
373 p_block
->i_pts
= VLC_TICK_0
+ i_playbacktime
;
374 p_block
->i_length
= i_playbackendtime
- i_playbacktime
;
376 es_out_Send( p_demux
->out
, p_sys
->p_es
, p_block
);
380 p_sys
->times
.i_current
++;
383 if ( !p_sys
->b_slave
)
385 es_out_SetPCR( p_demux
->out
, VLC_TICK_0
+ p_sys
->i_next_demux_time
);
386 p_sys
->i_next_demux_time
+= VLC_TICK_FROM_MS(125);
/* no (begin, end) pair left to emit */
389 if( p_sys
->times
.i_current
+ 1 >= p_sys
->times
.i_count
)
390 return VLC_DEMUXER_EOF
;
392 return VLC_DEMUXER_SUCCESS
;
/*
 * tt_OpenDemux: probes the stream for TTML and sets up the demuxer.
 *
 * Visible steps:
 *   1. Peek up to 2048 bytes (a peek of 32 bytes or fewer is tested for).
 *   2. Switch on the first 8 bytes (big-endian) to recognise UTF-16 / UTF-8
 *      signatures; UTF-16 input is converted with FromCharset(). A bare
 *      "<tt " start is also tested for.
 *   3. Simplified probing: look for "tt" preceded by ':' or '<' and not
 *      followed by a letter, then for one of four known TTML namespace URIs.
 *   4. Allocate and initialise p_sys, create the XML parser and reader, read
 *      the document with ReadTTML(), resolve timings into p_sys->times.
 *   5. Install Demux/Control and add an SPU ES with codec VLC_CODEC_TTML.
 *   tt_CloseDemux() is called from within this function (presumably on the
 *   error path - the label line is not visible).
 *
 * NOTE(review): lines are missing from this copy (declarations of p_sys, fmt
 * and t, every return/goto/break, the freeing of psz_alloc, any reassignment
 * of psz_xml); return values are therefore not documented here.
 */
395 int tt_OpenDemux( vlc_object_t
* p_this
)
397 demux_t
*p_demux
= (demux_t
*)p_this
;
400 const uint8_t *p_peek
;
401 ssize_t i_peek
= vlc_stream_Peek( p_demux
->s
, &p_peek
, 2048 );
402 if( unlikely( i_peek
<= 32 ) )
405 const char *psz_xml
= (const char *) p_peek
;
406 size_t i_xml
= i_peek
;
408 /* Try to probe without xml module/loading the full document */
409 char *psz_alloc
= NULL
;
410 switch( GetQWBE(p_peek
) )
412 /* See RFC 3023 Part 4 */
413 case UINT64_C(0xFFFE3C003F007800): /* UTF16 BOM<? */
414 case UINT64_C(0xFFFE3C003F007400): /* UTF16 BOM<t */
415 case UINT64_C(0xFEFF003C003F0078): /* UTF16 BOM<? */
416 case UINT64_C(0xFEFF003C003F0074): /* UTF16 BOM<t */
417 psz_alloc
= FromCharset( "UTF-16", p_peek
, i_peek
);
419 case UINT64_C(0x3C003F0078006D00): /* UTF16-LE <?xm */
420 case UINT64_C(0x3C003F0074007400): /* UTF16-LE <tt */
421 psz_alloc
= FromCharset( "UTF-16LE", p_peek
, i_peek
);
423 case UINT64_C(0x003C003F0078006D): /* UTF16-BE <?xm */
424 case UINT64_C(0x003C003F00740074): /* UTF16-BE <tt */
425 psz_alloc
= FromCharset( "UTF-16BE", p_peek
, i_peek
);
427 case UINT64_C(0xEFBBBF3C3F786D6C): /* UTF8 BOM<?xml */
428 case UINT64_C(0x3C3F786D6C207665): /* UTF8 <?xml ve */
429 case UINT64_C(0xEFBBBF3C74742078): /* UTF8 BOM<tt x*/
432 if(GetDWBE(p_peek
) != UINT32_C(0x3C747420)) /* tt node without xml document marker */
/* NOTE(review): the guard ensuring psz_alloc is non-NULL before strlen()
 * is not visible in this copy - confirm */
439 i_xml
= strlen( psz_alloc
);
442 /* Simplified probing. Valid TTML must have a namespace declaration */
443 const char *psz_tt
= strnstr( psz_xml
, "tt", i_xml
);
/* NOTE(review): the end-of-buffer test below subtracts p_peek although the
 * search ran on psz_xml; if psz_xml was redirected to the converted buffer
 * (not visible here) the two pointers belong to different objects - confirm.
 * isalpha() also receives a plain char; a cast to unsigned char is the
 * usual safeguard. */
444 if( !psz_tt
|| psz_tt
== psz_xml
||
445 ((size_t)(&psz_tt
[2] - (const char*)p_peek
)) == i_xml
|| isalpha(psz_tt
[2]) ||
446 (psz_tt
[-1] != ':' && psz_tt
[-1] != '<') )
/* accepted namespace declarations, matched as ="<uri>" */
453 const char * const rgsz
[] =
455 "=\"http://www.w3.org/ns/ttml\"",
456 "=\"http://www.w3.org/2004/11/ttaf1\"",
457 "=\"http://www.w3.org/2006/04/ttaf1\"",
458 "=\"http://www.w3.org/2006/10/ttaf1\"",
460 const char *psz_ns
= NULL
;
/* stop at the first namespace that matches */
461 for( size_t i
=0; i
<ARRAY_SIZE(rgsz
) && !psz_ns
; i
++ )
/* NOTE(review): the search starts at psz_xml but the length is reduced by
 * the offset of psz_tt, so the tail of the buffer is not searched; starting
 * at psz_tt may have been intended - confirm */
463 psz_ns
= strnstr( psz_xml
, rgsz
[i
],
464 i_xml
- (psz_tt
- psz_xml
) );
471 p_demux
->p_sys
= p_sys
= calloc( 1, sizeof( *p_sys
) );
472 if( unlikely( p_sys
== NULL
) )
475 p_sys
->b_first_time
= true;
476 p_sys
->temporal_extent
.i_type
= TT_TIMINGS_PARALLEL
;
477 tt_time_Init( &p_sys
->temporal_extent
.begin
);
478 tt_time_Init( &p_sys
->temporal_extent
.end
);
479 tt_time_Init( &p_sys
->temporal_extent
.dur
);
/* the temporal extent starts at 0 */
480 p_sys
->temporal_extent
.begin
.base
= 0;
482 p_sys
->p_xml
= xml_Create( p_demux
);
486 p_sys
->p_reader
= xml_ReaderCreate( p_sys
->p_xml
, p_demux
->s
);
487 if( !p_sys
->p_reader
)
/* outside debug builds, the reader object is flagged quiet */
490 #ifndef TTML_DEMUX_DEBUG
491 p_sys
->p_reader
->obj
.flags
|= OBJECT_FLAGS_QUIET
;
494 if( ReadTTML( p_demux
) != VLC_SUCCESS
)
/* fills p_sys->times with the resolved timings of the tree */
497 tt_timings_Resolve( (tt_basenode_t
*) p_sys
->p_rootnode
, &p_sys
->temporal_extent
,
498 &p_sys
->times
.p_array
, &p_sys
->times
.i_count
);
/* debug builds only: dump the whole tree through msg_Dbg */
500 #ifdef TTML_DEMUX_DEBUG
502 struct vlc_memstream stream
;
504 if( vlc_memstream_open( &stream
) )
509 tt_node_ToText( &stream
, (tt_basenode_t
*)p_sys
->p_rootnode
, &t
/* invalid */ );
511 vlc_memstream_putc( &stream
, '\0' );
513 if( vlc_memstream_close( &stream
) == VLC_SUCCESS
)
515 msg_Dbg( p_demux
, "%s", stream
.ptr
);
521 p_demux
->pf_demux
= Demux
;
522 p_demux
->pf_control
= Control
;
525 es_format_Init( &fmt
, SPU_ES
, VLC_CODEC_TTML
);
526 p_sys
->p_es
= es_out_Add( p_demux
->out
, &fmt
);
530 es_format_Clean( &fmt
);
535 tt_CloseDemux( p_demux
);
/*
 * tt_CloseDemux: releases the resources held in p_demux->p_sys.
 *
 * Visible steps: recursively delete the node tree when a root exists, delete
 * the ES, delete the XML reader when one exists, delete the XML parser
 * object, and free the times array.
 *
 * NOTE(review): lines are missing from this copy; the guards in front of
 * es_out_Del() and xml_Delete(), and whatever follows the last visible
 * statement (e.g. releasing p_sys itself), are not visible here.
 */
540 void tt_CloseDemux( demux_t
* p_demux
)
542 demux_sys_t
* p_sys
= p_demux
->p_sys
;
544 if( p_sys
->p_rootnode
)
545 tt_node_RecursiveDelete( p_sys
->p_rootnode
);
548 es_out_Del( p_demux
->out
, p_sys
->p_es
);
550 if( p_sys
->p_reader
)
551 xml_ReaderDelete( p_sys
->p_reader
);
554 xml_Delete( p_sys
->p_xml
);
556 free( p_sys
->times
.p_array
);