1 /*****************************************************************************
2 * ttml.c : TTML subtitles demux
3 *****************************************************************************
4 * Copyright (C) 2015-2017 VLC authors and VideoLAN
6 * Authors: Hugo Beauzée-Luyssen <hugo@beauzee.fr>
7 * Sushma Reddy <sushma.reddy@research.iiit.ac.in>
9 * This program is free software; you can redistribute it and/or modify it
10 * under the terms of the GNU Lesser General Public License as published by
11 * the Free Software Foundation; either version 2.1 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU Lesser General Public License for more details.
19 * You should have received a copy of the GNU Lesser General Public License
20 * along with this program; if not, write to the Free Software Foundation,
21 * Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
22 *****************************************************************************/
28 #include <vlc_common.h>
29 #include <vlc_demux.h>
31 #include <vlc_strings.h>
32 #include <vlc_memstream.h>
33 #include <vlc_es_out.h>
34 #include <vlc_charset.h> /* FromCharset */
40 #include "../codec/ttml/ttml.h"
42 //#define TTML_DEMUX_DEBUG
47 xml_reader_t
* p_reader
;
49 vlc_tick_t i_next_demux_time
;
53 tt_node_t
*p_rootnode
;
55 tt_timings_t temporal_extent
;
58 * All timings are stored unique and in sorted order.
59 * Each one is the begin or end time of a subsequence,
60 * so we use them as 'points of change' for output filtering.
/*
 * tt_genTiming: format a tt_time_t as a heap-allocated clock string.
 *
 * Splits t.base into a sub-second remainder f (t.base % CLOCK_FREQ) and
 * h / m / s fields, then builds the string with asprintf(). Three format
 * strings are visible below:
 *   "%02u:%02u:%02u.%s%u"  - used next to the leading/trailing zero handling
 *                            of the fraction f,
 *   "%02u:%02u:%02u:%s%u"  - h, m, s followed by t.frames padded to 2 digits,
 *   "%02u:%02u:%02u"       - plain form.
 *
 * Returns psz as filled by asprintf(), or NULL when asprintf() returned a
 * negative value. The caller owns the returned string.
 *
 * NOTE(review): this listing omits several original lines (what is done when
 * tt_time_Valid() fails, the conditions choosing between the three formats,
 * the bodies of the padding loop, some asprintf() arguments). Confirm those
 * against the complete file before relying on this summary.
 */
70 static char *tt_genTiming( tt_time_t t
)
72 if( !tt_time_Valid( &t
) )
74 unsigned f
= t
.base
% CLOCK_FREQ
;
76 unsigned h
= t
.base
/ 3600;
77 unsigned m
= t
.base
% 3600 / 60;
78 unsigned s
= t
.base
% 60;
/* psz_lz starts at the terminating NUL of lz, i.e. as an empty string. */
84 const char *lz
= "000000";
85 const char *psz_lz
= &lz
[6];
86 /* add leading zeroes */
87 for( unsigned i
=10*f
; i
<CLOCK_FREQ
; i
*= 10 )
89 /* strip trailing zeroes */
90 for( ; f
> 0 && (f
% 10) == 0; f
/= 10 );
91 i_ret
= asprintf( &psz
, "%02u:%02u:%02u.%s%u",
96 i_ret
= asprintf( &psz
, "%02u:%02u:%02u:%s%u",
97 h
, m
, s
, t
.frames
< 10 ? "0" : "", t
.frames
);
101 i_ret
= asprintf( &psz
, "%02u:%02u:%02u",
/* asprintf() leaves psz unspecified on failure, hence the explicit NULL. */
105 return i_ret
< 0 ? NULL
: psz
;
/*
 * tt_node_AttributesToText: append the attributes of p_node to p_stream,
 * each written as ` key="value"`.
 *
 * Iterates over every bucket of p_node->attr_dict and every entry chained in
 * it. The keys "begin", "end" and "dur" are tested together and
 * "timeContainer" separately; the existing comments state that these are
 * removed from the output. For other keys the entry's p_value is used as the
 * string value, and entries with a NULL value are tested for before printing.
 *
 * After the dictionary walk, " begin=..." and " end=..." are written from
 * p_node->timings.begin / .end when those times are valid, using
 * tt_genTiming() to format them.
 *
 * NOTE(review): the statements inside the individual branches (and any use of
 * b_timed_node) are not visible in this listing - confirm before editing.
 */
108 static void tt_node_AttributesToText( struct vlc_memstream
*p_stream
, const tt_node_t
* p_node
)
110 bool b_timed_node
= false;
111 const vlc_dictionary_t
* p_attr_dict
= &p_node
->attr_dict
;
112 for( int i
= 0; i
< p_attr_dict
->i_size
; ++i
)
114 for ( vlc_dictionary_entry_t
* p_entry
= p_attr_dict
->p_entries
[i
];
115 p_entry
!= NULL
; p_entry
= p_entry
->p_next
)
117 const char *psz_value
= NULL
;
119 if( !strcmp(p_entry
->psz_key
, "begin") ||
120 !strcmp(p_entry
->psz_key
, "end") ||
121 !strcmp(p_entry
->psz_key
, "dur") )
124 /* will remove duration */
127 else if( !strcmp(p_entry
->psz_key
, "timeContainer") )
129 /* also remove sequential timings info (all abs now) */
134 psz_value
= (char const*)p_entry
->p_value
;
137 if( psz_value
== NULL
)
/* NOTE(review): the value is written verbatim between double quotes;
 * confirm it is already XML-escaped where it is stored. */
140 vlc_memstream_printf( p_stream
, " %s=\"%s\"",
141 p_entry
->psz_key
, psz_value
);
147 if( tt_time_Valid( &p_node
->timings
.begin
) )
/* NOTE(review): tt_genTiming() returns NULL when asprintf() fails and the
 * result is handed straight to a %s conversion, here and for "end" below. */
149 char *psz
= tt_genTiming( p_node
->timings
.begin
);
150 vlc_memstream_printf( p_stream
, " begin=\"%s\"", psz
);
154 if( tt_time_Valid( &p_node
->timings
.end
) )
156 char *psz
= tt_genTiming( p_node
->timings
.end
);
157 vlc_memstream_printf( p_stream
, " end=\"%s\"", psz
);
/*
 * tt_node_ToText: serialize p_basenode (and, recursively, its children) to
 * p_stream as markup text.
 *
 * For a TT_NODE_TYPE_ELEMENT node:
 *   - when playbacktime is valid, the node's timings are tested with
 *     tt_timings_Contains() (the action taken on a miss is not visible in
 *     this listing - presumably the node is skipped; confirm);
 *   - "<name" and the attributes (tt_node_AttributesToText) are written;
 *   - if the node has children: ">" is written, each child in the p_child /
 *     p_next list is serialized with the same playbacktime, then "</name>";
 *   - the "/>" form is also present for the self-closing case.
 * The trailing code casts p_basenode to tt_textnode_t and writes psz_text
 * unchanged.
 *
 * p_stream      destination memory stream
 * p_basenode    node to serialize
 * playbacktime  time used to filter elements
 */
163 static void tt_node_ToText( struct vlc_memstream
*p_stream
, const tt_basenode_t
*p_basenode
,
164 const tt_time_t
*playbacktime
)
166 if( p_basenode
->i_type
== TT_NODE_TYPE_ELEMENT
)
168 const tt_node_t
*p_node
= (const tt_node_t
*) p_basenode
;
170 if( tt_time_Valid( playbacktime
) &&
171 !tt_timings_Contains( &p_node
->timings
, playbacktime
) )
174 vlc_memstream_putc( p_stream
, '<' );
175 vlc_memstream_puts( p_stream
, p_node
->psz_node_name
);
177 tt_node_AttributesToText( p_stream
, p_node
);
179 if( tt_node_HasChild( p_node
) )
181 vlc_memstream_putc( p_stream
, '>' );
/* Debug-only: embeds the resolved begin/end of the node as a comment.
 * NOTE(review): %ld assumes tt_time_Convert() returns long; elsewhere in
 * this file its result is stored through int64_t / vlc_tick_t - confirm
 * the conversion specifier. */
183 #ifdef TTML_DEMUX_DEBUG
184 vlc_memstream_printf( p_stream
, "<!-- starts %ld ends %ld -->",
185 tt_time_Convert( &p_node
->timings
.begin
),
186 tt_time_Convert( &p_node
->timings
.end
) );
189 for( const tt_basenode_t
*p_child
= p_node
->p_child
;
190 p_child
; p_child
= p_child
->p_next
)
192 tt_node_ToText( p_stream
, p_child
, playbacktime
);
195 vlc_memstream_printf( p_stream
, "</%s>", p_node
->psz_node_name
);
198 vlc_memstream_puts( p_stream
, "/>" );
202 const tt_textnode_t
*p_textnode
= (const tt_textnode_t
*) p_basenode
;
203 vlc_memstream_puts( p_stream
, p_textnode
->psz_text
);
/*
 * Control: demuxer control callback (installed as p_demux->pf_control by
 * tt_OpenDemux).
 *
 * Handles i_query by reading its arguments from args. Visible handlers:
 *   - a bool* argument set to true;
 *   - an int64_t* argument filled with p_sys->i_next_demux_time;
 *   - an int64_t time: the change-point index is looked up with
 *     tt_timings_FindLowerIndex() on (time - VLC_TICK_0), stored in
 *     times.i_current, and b_first_time is re-armed;
 *   - DEMUX_SET_NEXT_DEMUX_TIME: stores the time and marks the demuxer as
 *     slave (b_slave = true);
 *   - DEMUX_GET_LENGTH: last change point minus temporal_extent.begin;
 *   - DEMUX_GET_POSITION: i_next_demux_time divided by the last change point;
 *   - DEMUX_SET_POSITION: the inverse mapping, then the same index lookup as
 *     the time-based seek;
 *   - DEMUX_CAN_PAUSE / DEMUX_SET_PAUSE_STATE / DEMUX_CAN_CONTROL_PACE:
 *     forwarded to demux_vaControlHelper();
 *   - DEMUX_GET_PTS_DELAY, DEMUX_GET_ATTACHMENTS, DEMUX_GET_TITLE_INFO,
 *     DEMUX_HAS_UNSUPPORTED_META, DEMUX_CAN_RECORD: listed together.
 *
 * NOTE(review): the switch statement, the local declarations (pi64, i64, pf,
 * f, b), the case labels of the first three handlers and every return/break
 * are missing from this listing, so return values are not documented here.
 */
207 static int Control( demux_t
* p_demux
, int i_query
, va_list args
)
209 demux_sys_t
*p_sys
= p_demux
->p_sys
;
217 *va_arg( args
, bool * ) = true;
220 pi64
= va_arg( args
, int64_t * );
221 *pi64
= p_sys
->i_next_demux_time
;
224 i64
= va_arg( args
, int64_t );
225 if( p_sys
->times
.i_count
)
/* Seek: map the requested time to an index in the change-point array. */
227 tt_time_t t
= tt_time_Create( i64
- VLC_TICK_0
);
228 size_t i_index
= tt_timings_FindLowerIndex( p_sys
->times
.p_array
,
229 p_sys
->times
.i_count
, t
, &b
);
230 p_sys
->times
.i_current
= i_index
;
231 p_sys
->b_first_time
= true;
235 case DEMUX_SET_NEXT_DEMUX_TIME
:
236 p_sys
->i_next_demux_time
= va_arg( args
, vlc_tick_t
);
237 p_sys
->b_slave
= true;
239 case DEMUX_GET_LENGTH
:
240 pi64
= va_arg( args
, int64_t * );
241 if( p_sys
->times
.i_count
)
243 tt_time_t t
= tt_time_Sub( p_sys
->times
.p_array
[p_sys
->times
.i_count
- 1],
244 p_sys
->temporal_extent
.begin
);
245 *pi64
= tt_time_Convert( &t
);
249 case DEMUX_GET_POSITION
:
250 pf
= va_arg( args
, double * );
251 if( p_sys
->times
.i_current
>= p_sys
->times
.i_count
)
255 else if( p_sys
->times
.i_count
> 0 )
/* The + 0.5 keeps the divisor non-zero when the last change point is 0. */
257 i64
= tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_count
- 1] );
258 *pf
= (double) p_sys
->i_next_demux_time
/ (i64
+ 0.5);
265 case DEMUX_SET_POSITION
:
266 f
= va_arg( args
, double );
267 if( p_sys
->times
.i_count
)
269 i64
= f
* tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_count
- 1] );
270 tt_time_t t
= tt_time_Create( i64
);
271 size_t i_index
= tt_timings_FindLowerIndex( p_sys
->times
.p_array
,
272 p_sys
->times
.i_count
, t
, &b
);
273 p_sys
->times
.i_current
= i_index
;
274 p_sys
->b_first_time
= true;
278 case DEMUX_CAN_PAUSE
:
279 case DEMUX_SET_PAUSE_STATE
:
280 case DEMUX_CAN_CONTROL_PACE
:
281 return demux_vaControlHelper( p_demux
->s
, 0, -1, 0, 1, i_query
, args
);
283 case DEMUX_GET_PTS_DELAY
:
286 case DEMUX_GET_ATTACHMENTS
:
287 case DEMUX_GET_TITLE_INFO
:
288 case DEMUX_HAS_UNSUPPORTED_META
:
289 case DEMUX_CAN_RECORD
:
/*
 * ReadTTML: pull nodes from p_sys->p_reader and build the document tree
 * rooted at p_sys->p_rootnode.
 *
 * For each node returned by xml_ReaderNextNode():
 *   - a value <= XML_READER_NONE is tested for first;
 *   - XML_READER_STARTELEM: the element name is compared against "tt" and
 *     an already existing root is tested for; the root is then created with
 *     tt_node_New() and its content read with tt_nodes_Read(), whose result
 *     is compared with VLC_SUCCESS;
 *   - XML_READER_ENDELEM: tested against a missing root or a name that
 *     differs from the root's name.
 * A final check tests whether p_rootnode is still NULL.
 *
 * NOTE(review): the loop construct, the use of b_empty and all return
 * statements are not visible in this listing. tt_node_NameCompare() is
 * presumably strcmp-like (non-zero on mismatch) - confirm in ttml.h.
 */
297 static int ReadTTML( demux_t
* p_demux
)
299 demux_sys_t
* p_sys
= p_demux
->p_sys
;
300 const char* psz_node_name
;
/* NOTE(review): xml_ReaderIsEmptyElement() is queried before i_type has been
 * checked for an error/end condition - confirm this is safe for the reader. */
304 int i_type
= xml_ReaderNextNode( p_sys
->p_reader
, &psz_node_name
);
305 bool b_empty
= xml_ReaderIsEmptyElement( p_sys
->p_reader
);
307 if( i_type
<= XML_READER_NONE
)
315 case XML_READER_STARTELEM
:
316 if( tt_node_NameCompare( psz_node_name
, "tt" ) ||
317 p_sys
->p_rootnode
!= NULL
)
320 p_sys
->p_rootnode
= tt_node_New( p_sys
->p_reader
, NULL
, psz_node_name
);
323 if( !p_sys
->p_rootnode
||
324 tt_nodes_Read( p_sys
->p_reader
, p_sys
->p_rootnode
) != VLC_SUCCESS
)
328 case XML_READER_ENDELEM
:
329 if( !p_sys
->p_rootnode
||
330 tt_node_NameCompare( psz_node_name
, p_sys
->p_rootnode
->psz_node_name
) )
337 if( p_sys
->p_rootnode
== NULL
)
/*
 * Demux: demuxer callback (installed as p_demux->pf_demux by tt_OpenDemux).
 *
 * Emits one block per change point of p_sys->times that is not later than
 * p_sys->i_next_demux_time. The last entry of the array is never used as a
 * start (it must be an end time), hence the "i_current + 1 < i_count" bound.
 *
 * For each change point:
 *   - the block covers [time[i_current], time[i_current + 1] - 1];
 *   - on the first iteration of a non-slave demuxer the PCR is set to the
 *     start time;
 *   - the whole tree is serialized with tt_node_ToText() for that time into
 *     a memory stream, whose buffer is wrapped with block_heap_Alloc();
 *   - i_pts and i_length are set and the block is sent to p_sys->p_es;
 *   - times.i_current is advanced.
 *
 * When not slaved, the PCR is then set to i_next_demux_time, which is moved
 * forward by 125 ms.
 *
 * Returns VLC_DEMUXER_EGENERIC if the memory stream cannot be opened,
 * VLC_DEMUXER_EOF once no start/end pair is left, VLC_DEMUXER_SUCCESS
 * otherwise.
 *
 * NOTE(review): lines between block_heap_Alloc() and the first use of
 * p_block are missing from this listing (presumably a NULL check - confirm).
 */
343 static int Demux( demux_t
* p_demux
)
345 demux_sys_t
* p_sys
= p_demux
->p_sys
;
347 /* Last one must be an end time */
348 while( p_sys
->times
.i_current
+ 1 < p_sys
->times
.i_count
&&
349 tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_current
] ) <= p_sys
->i_next_demux_time
)
351 const vlc_tick_t i_playbacktime
=
352 tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_current
] );
/* End one tick before the next change point so intervals do not overlap. */
353 const vlc_tick_t i_playbackendtime
=
354 tt_time_Convert( &p_sys
->times
.p_array
[p_sys
->times
.i_current
+ 1] ) - 1;
356 if ( !p_sys
->b_slave
&& p_sys
->b_first_time
)
358 es_out_SetPCR( p_demux
->out
, VLC_TICK_0
+ i_playbacktime
);
359 p_sys
->b_first_time
= false;
362 struct vlc_memstream stream
;
364 if( vlc_memstream_open( &stream
) )
365 return VLC_DEMUXER_EGENERIC
;
367 tt_node_ToText( &stream
, (tt_basenode_t
*) p_sys
->p_rootnode
,
368 &p_sys
->times
.p_array
[p_sys
->times
.i_current
] );
370 if( vlc_memstream_close( &stream
) == VLC_SUCCESS
)
/* The stream buffer is handed over to the block. */
372 block_t
* p_block
= block_heap_Alloc( stream
.ptr
, stream
.length
);
376 p_block
->i_pts
= VLC_TICK_0
+ i_playbacktime
;
377 p_block
->i_length
= i_playbackendtime
- i_playbacktime
;
379 es_out_Send( p_demux
->out
, p_sys
->p_es
, p_block
);
383 p_sys
->times
.i_current
++;
386 if ( !p_sys
->b_slave
)
388 es_out_SetPCR( p_demux
->out
, VLC_TICK_0
+ p_sys
->i_next_demux_time
);
389 p_sys
->i_next_demux_time
+= VLC_TICK_FROM_MS(125);
392 if( p_sys
->times
.i_current
+ 1 >= p_sys
->times
.i_count
)
393 return VLC_DEMUXER_EOF
;
395 return VLC_DEMUXER_SUCCESS
;
/*
 * tt_OpenDemux: probe the stream for a TTML document and set up the demuxer.
 *
 * Probing (no XML module involved):
 *   - peeks up to 2048 bytes; 32 bytes or fewer is tested for as too short;
 *   - the first 8 bytes select the encoding: UTF-16 with BOM, UTF-16LE,
 *     UTF-16BE (converted with FromCharset()) or UTF-8 / UTF-8 with BOM;
 *     otherwise the first 4 bytes are compared with "<tt ";
 *   - a "tt" token preceded by ':' or '<' and not followed by a letter must
 *     be present, as well as one of the known TTML namespace URIs.
 *
 * Setup: allocates p_sys, initializes temporal_extent (parallel container,
 * begin.base = 0), creates the XML parser and reader, reads the document
 * with ReadTTML(), resolves all timings into p_sys->times with
 * tt_timings_Resolve(), installs Demux / Control and adds a
 * SPU_ES / VLC_CODEC_TTML elementary stream.
 *
 * With TTML_DEMUX_DEBUG defined, the whole tree is also dumped via msg_Dbg().
 *
 * NOTE(review): every return statement, the error label and the release of
 * psz_alloc are missing from this listing; tt_CloseDemux() is called near
 * the end, presumably on the error path - confirm.
 */
398 int tt_OpenDemux( vlc_object_t
* p_this
)
400 demux_t
*p_demux
= (demux_t
*)p_this
;
403 const uint8_t *p_peek
;
404 ssize_t i_peek
= vlc_stream_Peek( p_demux
->s
, &p_peek
, 2048 );
405 if( unlikely( i_peek
<= 32 ) )
408 const char *psz_xml
= (const char *) p_peek
;
409 size_t i_xml
= i_peek
;
411 /* Try to probe without xml module/loading the full document */
412 char *psz_alloc
= NULL
;
413 switch( GetQWBE(p_peek
) )
415 /* See RFC 3023 Part 4 */
416 case UINT64_C(0xFFFE3C003F007800): /* UTF16 BOM<? */
417 case UINT64_C(0xFFFE3C003F007400): /* UTF16 BOM<t */
418 case UINT64_C(0xFEFF003C003F0078): /* UTF16 BOM<? */
419 case UINT64_C(0xFEFF003C003F0074): /* UTF16 BOM<t */
420 psz_alloc
= FromCharset( "UTF-16", p_peek
, i_peek
);
422 case UINT64_C(0x3C003F0078006D00): /* UTF16-LE <?xm */
423 case UINT64_C(0x3C003F0074007400): /* UTF16-LE <tt */
424 psz_alloc
= FromCharset( "UTF-16LE", p_peek
, i_peek
);
426 case UINT64_C(0x003C003F0078006D): /* UTF16-BE <?xm */
427 case UINT64_C(0x003C003F00740074): /* UTF16-BE <tt */
428 psz_alloc
= FromCharset( "UTF-16BE", p_peek
, i_peek
);
430 case UINT64_C(0xEFBBBF3C3F786D6C): /* UTF8 BOM<?xml */
431 case UINT64_C(0x3C3F786D6C207665): /* UTF8 <?xml ve */
432 case UINT64_C(0xEFBBBF3C74742078): /* UTF8 BOM<tt x*/
435 if(GetDWBE(p_peek
) != UINT32_C(0x3C747420)) /* tt node without xml document marker */
/* From here on i_xml is the length of the converted copy. */
442 i_xml
= strlen( psz_alloc
);
445 /* Simplified probing. Valid TTML must have a namespace declaration */
/* NOTE(review): psz_tt points into psz_xml, which presumably is psz_alloc
 * after a charset conversion (assignment not visible here); the end-of-buffer
 * test below subtracts p_peek rather than psz_xml - confirm.
 * NOTE(review): isalpha() receives a plain char; <ctype.h> requires a value
 * representable as unsigned char (or EOF). */
446 const char *psz_tt
= strnstr( psz_xml
, "tt", i_xml
);
447 if( !psz_tt
|| psz_tt
== psz_xml
||
448 ((size_t)(&psz_tt
[2] - (const char*)p_peek
)) == i_xml
|| isalpha(psz_tt
[2]) ||
449 (psz_tt
[-1] != ':' && psz_tt
[-1] != '<') )
456 const char * const rgsz
[] =
458 "=\"http://www.w3.org/ns/ttml\"",
459 "=\"http://www.w3.org/2004/11/ttaf1\"",
460 "=\"http://www.w3.org/2006/04/ttaf1\"",
461 "=\"http://www.w3.org/2006/10/ttaf1\"",
463 const char *psz_ns
= NULL
;
464 for( size_t i
=0; i
<ARRAY_SIZE(rgsz
) && !psz_ns
; i
++ )
/* NOTE(review): the search starts at psz_xml while the length is that of
 * the data remaining after psz_tt, so the scanned window is the head of the
 * buffer; looks like psz_tt was intended as the start - confirm. */
466 psz_ns
= strnstr( psz_xml
, rgsz
[i
],
467 i_xml
- (psz_tt
- psz_xml
) );
474 p_demux
->p_sys
= p_sys
= calloc( 1, sizeof( *p_sys
) );
475 if( unlikely( p_sys
== NULL
) )
478 p_sys
->b_first_time
= true;
479 p_sys
->temporal_extent
.i_type
= TT_TIMINGS_PARALLEL
;
480 tt_time_Init( &p_sys
->temporal_extent
.begin
);
481 tt_time_Init( &p_sys
->temporal_extent
.end
);
482 tt_time_Init( &p_sys
->temporal_extent
.dur
);
483 p_sys
->temporal_extent
.begin
.base
= 0;
485 p_sys
->p_xml
= xml_Create( p_demux
);
489 p_sys
->p_reader
= xml_ReaderCreate( p_sys
->p_xml
, p_demux
->s
);
490 if( !p_sys
->p_reader
)
/* Outside debug builds the reader object is flagged quiet. */
493 #ifndef TTML_DEMUX_DEBUG
494 p_sys
->p_reader
->obj
.flags
|= OBJECT_FLAGS_QUIET
;
497 if( ReadTTML( p_demux
) != VLC_SUCCESS
)
500 tt_timings_Resolve( (tt_basenode_t
*) p_sys
->p_rootnode
, &p_sys
->temporal_extent
,
501 &p_sys
->times
.p_array
, &p_sys
->times
.i_count
);
503 #ifdef TTML_DEMUX_DEBUG
505 struct vlc_memstream stream
;
507 if( vlc_memstream_open( &stream
) )
512 tt_node_ToText( &stream
, (tt_basenode_t
*)p_sys
->p_rootnode
, &t
/* invalid */ );
514 vlc_memstream_putc( &stream
, '\0' );
516 if( vlc_memstream_close( &stream
) == VLC_SUCCESS
)
518 msg_Dbg( p_demux
, "%s", stream
.ptr
);
524 p_demux
->pf_demux
= Demux
;
525 p_demux
->pf_control
= Control
;
528 es_format_Init( &fmt
, SPU_ES
, VLC_CODEC_TTML
);
529 p_sys
->p_es
= es_out_Add( p_demux
->out
, &fmt
);
533 es_format_Clean( &fmt
);
538 tt_CloseDemux( p_demux
);
/*
 * tt_CloseDemux: release everything owned by the demuxer's private state.
 *
 * Deletes the node tree (when a root exists), removes the elementary stream,
 * deletes the XML reader (when one exists) and the XML parser, and frees the
 * change-point array. Also called from tt_OpenDemux(), so the NULL checks
 * allow for a partially initialized p_sys.
 *
 * NOTE(review): the guards around es_out_Del() / xml_Delete() and the
 * release of p_sys itself are not visible in this listing - confirm.
 */
543 void tt_CloseDemux( demux_t
* p_demux
)
545 demux_sys_t
* p_sys
= p_demux
->p_sys
;
547 if( p_sys
->p_rootnode
)
548 tt_node_RecursiveDelete( p_sys
->p_rootnode
);
551 es_out_Del( p_demux
->out
, p_sys
->p_es
);
553 if( p_sys
->p_reader
)
554 xml_ReaderDelete( p_sys
->p_reader
);
557 xml_Delete( p_sys
->p_xml
);
559 free( p_sys
->times
.p_array
);