Make that 3MB per video track, not 3MB per file.
[libmkv.git] / src / matroska.c
blob6198b5f0cb545a80c174f53f005bed88709608a2
1 /*****************************************************************************
2 * matroska.c:
3 *****************************************************************************
4 * Copyright (C) 2005 x264 project
5 * $Id: $
7 * Authors: Mike Matsnev
8 * Nathan Caldwell
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111, USA.
23 *****************************************************************************/
24 #include "libmkv.h"
25 #include "matroska.h"
26 #include "config.h"
28 int mk_seekFile(mk_Writer *w, uint64_t pos) {
29 if (fseek(w->fp, pos, SEEK_SET))
30 return -1;
32 w->f_pos = pos;
34 if (pos > w->f_eof)
35 w->f_eof = pos;
37 return 0;
40 int mk_writeVoid(mk_Context *c, uint64_t length) {
41 char *c_void = calloc(length, sizeof(char));
43 CHECK(mk_writeID(c, 0xec));
44 CHECK(mk_writeSize(c, length));
45 CHECK(mk_appendContextData(c, c_void, length));
46 free(c_void);
47 return 0;
/*
 * Build a Xiph-style lacing header for `num_frames` frame sizes.
 *
 * Layout of the returned buffer: one byte holding `num_frames`, then for
 * each entry of `sizes` a run of 0xff bytes (one per full 255 in the size)
 * followed by one byte holding the remainder (0..254).
 *
 * sizes        array of `num_frames` frame sizes (may be NULL only when
 *              num_frames is 0).
 * output_size  if non-NULL, receives the number of bytes in the buffer.
 *
 * Returns a heap buffer the caller must free(), or NULL on allocation
 * failure or invalid arguments.
 *
 * The required size is computed exactly before allocating, so the buffer is
 * never grown and no write can land outside it. Sizes are handled as full
 * 64-bit values rather than being truncated to `unsigned`.
 */
char *mk_laceXiph(uint64_t *sizes, uint8_t num_frames, uint64_t *output_size) {
  uint64_t total = 1;  /* leading byte that stores num_frames */
  uint64_t offset = 0;
  unsigned char *laced;
  unsigned i;

  if (sizes == NULL && num_frames > 0)
    return NULL;

  /* Each size needs size/255 bytes of 0xff plus one remainder byte. */
  for (i = 0; i < num_frames; i++) {
    uint64_t need = sizes[i] / 255 + 1;
    if (total + need < total)  /* unsigned wrap-around */
      return NULL;
    total += need;
  }
  if ((uint64_t)(size_t)total != total)  /* does not fit in size_t */
    return NULL;

  laced = calloc((size_t)total, sizeof(*laced));
  if (laced == NULL)
    return NULL;

  laced[offset++] = num_frames;
  for (i = 0; i < num_frames; i++) {
    uint64_t remaining = sizes[i];

    for (; remaining >= 255; remaining -= 255)
      laced[offset++] = 255;
    laced[offset++] = (unsigned char)remaining;
  }

  if (output_size != NULL)
    *output_size = offset;

  return (char *)laced;
}
80 mk_Writer *mk_createWriter(const char *filename, int64_t timescale, uint8_t vlc_compat) {
81 mk_Writer *w = calloc(1, sizeof(*w));
82 if (w == NULL)
83 return NULL;
85 w->root = mk_createContext(w, NULL, 0);
86 if (w->root == NULL) {
87 free(w);
88 return NULL;
91 if ((w->cues = mk_createContext(w, w->root, 0x1c53bb6b)) == NULL) // Cues
93 mk_destroyContexts(w);
94 free(w);
95 return NULL;
98 w->fp = fopen(filename, "wb");
99 if (w->fp == NULL) {
100 mk_destroyContexts(w);
101 free(w);
102 return NULL;
105 w->timescale = timescale;
106 w->vlc_compat = vlc_compat;
108 return w;
111 int mk_writeHeader(mk_Writer *w, const char *writingApp) {
112 mk_Context *c;
114 if (w->wrote_header)
115 return -1;
117 if ((c = mk_createContext(w, w->root, 0x1a45dfa3)) == NULL) // EBML
118 return -1;
119 CHECK(mk_writeUInt(c, 0x4286, 1)); // EBMLVersion
120 CHECK(mk_writeUInt(c, 0x42f7, 1)); // EBMLReadVersion
121 CHECK(mk_writeUInt(c, 0x42f2, 4)); // EBMLMaxIDLength
122 CHECK(mk_writeUInt(c, 0x42f3, 8)); // EBMLMaxSizeLength
123 CHECK(mk_writeStr(c, 0x4282, "matroska")); // DocType
124 CHECK(mk_writeUInt(c, 0x4287, 1)); // DocTypeVersion
125 CHECK(mk_writeUInt(c, 0x4285, 1)); // DocTypeReadversion
126 CHECK(mk_closeContext(c, 0));
128 if ((c = mk_createContext(w, w->root, 0x18538067)) == NULL) // Segment
129 return -1;
130 CHECK(mk_flushContextID(c));
131 w->segment_ptr = c->d_cur;
132 CHECK(mk_closeContext(c, &w->segment_ptr));
134 if (w->vlc_compat)
136 CHECK(mk_writeVoid(w->root, 0x100)); // 256 bytes should be enough room for our Seek entries.
137 CHECK(mk_writeVoid(w->root, 0x800)); // 2048 bytes for Chapters.
138 CHECK(mk_writeVoid(w->root, 0x1000)); // 4096 bytes for Cues.
139 } else
141 w->seek_data.seekhead = 0x80000000;
142 CHECK(mk_writeSeek(w, &w->seekhead_ptr));
143 w->seek_data.seekhead = 0;
146 if ((c = mk_createContext(w, w->root, 0x1549a966)) == NULL) // SegmentInfo
147 return -1;
148 w->seek_data.segmentinfo = w->root->d_cur - w->segment_ptr;
149 CHECK(mk_writeStr(c, 0x4d80, PACKAGE_STRING)); // MuxingApp
150 CHECK(mk_writeStr(c, 0x5741, writingApp)); // WritingApp
151 CHECK(mk_writeUInt(c, 0x2ad7b1, w->timescale)); // TimecodeScale
152 CHECK(mk_writeFloat(c, 0x4489, 0)); // Duration
153 w->duration_ptr = c->d_cur - 4;
154 CHECK(mk_closeContext(c, &w->duration_ptr));
156 w->seek_data.tracks = w->root->d_cur - w->segment_ptr;
158 if (w->tracks) {
159 CHECK(mk_closeContext(w->tracks, 0));
162 CHECK(mk_flushContextData(w->root));
164 w->wrote_header = 1;
165 w->def_duration = w->tracks_arr[0]->default_duration;
166 return 0;
169 static int mk_closeCluster(mk_Writer *w) {
170 if (w->cluster.context == NULL)
171 return 0;
172 w->cluster.count++;
173 CHECK(mk_closeContext(w->cluster.context, 0));
174 w->cluster.context = NULL;
175 CHECK(mk_flushContextData(w->root));
176 return 0;
179 int mk_flushFrame(mk_Writer *w, mk_Track *track) {
180 mk_Context *c, *tp;
181 int64_t delta, ref = 0;
182 unsigned fsize, bgsize;
183 uint8_t flags, c_delta_flags[2];
184 int i;
185 char *laced = NULL;
186 uint64_t length = 0;
188 if (!track->in_frame)
189 return 0;
191 delta = track->frame.timecode/w->timescale - w->cluster.tc_scaled;
192 if (delta > 32767ll || delta < -32768ll)
193 CHECK(mk_closeCluster(w));
195 if (w->cluster.context == NULL) {
196 w->cluster.tc_scaled = track->frame.timecode / w->timescale;
197 w->cluster.context = mk_createContext(w, w->root, 0x1f43b675); // Cluster
198 if (w->cluster.context == NULL)
199 return -1;
201 w->cluster.pointer = w->f_pos - w->segment_ptr;
203 CHECK(mk_writeUInt(w->cluster.context, 0xe7, w->cluster.tc_scaled)); // Cluster Timecode
205 delta = 0;
206 w->cluster.block_count = 0;
209 fsize = track->frame.data ? track->frame.data->d_cur : 0;
210 bgsize = fsize + 4 + mk_ebmlSizeSize(fsize + 4) + 1;
211 if (!track->frame.keyframe) {
212 ref = track->prev_frame_tc_scaled - w->cluster.tc_scaled - delta;
213 bgsize += 1 + 1 + mk_ebmlSIntSize(ref);
216 CHECK(mk_writeID(w->cluster.context, 0xa0)); // BlockGroup
217 CHECK(mk_writeSize(w->cluster.context, bgsize));
218 CHECK(mk_writeID(w->cluster.context, 0xa1)); // Block
220 switch (track->frame.lacing) {
221 case MK_LACING_XIPH:
222 laced = mk_laceXiph(track->frame.lacing_sizes, track->frame.lacing_num_frames, &length);
223 break;
224 case MK_LACING_EBML:
225 length += mk_ebmlSizeSize(track->frame.lacing_sizes[0]) + 1;
226 for (i = 1; i < track->frame.lacing_num_frames; i++)
227 length += mk_ebmlSizeSize(track->frame.lacing_sizes[i] << 1);
228 break;
229 case MK_LACING_FIXED:
231 laced = calloc(1, sizeof(char));
232 laced[0] = track->frame.lacing_num_frames;
233 ++length;
235 break;
238 CHECK(mk_writeSize(w->cluster.context, fsize + 4 + length));
239 CHECK(mk_writeSize(w->cluster.context, track->track_id)); // track number
241 w->cluster.block_count++;
243 c_delta_flags[0] = delta >> 8;
244 c_delta_flags[1] = delta;
245 CHECK(mk_appendContextData(w->cluster.context, c_delta_flags, 2));
247 flags = ( track->frame.keyframe << 8 ) | track->frame.lacing;
248 CHECK(mk_appendContextData(w->cluster.context, &flags, 1));
249 if (track->frame.lacing) {
250 if (track->frame.lacing == MK_LACING_EBML) {
251 CHECK(mk_appendContextData(w->cluster.context, &track->frame.lacing_num_frames, 1));
252 CHECK(mk_writeSize(w->cluster.context, track->frame.lacing_sizes[0]));
253 for (i = 1; i < track->frame.lacing_num_frames; i++)
255 CHECK(mk_writeSSize(w->cluster.context, track->frame.lacing_sizes[i] - track->frame.lacing_sizes[i-1]));
257 } else if (length > 0 && laced != NULL) {
258 CHECK(mk_appendContextData(w->cluster.context, laced, length));
259 free(laced);
260 laced = NULL;
264 if (track->frame.data) {
265 CHECK(mk_appendContextData(w->cluster.context, track->frame.data->data, track->frame.data->d_cur));
266 track->frame.data->d_cur = 0;
268 if (!track->frame.keyframe)
269 CHECK(mk_writeSInt(w->cluster.context, 0xfb, ref)); // ReferenceBlock
271 if (track->frame.keyframe && (track->track_type & MK_TRACK_VIDEO) && (track->prev_cue_pos + 3*CLSIZE) >= w->f_pos) {
272 if ((c = mk_createContext(w, w->cues, 0xbb)) == NULL) // CuePoint
273 return -1;
274 CHECK(mk_writeUInt(c, 0xb3, track->frame.timecode)); // CueTime
276 if ((tp = mk_createContext(w, c, 0xb7)) == NULL) // CueTrackPositions
277 return -1;
278 CHECK(mk_writeUInt(tp, 0xf7, track->track_id)); // CueTrack
279 CHECK(mk_writeUInt(tp, 0xf1, w->cluster.pointer)); // CueClusterPosition
280 // CHECK(mk_writeUInt(c, 0x5378, w->cluster.block_count)); // CueBlockNumber
281 CHECK(mk_closeContext(tp, 0));
282 CHECK(mk_closeContext(c, 0));
285 track->in_frame = 0;
286 track->prev_frame_tc_scaled = w->cluster.tc_scaled + delta;
288 if (w->cluster.context->d_cur > CLSIZE)
289 CHECK(mk_closeCluster(w));
291 return 0;
294 int mk_startFrame(mk_Writer *w, mk_Track *track) {
295 if (mk_flushFrame(w, track) < 0)
296 return -1;
298 track->in_frame = 1;
299 track->frame.keyframe = 0;
300 track->frame.lacing = MK_LACING_NONE;
301 track->frame.lacing_num_frames = 0;
302 track->frame.lacing_sizes = NULL;
304 return 0;
307 int mk_setFrameFlags(mk_Writer *w, mk_Track *track, int64_t timestamp, unsigned keyframe) {
308 if (!track->in_frame)
309 return -1;
311 track->frame.timecode = timestamp;
312 track->frame.keyframe = keyframe != 0;
314 if (track->max_frame_tc < timestamp)
315 track->max_frame_tc = timestamp;
317 return 0;
320 int mk_setFrameLacing(mk_Writer *w, mk_Track *track, uint8_t lacing, uint8_t num_frames, uint32_t sizes[]) {
321 if (!track->in_frame)
322 return -1;
323 track->frame.lacing_sizes = calloc(num_frames, sizeof(uint32_t));
325 track->frame.lacing = lacing;
326 track->frame.lacing_num_frames = num_frames;
327 memcpy(track->frame.lacing_sizes, sizes, num_frames);
329 return 0;
332 int mk_addFrameData(mk_Writer *w, mk_Track *track, const void *data, unsigned size) {
333 if (!track->in_frame)
334 return -1;
336 if (track->frame.data == NULL)
337 if ((track->frame.data = mk_createContext(w, NULL, 0)) == NULL)
338 return -1;
340 return mk_appendContextData(track->frame.data, data, size);
343 /* The offset of the SeekHead is returned in *pointer. */
344 int mk_writeSeek(mk_Writer *w, int64_t *pointer) {
345 mk_Context *c, *s;
346 int64_t seekhead_ptr;
348 if ((c = mk_createContext(w, w->root, 0x114d9b74)) == NULL) // SeekHead
349 return -1;
350 if (pointer != NULL)
351 seekhead_ptr = w->f_pos;
352 if (w->seek_data.seekhead) {
353 if ((s = mk_createContext(w, c, 0x4dbb)) == NULL) // Seek
354 return -1;
355 CHECK(mk_writeUInt(s, 0x53ab, 0x114d9b74)); // SeekID
356 CHECK(mk_writeUInt(s, 0x53ac, w->seek_data.seekhead)); // SeekPosition
357 CHECK(mk_closeContext(s, 0));
359 if (w->seek_data.segmentinfo) {
360 if ((s = mk_createContext(w, c, 0x4dbb)) == NULL) // Seek
361 return -1;
362 CHECK(mk_writeUInt(s, 0x53ab, 0x1549a966)); // SeekID
363 CHECK(mk_writeUInt(s, 0x53ac, w->seek_data.segmentinfo)); // SeekPosition
364 CHECK(mk_closeContext(s, 0));
366 if (w->seek_data.tracks) {
367 if ((s = mk_createContext(w, c, 0x4dbb)) == NULL) // Seek
368 return -1;
369 CHECK(mk_writeUInt(s, 0x53ab, 0x1654ae6b)); // SeekID
370 CHECK(mk_writeUInt(s, 0x53ac, w->seek_data.tracks)); // SeekPosition
371 CHECK(mk_closeContext(s, 0));
373 if (w->seek_data.cues) {
374 if ((s = mk_createContext(w, c, 0x4dbb)) == NULL) // Seek
375 return -1;
376 CHECK(mk_writeUInt(s, 0x53ab, 0x1c53bb6b)); // SeekID
377 CHECK(mk_writeUInt(s, 0x53ac, w->seek_data.cues)); // SeekPosition
378 CHECK(mk_closeContext(s, 0));
380 if (w->seek_data.attachments) {
381 if ((s = mk_createContext(w, c, 0x4dbb)) == NULL) // Seek
382 return -1;
383 CHECK(mk_writeUInt(s, 0x53ab, 0x1941a469)); // SeekID
384 CHECK(mk_writeUInt(s, 0x53ac, w->seek_data.attachments)); // SeekPosition
385 CHECK(mk_closeContext(s, 0));
387 if (w->seek_data.chapters) {
388 if ((s = mk_createContext(w, c, 0x4dbb)) == NULL) // Seek
389 return -1;
390 CHECK(mk_writeUInt(s, 0x53ab, 0x1043a770)); // SeekID
391 CHECK(mk_writeUInt(s, 0x53ac, w->seek_data.chapters)); // SeekPosition
392 CHECK(mk_closeContext(s, 0));
394 if (w->seek_data.tags) {
395 if ((s = mk_createContext(w, c, 0x4dbb)) == NULL) // Seek
396 return -1;
397 CHECK(mk_writeUInt(s, 0x53ab, 0x1254c367)); // SeekID
398 CHECK(mk_writeUInt(s, 0x53ac, w->seek_data.tags)); // SeekPosition
399 CHECK(mk_closeContext(s, 0));
401 CHECK(mk_closeContext(c, 0));
403 if (pointer != NULL)
404 *pointer = seekhead_ptr;
406 return 0;
409 int mk_close(mk_Writer *w) {
410 int i, ret = 0;
411 mk_Track *tk;
412 int64_t max_frame_tc = w->tracks_arr[0]->max_frame_tc;
413 uint64_t segment_size = 0;
414 unsigned char c_size[8];
416 for (i = w->num_tracks - 1; i >= 0; i--)
418 tk = w->tracks_arr[i];
419 w->tracks_arr[i] = NULL;
420 --w->num_tracks;
421 if (mk_flushFrame(w, tk) < 0)
422 ret = -1;
423 free(tk);
424 tk = NULL;
427 if (mk_closeCluster(w) < 0)
428 ret = -1;
430 if (w->chapters != NULL)
432 if (w->vlc_compat) {
433 if (mk_seekFile(w, w->segment_ptr + 0x103) < 0)
434 ret = -1;
436 w->seek_data.chapters = w->f_pos - w->segment_ptr;
437 mk_writeChapters(w);
438 if (w->vlc_compat) {
439 if (mk_flushContextData(w->root) < 0)
440 ret = -1;
441 if (mk_writeVoid(w->root, (0x800 - (w->f_pos - w->segment_ptr))) < 0)
442 ret = -1;
444 if (mk_flushContextData(w->root) < 0)
445 ret = -1;
448 w->seek_data.cues = w->f_pos - w->segment_ptr;
449 // if (w->vlc_compat) {
450 // if (mk_seekFile(w, w->segment_ptr + 259 + 2051) < 0)
451 // ret = -1;
452 // }
453 if (mk_closeContext(w->cues, 0) < 0)
454 ret = -1;
455 if (w->vlc_compat) {
456 if (mk_flushContextData(w->root) < 0)
457 ret = -1;
458 if (mk_writeVoid(w->root, (0x1000 - (w->f_pos - w->segment_ptr))) < 0)
459 ret = -1;
461 if (mk_flushContextData(w->root) < 0)
462 ret = -1;
464 if (w->wrote_header) {
465 if (w->vlc_compat) {
466 if (mk_seekFile(w, w->segment_ptr) < 0)
467 ret = -1;
470 if (mk_writeSeek(w, &w->seek_data.seekhead) < 0)
471 ret = -1;
472 w->seek_data.seekhead -= w->segment_ptr;
474 if (w->vlc_compat)
476 if (mk_flushContextData(w->root) < 0)
477 ret = -1;
478 if (mk_writeVoid(w->root, (256 - (w->f_pos - w->segment_ptr))) < 0)
479 ret = -1;
482 if (mk_flushContextData(w->root) < 0)
483 ret = -1;
485 if (!w->vlc_compat)
487 int i = w->seek_data.segmentinfo;
488 w->seek_data.segmentinfo = 0;
489 w->seek_data.tracks = 0;
490 w->seek_data.cues = 0;
491 w->seek_data.chapters = 0;
492 w->seek_data.attachments = 0;
493 w->seek_data.tags = 0;
494 if (mk_seekFile(w, w->segment_ptr) < 0)
495 ret = -1;
496 if (mk_writeSeek(w, NULL) < 0 ||
497 mk_flushContextData(w->root) < 0)
498 ret = -1;
499 if (((i + w->segment_ptr) - w->f_pos - 2) > 1)
500 if (mk_writeVoid(w->root, (i + w->segment_ptr) - w->f_pos - 2) < 0 ||
501 mk_flushContextData(w->root) < 0)
502 ret = -1;
505 if (mk_seekFile(w, w->duration_ptr) < 0)
506 ret = -1;
507 if (mk_writeFloatRaw(w->root, (float)((double)(max_frame_tc+w->def_duration) / w->timescale)) < 0 ||
508 mk_flushContextData(w->root) < 0)
509 ret = -1;
510 if (mk_seekFile(w, w->segment_ptr - 8) < 0)
511 ret = -1;
512 segment_size = w->f_eof - w->segment_ptr;
513 for (i = 7; i > 0; --i)
514 c_size[i] = segment_size >> (8 * (7-i));
515 c_size[i] = 0x01;
516 if (mk_appendContextData(w->root, &c_size, 8) < 0 ||
517 mk_flushContextData(w->root) < 0)
518 ret = -1;
521 if (mk_closeContext(w->root, 0) < 0)
522 ret = -1;
523 mk_destroyContexts(w);
524 fclose(w->fp);
525 free(w->tracks_arr);
526 free(w);
528 return ret;