2011-06-15 11:19:50 -07:00
|
|
|
|
|
|
|
|
2011-05-12 17:24:54 +02:00
|
|
|
// Simple Extensible Binary Meta Language (EBML) reader and writer on a
|
2011-03-22 13:59:17 -07:00
|
|
|
// cursor model. See the specification here:
|
|
|
|
// http://www.matroska.org/technical/specs/rfc/index.html
|
2011-09-12 16:13:28 -07:00
|
|
|
import option::{some, none};
|
2011-03-22 13:59:17 -07:00
|
|
|
|
2011-07-27 14:19:39 +02:00
|
|
|
// An element header as a record: the element's tag `id` and its `size`.
// NOTE(review): not referenced by any function visible in this part of the
// file; `size` is presumably the payload length in bytes -- confirm.
type ebml_tag = {id: uint, size: uint};
|
2011-06-15 11:19:50 -07:00
|
|
|
|
2011-07-27 14:19:39 +02:00
|
|
|
// Pairs an `ebml_tag` with two positions, `tag_pos` and `data_pos`.
// NOTE(review): not referenced by any function visible in this part of the
// file; the positions are presumably byte offsets of the tag header and of
// its payload -- confirm against users of this type.
type ebml_state = {ebml_tag: ebml_tag, tag_pos: uint, data_pos: uint};
|
2011-03-22 13:59:17 -07:00
|
|
|
|
2011-06-15 11:19:50 -07:00
|
|
|
|
2011-03-22 13:59:17 -07:00
|
|
|
// TODO: When we have module renaming, make "reader" and "writer" separate
|
|
|
|
// modules within this file.
|
|
|
|
|
2011-05-12 17:24:54 +02:00
|
|
|
// ebml reading
|
2011-08-04 17:24:54 -07:00
|
|
|
// A view onto part of a shared byte vector. `data` is the whole buffer;
// `start` is the index of the first byte of the view and `end` is the index
// one past its last byte (new_doc sets `end` to the vector length, and
// doc_data slices `data` from `start` to `end`).
type doc = {data: @[u8], start: uint, end: uint};
|
2011-07-27 14:19:39 +02:00
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
// Decodes the variable-length integer ("vint") that begins at data[start].
//
// The highest set bit of the first byte selects the encoded width:
// 0x80 -> 1 byte, 0x40 -> 2 bytes, 0x20 -> 3 bytes, 0x10 -> 4 bytes. The
// bits of the first byte below that marker, followed by the remaining
// bytes, form the value, most significant byte first.
//
// Returns the decoded value in `val` and, in `next`, the index of the first
// byte after the vint. Logs "vint too big" and fails when none of the four
// marker bits is set in the first byte.
fn vint_at(data: [u8], start: uint) -> {val: uint, next: uint} {
    let lead = data[start];
    if lead & 0x80u8 != 0u8 {
        // One byte: the low 7 bits are the value.
        ret {val: (lead & 0x7fu8) as uint, next: start + 1u};
    } else if lead & 0x40u8 != 0u8 {
        // Two bytes: 6 bits from the lead byte, then one full byte.
        let hi = ((lead & 0x3fu8) as uint) << 8u;
        let lo = data[start + 1u] as uint;
        ret {val: hi | lo, next: start + 2u};
    } else if lead & 0x20u8 != 0u8 {
        // Three bytes: 5 bits from the lead byte, then two full bytes.
        let b0 = ((lead & 0x1fu8) as uint) << 16u;
        let b1 = (data[start + 1u] as uint) << 8u;
        let b2 = data[start + 2u] as uint;
        ret {val: b0 | b1 | b2, next: start + 3u};
    } else if lead & 0x10u8 != 0u8 {
        // Four bytes: 4 bits from the lead byte, then three full bytes.
        let b0 = ((lead & 0x0fu8) as uint) << 24u;
        let b1 = (data[start + 1u] as uint) << 16u;
        let b2 = (data[start + 2u] as uint) << 8u;
        let b3 = data[start + 3u] as uint;
        ret {val: b0 | b1 | b2 | b3, next: start + 4u};
    } else { log_err "vint too big"; fail; }
}
|
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
fn new_doc(data: @[u8]) -> doc {
|
2011-08-12 10:56:57 -07:00
|
|
|
ret {data: data, start: 0u, end: vec::len::<u8>(*data)};
|
2011-04-07 02:53:25 +02:00
|
|
|
}
|
2011-03-22 13:59:17 -07:00
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
fn doc_at(data: @[u8], start: uint) -> doc {
|
2011-08-08 15:30:37 -07:00
|
|
|
let elt_tag = vint_at(*data, start);
|
|
|
|
let elt_size = vint_at(*data, elt_tag.next);
|
2011-07-27 14:19:39 +02:00
|
|
|
let end = elt_size.next + elt_size.val;
|
|
|
|
ret {data: data, start: elt_size.next, end: end};
|
2011-03-22 13:59:17 -07:00
|
|
|
}
|
|
|
|
|
2011-08-10 09:27:11 -07:00
|
|
|
fn maybe_get_doc(d: doc, tg: uint) -> option::t<doc> {
|
2011-07-27 14:19:39 +02:00
|
|
|
let pos = d.start;
|
|
|
|
while pos < d.end {
|
2011-08-08 15:30:37 -07:00
|
|
|
let elt_tag = vint_at(*d.data, pos);
|
|
|
|
let elt_size = vint_at(*d.data, elt_tag.next);
|
2011-07-26 14:06:02 +02:00
|
|
|
pos = elt_size.next + elt_size.val;
|
2011-07-27 14:19:39 +02:00
|
|
|
if elt_tag.val == tg {
|
2011-08-12 10:56:57 -07:00
|
|
|
ret some::<doc>({data: d.data, start: elt_size.next, end: pos});
|
2011-03-25 17:53:46 -07:00
|
|
|
}
|
2011-03-22 13:59:17 -07:00
|
|
|
}
|
2011-08-12 10:56:57 -07:00
|
|
|
ret none::<doc>;
|
2011-03-22 13:59:17 -07:00
|
|
|
}
|
|
|
|
|
2011-07-27 14:19:39 +02:00
|
|
|
fn get_doc(d: doc, tg: uint) -> doc {
|
|
|
|
alt maybe_get_doc(d, tg) {
|
|
|
|
some(d) { ret d; }
|
|
|
|
none. {
|
2011-09-02 15:34:58 -07:00
|
|
|
log_err "failed to find block with tag " + uint::to_str(tg, 10u);
|
2011-07-27 14:19:39 +02:00
|
|
|
fail;
|
|
|
|
}
|
2011-04-07 02:53:25 +02:00
|
|
|
}
|
2011-03-22 13:59:17 -07:00
|
|
|
}
|
|
|
|
|
2011-10-21 12:31:48 +02:00
|
|
|
fn docs(d: doc, it: block(uint, doc)) {
|
2011-07-27 14:19:39 +02:00
|
|
|
let pos = d.start;
|
|
|
|
while pos < d.end {
|
2011-08-08 15:30:37 -07:00
|
|
|
let elt_tag = vint_at(*d.data, pos);
|
|
|
|
let elt_size = vint_at(*d.data, elt_tag.next);
|
2011-07-26 14:06:02 +02:00
|
|
|
pos = elt_size.next + elt_size.val;
|
2011-10-21 12:31:48 +02:00
|
|
|
it(elt_tag.val, {data: d.data, start: elt_size.next, end: pos});
|
2011-03-31 14:37:09 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-10-21 12:31:48 +02:00
|
|
|
fn tagged_docs(d: doc, tg: uint, it: block(doc)) {
|
2011-07-27 14:19:39 +02:00
|
|
|
let pos = d.start;
|
|
|
|
while pos < d.end {
|
2011-08-08 15:30:37 -07:00
|
|
|
let elt_tag = vint_at(*d.data, pos);
|
|
|
|
let elt_size = vint_at(*d.data, elt_tag.next);
|
2011-07-26 14:06:02 +02:00
|
|
|
pos = elt_size.next + elt_size.val;
|
2011-07-27 14:19:39 +02:00
|
|
|
if elt_tag.val == tg {
|
2011-10-21 12:31:48 +02:00
|
|
|
it({data: d.data, start: elt_size.next, end: pos});
|
2011-04-07 02:53:25 +02:00
|
|
|
}
|
|
|
|
}
|
2011-03-31 14:37:09 -07:00
|
|
|
}
|
|
|
|
|
2011-08-12 10:56:57 -07:00
|
|
|
fn doc_data(d: doc) -> [u8] { ret vec::slice::<u8>(*d.data, d.start, d.end); }
|
2011-03-22 13:59:17 -07:00
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
fn be_uint_from_bytes(data: @[u8], start: uint, size: uint) -> uint {
|
2011-07-27 14:19:39 +02:00
|
|
|
let sz = size;
|
2011-05-02 17:47:24 -07:00
|
|
|
assert (sz <= 4u);
|
2011-07-27 14:19:39 +02:00
|
|
|
let val = 0u;
|
|
|
|
let pos = start;
|
|
|
|
while sz > 0u {
|
2011-04-07 02:53:25 +02:00
|
|
|
sz -= 1u;
|
2011-08-19 15:16:48 -07:00
|
|
|
val += (data[pos] as uint) << sz * 8u;
|
2011-04-07 02:53:25 +02:00
|
|
|
pos += 1u;
|
|
|
|
}
|
|
|
|
ret val;
|
2011-03-31 14:37:09 -07:00
|
|
|
}
|
|
|
|
|
2011-07-27 14:19:39 +02:00
|
|
|
fn doc_as_uint(d: doc) -> uint {
|
2011-04-07 02:53:25 +02:00
|
|
|
ret be_uint_from_bytes(d.data, d.start, d.end - d.start);
|
2011-03-22 13:59:17 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2011-06-15 11:19:50 -07:00
|
|
|
// ebml writing
|
2011-08-11 19:14:38 -07:00
|
|
|
// State for writing ebml: the underlying `io::buf_writer`, plus a stack of
// stream positions, one per currently open tag, each recording where that
// tag's size placeholder was written (start_tag pushes, end_tag pops).
type writer = {writer: io::buf_writer, mutable size_positions: [uint]};
|
2011-07-27 14:19:39 +02:00
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
fn write_sized_vint(w: io::buf_writer, n: uint, size: uint) {
|
2011-08-04 17:24:54 -07:00
|
|
|
let buf: [u8];
|
2011-07-27 14:19:39 +02:00
|
|
|
alt size {
|
2011-08-19 15:16:48 -07:00
|
|
|
1u { buf = [0x80u8 | (n as u8)]; }
|
|
|
|
2u { buf = [0x40u8 | (n >> 8u as u8), n & 0xffu as u8]; }
|
2011-07-27 14:19:39 +02:00
|
|
|
3u {
|
|
|
|
buf =
|
2011-08-19 15:16:48 -07:00
|
|
|
[0x20u8 | (n >> 16u as u8), n >> 8u & 0xffu as u8,
|
|
|
|
n & 0xffu as u8];
|
2011-07-27 14:19:39 +02:00
|
|
|
}
|
|
|
|
4u {
|
|
|
|
buf =
|
2011-08-19 15:16:48 -07:00
|
|
|
[0x10u8 | (n >> 24u as u8), n >> 16u & 0xffu as u8,
|
|
|
|
n >> 8u & 0xffu as u8, n & 0xffu as u8];
|
2011-07-27 14:19:39 +02:00
|
|
|
}
|
|
|
|
_ { log_err "vint to write too big"; fail; }
|
2011-03-22 17:28:35 -07:00
|
|
|
}
|
|
|
|
w.write(buf);
|
|
|
|
}
|
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
fn write_vint(w: io::buf_writer, n: uint) {
|
2011-07-27 14:19:39 +02:00
|
|
|
if n < 0x7fu { write_sized_vint(w, n, 1u); ret; }
|
|
|
|
if n < 0x4000u { write_sized_vint(w, n, 2u); ret; }
|
|
|
|
if n < 0x200000u { write_sized_vint(w, n, 3u); ret; }
|
|
|
|
if n < 0x10000000u { write_sized_vint(w, n, 4u); ret; }
|
2011-04-19 12:02:06 +02:00
|
|
|
log_err "vint to write too big";
|
2011-03-22 17:28:35 -07:00
|
|
|
fail;
|
|
|
|
}
|
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
fn create_writer(w: io::buf_writer) -> writer {
|
2011-08-19 15:16:48 -07:00
|
|
|
let size_positions: [uint] = [];
|
2011-07-27 14:19:39 +02:00
|
|
|
ret {writer: w, mutable size_positions: size_positions};
|
2011-03-22 17:28:35 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2011-06-15 11:19:50 -07:00
|
|
|
// TODO: Provide a function to write the standard ebml header.
|
2011-09-12 11:27:30 +02:00
|
|
|
fn start_tag(w: writer, tag_id: uint) {
|
2011-05-12 17:24:54 +02:00
|
|
|
// Write the tag ID:
|
2011-03-22 17:28:35 -07:00
|
|
|
|
2011-06-15 11:19:50 -07:00
|
|
|
write_vint(w.writer, tag_id);
|
2011-03-22 17:28:35 -07:00
|
|
|
// Write a placeholder four-byte size.
|
2011-06-15 11:19:50 -07:00
|
|
|
|
2011-08-19 15:16:48 -07:00
|
|
|
w.size_positions += [w.writer.tell()];
|
|
|
|
let zeroes: [u8] = [0u8, 0u8, 0u8, 0u8];
|
2011-03-22 17:28:35 -07:00
|
|
|
w.writer.write(zeroes);
|
|
|
|
}
|
|
|
|
|
2011-09-12 11:27:30 +02:00
|
|
|
fn end_tag(w: writer) {
|
2011-08-12 10:56:57 -07:00
|
|
|
let last_size_pos = vec::pop::<uint>(w.size_positions);
|
2011-07-27 14:19:39 +02:00
|
|
|
let cur_pos = w.writer.tell();
|
2011-08-11 19:14:38 -07:00
|
|
|
w.writer.seek(last_size_pos as int, io::seek_set);
|
2011-03-22 17:28:35 -07:00
|
|
|
write_sized_vint(w.writer, cur_pos - last_size_pos - 4u, 4u);
|
2011-08-11 19:14:38 -07:00
|
|
|
w.writer.seek(cur_pos as int, io::seek_set);
|
2011-03-22 17:28:35 -07:00
|
|
|
}
|
|
|
|
// TODO: optionally perform "relaxations" on end_tag to more efficiently
|
|
|
|
// encode sizes; this is a fixed point iteration
|