rust/src/comp/metadata/tydecode.rs

416 lines
12 KiB
Rust
Raw Normal View History

// Type decoding
2011-06-27 18:03:01 -05:00
2011-11-10 10:41:42 -06:00
import std::{vec, str, uint};
2011-09-12 18:13:28 -05:00
import std::option::{none, some};
import syntax::ast;
import syntax::ast::*;
import syntax::ast_util;
import syntax::ast_util::respan;
import middle::ty;
export parse_def_id;
export parse_ty_data;
// Compact string representation for ty::t values. API ty_str &
// parse_from_str. Extra parameters are for converting to/from def_ids in the
// data buffer. Whatever format you choose should not contain pipe characters.
// Callback used while decoding: it receives the textual form of a def id as
// read from the encoded data (see parse_def) and returns the ast::def_id it
// denotes.
type str_def = fn@(str) -> ast::def_id;
// Parser state threaded through every parse_* function in this file.
//   data:  the bytes being decoded.
//   crate: crate number; used here as the cnum of rcache keys.
//   pos:   index into data of the next byte to read; advanced as bytes are
//          consumed.
//   len:   length supplied by the caller of parse_ty_data (or by a '#'
//          back-reference); stored but not consulted by the parsers visible
//          in this file.
//   tcx:   type context in which decoded types are created.
type pstate =
{data: @[u8], crate: int, mutable pos: uint, len: uint, tcx: ty::ctxt};
fn peek(st: @pstate) -> u8 { ret st.data[st.pos]; }
2011-07-27 07:19:39 -05:00
fn next(st: @pstate) -> u8 {
let ch = st.data[st.pos];
st.pos = st.pos + 1u;
ret ch;
}
2011-07-27 07:19:39 -05:00
fn parse_ident(st: @pstate, sd: str_def, last: char) -> ast::ident {
fn is_last(b: char, c: char) -> bool { ret c == b; }
ret parse_ident_(st, sd, bind is_last(last, _));
}
fn parse_ident_(st: @pstate, _sd: str_def, is_last: fn@(char) -> bool) ->
2011-07-27 07:19:39 -05:00
ast::ident {
2011-09-02 17:34:58 -05:00
let rslt = "";
2011-07-27 07:19:39 -05:00
while !is_last(peek(st) as char) {
rslt += str::unsafe_from_byte(next(st));
}
ret rslt;
}
fn parse_ty_data(data: @[u8], crate_num: int, pos: uint, len: uint,
2011-07-27 07:19:39 -05:00
sd: str_def, tcx: ty::ctxt) -> ty::t {
let st =
@{data: data, crate: crate_num, mutable pos: pos, len: len, tcx: tcx};
let result = parse_ty(st, sd);
ret result;
}
fn parse_ret_ty(st: @pstate, sd: str_def) -> (ast::ret_style, ty::t) {
2011-07-27 07:19:39 -05:00
alt peek(st) as char {
'!' { next(st); (ast::noreturn, ty::mk_bot(st.tcx)) }
_ { (ast::return_val, parse_ty(st, sd)) }
}
}
// Decodes an optional list of function constraints. The list is present only
// when the next character is ':'; entries are separated by ';'. Returns an
// empty vector when no list is present.
fn parse_constrs(st: @pstate, sd: str_def) -> [@ty::constr] {
    let constrs: [@ty::constr] = [];
    if peek(st) as char == ':' {
        do {
            // Skip the ':' that opens the list, or the ';' between entries.
            next(st);
            constrs += [parse_constr::<uint>(st, sd, parse_constr_arg)];
        } while peek(st) as char == ';'
    }
    ret constrs;
}
// FIXME less copy-and-paste
// Decodes an optional list of type constraints, in the same layout as
// parse_constrs (':' opens the list, ';' separates entries) but with
// path-valued arguments.
fn parse_ty_constrs(st: @pstate, sd: str_def) -> [@ty::type_constr] {
    let constrs: [@ty::type_constr] = [];
    if peek(st) as char == ':' {
        do {
            // Skip the ':' that opens the list, or the ';' between entries.
            next(st);
            constrs += [parse_constr::<path>(st, sd, parse_ty_constr_arg)];
        } while peek(st) as char == ';'
    }
    ret constrs;
}
2011-07-27 07:19:39 -05:00
fn parse_path(st: @pstate, sd: str_def) -> ast::path {
let idents: [ast::ident] = [];
2011-07-27 07:19:39 -05:00
fn is_last(c: char) -> bool { ret c == '(' || c == ':'; }
idents += [parse_ident_(st, sd, is_last)];
2011-07-27 07:19:39 -05:00
while true {
alt peek(st) as char {
':' { next(st); next(st); }
c {
if c == '(' {
ret respan(ast_util::dummy_sp(),
{global: false, idents: idents, types: []});
} else { idents += [parse_ident_(st, sd, is_last)]; }
2011-07-27 07:19:39 -05:00
}
}
}
fail "parse_path: ill-formed path";
}
// Signature of the constraint-argument parsers handed to parse_constr: reads
// one argument from the parser state and returns it as a
// constr_arg_general_<T>.
type arg_parser<T> = fn(@pstate, str_def) -> ast::constr_arg_general_<T>;
2011-07-27 07:19:39 -05:00
fn parse_constr_arg(st: @pstate, _sd: str_def) -> ast::fn_constr_arg {
2011-07-27 07:19:39 -05:00
alt peek(st) as char {
'*' { st.pos += 1u; ret ast::carg_base; }
c {
/* how will we disambiguate between
an arg index and a lit argument? */
2011-07-27 07:19:39 -05:00
if c >= '0' && c <= '9' {
next(st);
2011-07-27 07:19:39 -05:00
// FIXME
ret ast::carg_ident((c as uint) - 48u);
} else {
log_err "Lit args are unimplemented";
fail; // FIXME
}
/*
else {
auto lit = parse_lit(st, sd, ',');
args += [respan(st.span, ast::carg_lit(lit))];
}
*/
}
}
}
2011-07-27 07:19:39 -05:00
fn parse_ty_constr_arg(st: @pstate, sd: str_def) ->
ast::constr_arg_general_<path> {
2011-07-27 07:19:39 -05:00
alt peek(st) as char {
'*' { st.pos += 1u; ret ast::carg_base; }
c { ret ast::carg_ident(parse_path(st, sd)); }
}
}
// Decodes a single constraint: a path, '(', a def id (terminated by '|', see
// parse_def), then one or more arguments separated by ';' and closed by ')'.
// Each argument is decoded by `pser`. All spans are dummy spans.
fn parse_constr<copy T>(st: @pstate, sd: str_def, pser: arg_parser<T>) ->
   @ty::constr_general<T> {
    let span = ast_util::dummy_sp(); // FIXME: use a real span
    let constr_path: path = parse_path(st, sd);
    let delim: char = next(st) as char;
    assert (delim == '(');
    let def_id = parse_def(st, sd);
    let parsed_args: [@sp_constr_arg<T>] = [];
    do {
        let arg: constr_arg_general_<T> = pser(st, sd);
        // FIXME use a real span
        parsed_args += [@respan(span, arg)];
        // Either the ';' before the next argument or the closing ')'.
        delim = next(st) as char;
    } while delim == ';'
    assert (delim == ')');
    ret @respan(span, {path: constr_path, args: parsed_args, id: def_id});
}
2011-07-27 07:19:39 -05:00
// Decodes one type from the stream, dispatching on its leading tag
// character, and returns the ty::t created in st.tcx.
//
// Tags handled:
//   n z b i u l c S Y   nil, bot, bool, int, uint, float, char, str, type
//   M<c>                machine type; <c> selects the width/signedness
//   t[<def>|<ty>*]      tag with type parameters
//   p<k><int>           type parameter; <k> is its kind (s, c or a)
//   @ ~ * I             box, unique, pointer, vec; each followed by an mt
//   R[<name>=<mt>*]     record
//   T[<ty>*]            tuple
//   F f B               shared, bare and block fns (see parse_ty_fn)
//   N                   native fn
//   O[...]              obj; each method is a proto char, a name and a fn
//   r[<def>|<ty><ty>*]  resource: def, inner type, type parameters
//   X<int>              type variable
//   E<def>|             native type
//   #<hex>:<hex>#       reference to a type encoded at pos:len in the same
//                       data, memoized in st.tcx.rcache
//   A[<ty><constrs>]    constrained type
//
// An unrecognized tag, machine-type selector, kind or method proto is logged
// and the task fails.
fn parse_ty(st: @pstate, sd: str_def) -> ty::t {
    alt next(st) as char {
      'n' { ret ty::mk_nil(st.tcx); }
      'z' { ret ty::mk_bot(st.tcx); }
      'b' { ret ty::mk_bool(st.tcx); }
      'i' { ret ty::mk_int(st.tcx); }
      'u' { ret ty::mk_uint(st.tcx); }
      'l' { ret ty::mk_float(st.tcx); }
      'M' {
        alt next(st) as char {
          'b' { ret ty::mk_mach(st.tcx, ast::ty_u8); }
          'w' { ret ty::mk_mach(st.tcx, ast::ty_u16); }
          'l' { ret ty::mk_mach(st.tcx, ast::ty_u32); }
          'd' { ret ty::mk_mach(st.tcx, ast::ty_u64); }
          'B' { ret ty::mk_mach(st.tcx, ast::ty_i8); }
          'W' { ret ty::mk_mach(st.tcx, ast::ty_i16); }
          'L' { ret ty::mk_mach(st.tcx, ast::ty_i32); }
          'D' { ret ty::mk_mach(st.tcx, ast::ty_i64); }
          'f' { ret ty::mk_mach(st.tcx, ast::ty_f32); }
          'F' { ret ty::mk_mach(st.tcx, ast::ty_f64); }
          c {
            // Report the offending selector rather than failing silently
            // out of a non-exhaustive alt.
            log_err "unexpected char in encoded machine type: ";
            log_err c;
            fail;
          }
        }
      }
      'c' { ret ty::mk_char(st.tcx); }
      'S' { ret ty::mk_str(st.tcx); }
      't' {
        assert (next(st) as char == '[');
        let def = parse_def(st, sd);
        let params: [ty::t] = [];
        while peek(st) as char != ']' { params += [parse_ty(st, sd)]; }
        st.pos = st.pos + 1u; // eat the ']'
        ret ty::mk_tag(st.tcx, def, params);
      }
      'p' {
        let k =
            alt next(st) as char {
              's' { kind_sendable }
              'c' { kind_copyable }
              'a' { kind_noncopyable }
              c {
                log_err "unexpected char in encoded type param: ";
                log_err c;
                fail
              }
            };
        ret ty::mk_param(st.tcx, parse_int(st) as uint, k);
      }
      '@' { ret ty::mk_box(st.tcx, parse_mt(st, sd)); }
      '~' { ret ty::mk_uniq(st.tcx, parse_mt(st, sd)); }
      '*' { ret ty::mk_ptr(st.tcx, parse_mt(st, sd)); }
      'I' { ret ty::mk_vec(st.tcx, parse_mt(st, sd)); }
      'R' {
        assert (next(st) as char == '[');
        let fields: [ty::field] = [];
        while peek(st) as char != ']' {
            // Field name runs up to the '=' that precedes its mt.
            let name = "";
            while peek(st) as char != '=' {
                name += str::unsafe_from_byte(next(st));
            }
            st.pos = st.pos + 1u; // eat the '='
            fields += [{ident: name, mt: parse_mt(st, sd)}];
        }
        st.pos = st.pos + 1u; // eat the ']'
        ret ty::mk_rec(st.tcx, fields);
      }
      'T' {
        assert (next(st) as char == '[');
        let params: [ty::t] = [];
        while peek(st) as char != ']' { params += [parse_ty(st, sd)]; }
        st.pos = st.pos + 1u; // eat the ']'
        ret ty::mk_tup(st.tcx, params);
      }
      'F' {
        let func = parse_ty_fn(st, sd);
        ret ty::mk_fn(st.tcx, ast::proto_shared(ast::sugar_normal),
                      func.args, func.ty, func.cf, func.cs);
      }
      'f' {
        let func = parse_ty_fn(st, sd);
        ret ty::mk_fn(st.tcx, ast::proto_bare, func.args, func.ty, func.cf,
                      func.cs);
      }
      'B' {
        let func = parse_ty_fn(st, sd);
        ret ty::mk_fn(st.tcx, ast::proto_block, func.args, func.ty, func.cf,
                      func.cs);
      }
      'N' {
        let func = parse_ty_fn(st, sd);
        ret ty::mk_native_fn(st.tcx, func.args, func.ty);
      }
      'O' {
        assert (next(st) as char == '[');
        let methods: [ty::method] = [];
        while peek(st) as char != ']' {
            let proto =
                alt next(st) as char {
                  'f' { ast::proto_bare }
                  c {
                    // Report the offending proto rather than failing
                    // silently out of a non-exhaustive alt.
                    log_err "unexpected char in encoded obj method proto: ";
                    log_err c;
                    fail
                  }
                };
            // Method name runs up to the '[' that opens its fn type.
            let name = "";
            while peek(st) as char != '[' {
                name += str::unsafe_from_byte(next(st));
            }
            let func = parse_ty_fn(st, sd);
            methods +=
                [{proto: proto,
                  ident: name,
                  inputs: func.args,
                  output: func.ty,
                  cf: func.cf,
                  constrs: func.cs}];
        }
        st.pos += 1u; // eat the ']'
        ret ty::mk_obj(st.tcx, methods);
      }
      'r' {
        assert (next(st) as char == '[');
        let def = parse_def(st, sd);
        let inner = parse_ty(st, sd);
        let params: [ty::t] = [];
        while peek(st) as char != ']' { params += [parse_ty(st, sd)]; }
        st.pos = st.pos + 1u; // eat the ']'
        ret ty::mk_res(st.tcx, def, inner, params);
      }
      'X' { ret ty::mk_var(st.tcx, parse_int(st)); }
      'E' { let def = parse_def(st, sd); ret ty::mk_native(st.tcx, def); }
      'Y' { ret ty::mk_type(st.tcx); }
      '#' {
        let pos = parse_hex(st);
        assert (next(st) as char == ':');
        let len = parse_hex(st);
        assert (next(st) as char == '#');
        alt st.tcx.rcache.find({cnum: st.crate, pos: pos, len: len}) {
          some(tt) { ret tt; }
          none. {
            // Decode the referenced type with a separate state positioned
            // at pos, then remember the result for later references.
            let ps = @{pos: pos, len: len with *st};
            let tt = parse_ty(ps, sd);
            st.tcx.rcache.insert({cnum: st.crate, pos: pos, len: len}, tt);
            ret tt;
          }
        }
      }
      'A' {
        assert (next(st) as char == '[');
        let tt = parse_ty(st, sd);
        let tcs = parse_ty_constrs(st, sd);
        assert (next(st) as char == ']');
        ret ty::mk_constr(st.tcx, tt, tcs);
      }
      c { log_err "unexpected char in type string: "; log_err c; fail; }
    }
}
2011-07-27 07:19:39 -05:00
fn parse_mt(st: @pstate, sd: str_def) -> ty::mt {
let mut;
alt peek(st) as char {
'm' { next(st); mut = ast::mut; }
'?' { next(st); mut = ast::maybe_mut; }
_ { mut = ast::imm; }
}
2011-07-27 07:19:39 -05:00
ret {ty: parse_ty(st, sd), mut: mut};
}
2011-07-27 07:19:39 -05:00
fn parse_def(st: @pstate, sd: str_def) -> ast::def_id {
2011-09-02 17:34:58 -05:00
let def = "";
while peek(st) as char != '|' { def += str::unsafe_from_byte(next(st)); }
st.pos = st.pos + 1u;
ret sd(def);
}
2011-07-27 07:19:39 -05:00
fn parse_int(st: @pstate) -> int {
let n = 0;
while true {
let cur = peek(st) as char;
if cur < '0' || cur > '9' { break; }
st.pos = st.pos + 1u;
n *= 10;
n += (cur as int) - ('0' as int);
}
ret n;
}
2011-07-27 07:19:39 -05:00
fn parse_hex(st: @pstate) -> uint {
let n = 0u;
while true {
let cur = peek(st) as char;
if (cur < '0' || cur > '9') && (cur < 'a' || cur > 'f') { break; }
st.pos = st.pos + 1u;
n *= 16u;
2011-07-27 07:19:39 -05:00
if '0' <= cur && cur <= '9' {
n += (cur as uint) - ('0' as uint);
} else { n += 10u + (cur as uint) - ('a' as uint); }
}
ret n;
}
2011-07-27 07:19:39 -05:00
// Decodes the body of a function type: '[' followed by the arguments, each a
// mode character and a type, then ']', an optional constraint list (see
// parse_constrs) and the return type (see parse_ret_ty).
//
// Mode characters: '&' by_mut_ref, '-' by_move, '+' by_copy, '=' by_ref,
// '#' by_val. Any other mode character is logged and the task fails.
//
// Returns the pieces as a record: args, ty (return type), cf (return style)
// and cs (constraints).
fn parse_ty_fn(st: @pstate, sd: str_def) ->
   {args: [ty::arg], ty: ty::t, cf: ast::ret_style, cs: [@ty::constr]} {
    assert (next(st) as char == '[');
    let inputs: [ty::arg] = [];
    while peek(st) as char != ']' {
        let mode =
            alt peek(st) as char {
              '&' { ast::by_mut_ref }
              '-' { ast::by_move }
              '+' { ast::by_copy }
              '=' { ast::by_ref }
              '#' { ast::by_val }
              c {
                // Report the offending mode rather than failing silently
                // out of a non-exhaustive alt.
                log_err "unexpected char in encoded argument mode: ";
                log_err c;
                fail
              }
            };
        st.pos += 1u; // eat the mode character
        inputs += [{mode: mode, ty: parse_ty(st, sd)}];
    }
    st.pos += 1u; // eat the ']'
    let cs = parse_constrs(st, sd);
    let (ret_style, ret_ty) = parse_ret_ty(st, sd);
    ret {args: inputs, ty: ret_ty, cf: ret_style, cs: cs};
}
// Rust metadata parsing
fn parse_def_id(buf: [u8]) -> ast::def_id {
2011-07-27 07:19:39 -05:00
let colon_idx = 0u;
let len = vec::len::<u8>(buf);
while colon_idx < len && buf[colon_idx] != ':' as u8 { colon_idx += 1u; }
2011-07-27 07:19:39 -05:00
if colon_idx == len {
log_err "didn't find ':' when parsing def id";
fail;
}
let crate_part = vec::slice::<u8>(buf, 0u, colon_idx);
let def_part = vec::slice::<u8>(buf, colon_idx + 1u, len);
let crate_part_vec = [];
let def_part_vec = [];
for b: u8 in crate_part { crate_part_vec += [b]; }
for b: u8 in def_part { def_part_vec += [b]; }
2011-07-27 07:19:39 -05:00
let crate_num = uint::parse_buf(crate_part_vec, 10u) as int;
let def_num = uint::parse_buf(def_part_vec, 10u) as int;
ret {crate: crate_num, node: def_num};
}
//
// Local Variables:
// mode: rust
// fill-column: 78;
// indent-tabs-mode: nil
// c-basic-offset: 4
// buffer-file-coding-system: utf-8-unix
// End:
//