// Type decoding import syntax::ast; import syntax::ast::*; import syntax::ast_util; import syntax::ast_util::respan; import middle::ty; import std::map::hashmap; export parse_ty_data, parse_def_id, parse_ident; export parse_bounds_data; // Compact string representation for ty::t values. API ty_str & // parse_from_str. Extra parameters are for converting to/from def_ids in the // data buffer. Whatever format you choose should not contain pipe characters. // Callback to translate defs to strs or back: type conv_did = fn(ast::def_id) -> ast::def_id; type pstate = {data: @[u8], crate: int, mut pos: uint, tcx: ty::ctxt}; fn peek(st: @pstate) -> char { st.data[st.pos] as char } fn next(st: @pstate) -> char { let ch = st.data[st.pos] as char; st.pos = st.pos + 1u; ret ch; } fn next_byte(st: @pstate) -> u8 { let b = st.data[st.pos]; st.pos = st.pos + 1u; ret b; } fn parse_ident(st: @pstate, last: char) -> ast::ident { fn is_last(b: char, c: char) -> bool { ret c == b; } ret parse_ident_(st, bind is_last(last, _)); } fn parse_ident_(st: @pstate, is_last: fn@(char) -> bool) -> ast::ident { let mut rslt = ""; while !is_last(peek(st)) { rslt += str::from_byte(next_byte(st)); } ret rslt; } fn parse_ty_data(data: @[u8], crate_num: int, pos: uint, tcx: ty::ctxt, conv: conv_did) -> ty::t { let st = @{data: data, crate: crate_num, mut pos: pos, tcx: tcx}; parse_ty(st, conv) } fn parse_ret_ty(st: @pstate, conv: conv_did) -> (ast::ret_style, ty::t) { alt peek(st) { '!' { next(st); (ast::noreturn, ty::mk_bot(st.tcx)) } _ { (ast::return_val, parse_ty(st, conv)) } } } fn parse_constrs(st: @pstate, conv: conv_did) -> [@ty::constr] { let mut rslt: [@ty::constr] = []; alt peek(st) { ':' { do { next(st); rslt += [parse_constr(st, conv, parse_constr_arg)]; } while peek(st) == ';' } _ { } } ret rslt; } // FIXME less copy-and-paste fn parse_ty_constrs(st: @pstate, conv: conv_did) -> [@ty::type_constr] { let mut rslt: [@ty::type_constr] = []; alt peek(st) { ':' { do { next(st); rslt += [parse_constr(st, conv, parse_ty_constr_arg)]; } while peek(st) == ';' } _ { } } ret rslt; } fn parse_path(st: @pstate) -> @ast::path { let mut idents: [ast::ident] = []; fn is_last(c: char) -> bool { ret c == '(' || c == ':'; } idents += [parse_ident_(st, is_last)]; loop { alt peek(st) { ':' { next(st); next(st); } c { if c == '(' { ret @respan(ast_util::dummy_sp(), {global: false, idents: idents, types: []}); } else { idents += [parse_ident_(st, is_last)]; } } } }; } fn parse_constr_arg(st: @pstate) -> ast::fn_constr_arg { alt peek(st) { '*' { st.pos += 1u; ret ast::carg_base; } c { /* how will we disambiguate between an arg index and a lit argument? */ if c >= '0' && c <= '9' { next(st); // FIXME ret ast::carg_ident((c as uint) - 48u); } else { #error("Lit args are unimplemented"); fail; // FIXME } /* else { auto lit = parse_lit(st, conv, ','); args += [respan(st.span, ast::carg_lit(lit))]; } */ } } } fn parse_ty_constr_arg(st: @pstate) -> ast::constr_arg_general_<@path> { alt peek(st) { '*' { st.pos += 1u; ret ast::carg_base; } c { ret ast::carg_ident(parse_path(st)); } } } fn parse_constr(st: @pstate, conv: conv_did, pser: fn(@pstate) -> ast::constr_arg_general_) -> @ty::constr_general { let sp = ast_util::dummy_sp(); // FIXME: use a real span let mut args: [@sp_constr_arg] = []; let pth = parse_path(st); let mut ignore: char = next(st); assert (ignore == '('); let def = parse_def(st, conv); let mut an_arg: constr_arg_general_; do { an_arg = pser(st); // FIXME use a real span args += [@respan(sp, an_arg)]; ignore = next(st); } while ignore == ';' assert (ignore == ')'); ret @respan(sp, {path: pth, args: args, id: def}); } fn parse_ty_rust_fn(st: @pstate, conv: conv_did, p: ast::proto) -> ty::t { ret ty::mk_fn(st.tcx, {proto: p with parse_ty_fn(st, conv)}); } fn parse_proto(c: char) -> ast::proto { alt c { '~' { ast::proto_uniq } '@' { ast::proto_box } '*' { ast::proto_any } '&' { ast::proto_block } 'n' { ast::proto_bare } _ { fail "illegal fn type kind " + str::from_char(c); } } } fn parse_ty(st: @pstate, conv: conv_did) -> ty::t { alt check next(st) { 'n' { ret ty::mk_nil(st.tcx); } 'z' { ret ty::mk_bot(st.tcx); } 'b' { ret ty::mk_bool(st.tcx); } 'i' { ret ty::mk_int(st.tcx); } 'u' { ret ty::mk_uint(st.tcx); } 'l' { ret ty::mk_float(st.tcx); } 'M' { alt check next(st) { 'b' { ret ty::mk_mach_uint(st.tcx, ast::ty_u8); } 'w' { ret ty::mk_mach_uint(st.tcx, ast::ty_u16); } 'l' { ret ty::mk_mach_uint(st.tcx, ast::ty_u32); } 'd' { ret ty::mk_mach_uint(st.tcx, ast::ty_u64); } 'B' { ret ty::mk_mach_int(st.tcx, ast::ty_i8); } 'W' { ret ty::mk_mach_int(st.tcx, ast::ty_i16); } 'L' { ret ty::mk_mach_int(st.tcx, ast::ty_i32); } 'D' { ret ty::mk_mach_int(st.tcx, ast::ty_i64); } 'f' { ret ty::mk_mach_float(st.tcx, ast::ty_f32); } 'F' { ret ty::mk_mach_float(st.tcx, ast::ty_f64); } } } 'c' { ret ty::mk_char(st.tcx); } 'S' { ret ty::mk_str(st.tcx); } 't' { assert (next(st) == '['); let def = parse_def(st, conv); let mut params: [ty::t] = []; while peek(st) != ']' { params += [parse_ty(st, conv)]; } st.pos = st.pos + 1u; ret ty::mk_enum(st.tcx, def, params); } 'x' { assert (next(st) == '['); let def = parse_def(st, conv); let mut params: [ty::t] = []; while peek(st) != ']' { params += [parse_ty(st, conv)]; } st.pos = st.pos + 1u; ret ty::mk_iface(st.tcx, def, params); } 'p' { let did = parse_def(st, conv); ret ty::mk_param(st.tcx, parse_int(st) as uint, did); } 's' { assert next(st) == '['; let mut params = []; while peek(st) != ']' { params += [parse_ty(st, conv)]; } st.pos += 1u; ret ty::mk_self(st.tcx, params); } '@' { ret ty::mk_box(st.tcx, parse_mt(st, conv)); } '~' { ret ty::mk_uniq(st.tcx, parse_mt(st, conv)); } '*' { ret ty::mk_ptr(st.tcx, parse_mt(st, conv)); } 'I' { ret ty::mk_vec(st.tcx, parse_mt(st, conv)); } 'R' { assert (next(st) == '['); let mut fields: [ty::field] = []; while peek(st) != ']' { let mut name = ""; while peek(st) != '=' { name += str::from_byte(next_byte(st)); } st.pos = st.pos + 1u; fields += [{ident: name, mt: parse_mt(st, conv)}]; } st.pos = st.pos + 1u; ret ty::mk_rec(st.tcx, fields); } 'T' { assert (next(st) == '['); let mut params = []; while peek(st) != ']' { params += [parse_ty(st, conv)]; } st.pos = st.pos + 1u; ret ty::mk_tup(st.tcx, params); } 'f' { let proto = parse_proto(next(st)); parse_ty_rust_fn(st, conv, proto) } 'r' { assert (next(st) == '['); let def = parse_def(st, conv); let inner = parse_ty(st, conv); let mut params: [ty::t] = []; while peek(st) != ']' { params += [parse_ty(st, conv)]; } st.pos = st.pos + 1u; ret ty::mk_res(st.tcx, def, inner, params); } 'X' { ret ty::mk_var(st.tcx, ty::ty_vid(parse_int(st) as uint)); } 'Y' { ret ty::mk_type(st.tcx); } 'C' { let ck = alt check next(st) { '&' { ty::ck_block } '@' { ty::ck_box } '~' { ty::ck_uniq } }; ret ty::mk_opaque_closure_ptr(st.tcx, ck); } '#' { let pos = parse_hex(st); assert (next(st) == ':'); let len = parse_hex(st); assert (next(st) == '#'); alt st.tcx.rcache.find({cnum: st.crate, pos: pos, len: len}) { some(tt) { ret tt; } none { let ps = @{pos: pos with *st}; let tt = parse_ty(ps, conv); st.tcx.rcache.insert({cnum: st.crate, pos: pos, len: len}, tt); ret tt; } } } 'A' { assert (next(st) == '['); let tt = parse_ty(st, conv); let tcs = parse_ty_constrs(st, conv); assert (next(st) == ']'); ret ty::mk_constr(st.tcx, tt, tcs); } '"' { let def = parse_def(st, conv); let inner = parse_ty(st, conv); ty::mk_with_id(st.tcx, inner, def) } 'B' { ty::mk_opaque_box(st.tcx) } 'a' { #debug("saw a class"); assert (next(st) == '['); #debug("saw a ["); let did = parse_def(st, conv); #debug("parsed a def_id %?", did); let mut params: [ty::t] = []; while peek(st) != ']' { params += [parse_ty(st, conv)]; } assert (next(st) == ']'); ret ty::mk_class(st.tcx, did, params); } c { #error("unexpected char in type string: %c", c); fail;} } } fn parse_mt(st: @pstate, conv: conv_did) -> ty::mt { let mut m; alt peek(st) { 'm' { next(st); m = ast::m_mutbl; } '?' { next(st); m = ast::m_const; } _ { m = ast::m_imm; } } ret {ty: parse_ty(st, conv), mutbl: m}; } fn parse_def(st: @pstate, conv: conv_did) -> ast::def_id { let mut def = []; while peek(st) != '|' { def += [next_byte(st)]; } st.pos = st.pos + 1u; ret conv(parse_def_id(def)); } fn parse_int(st: @pstate) -> int { let mut n = 0; loop { let cur = peek(st); if cur < '0' || cur > '9' { ret n; } st.pos = st.pos + 1u; n *= 10; n += (cur as int) - ('0' as int); }; } fn parse_hex(st: @pstate) -> uint { let mut n = 0u; loop { let cur = peek(st); if (cur < '0' || cur > '9') && (cur < 'a' || cur > 'f') { ret n; } st.pos = st.pos + 1u; n *= 16u; if '0' <= cur && cur <= '9' { n += (cur as uint) - ('0' as uint); } else { n += 10u + (cur as uint) - ('a' as uint); } }; } fn parse_ty_fn(st: @pstate, conv: conv_did) -> ty::fn_ty { assert (next(st) == '['); let mut inputs: [ty::arg] = []; while peek(st) != ']' { let mode = alt check peek(st) { '&' { ast::by_mutbl_ref } '-' { ast::by_move } '+' { ast::by_copy } '=' { ast::by_ref } '#' { ast::by_val } }; st.pos += 1u; inputs += [{mode: ast::expl(mode), ty: parse_ty(st, conv)}]; } st.pos += 1u; // eat the ']' let cs = parse_constrs(st, conv); let (ret_style, ret_ty) = parse_ret_ty(st, conv); ret {proto: ast::proto_bare, inputs: inputs, output: ret_ty, ret_style: ret_style, constraints: cs}; } // Rust metadata parsing fn parse_def_id(buf: [u8]) -> ast::def_id { let mut colon_idx = 0u; let len = vec::len(buf); while colon_idx < len && buf[colon_idx] != ':' as u8 { colon_idx += 1u; } if colon_idx == len { #error("didn't find ':' when parsing def id"); fail; } let crate_part = vec::slice(buf, 0u, colon_idx); let def_part = vec::slice(buf, colon_idx + 1u, len); let crate_num = alt uint::parse_buf(crate_part, 10u) { some(cn) { cn as int } none { fail (#fmt("internal error: parse_def_id: error parsing %? \ as crate", crate_part)); } }; let def_num = alt uint::parse_buf(def_part, 10u) { some(dn) { dn as int } none { fail (#fmt("internal error: parse_def_id: error parsing %? \ as id", def_part)); } }; ret {crate: crate_num, node: def_num}; } fn parse_bounds_data(data: @[u8], start: uint, crate_num: int, tcx: ty::ctxt, conv: conv_did) -> @[ty::param_bound] { let st = @{data: data, crate: crate_num, mut pos: start, tcx: tcx}; parse_bounds(st, conv) } fn parse_bounds(st: @pstate, conv: conv_did) -> @[ty::param_bound] { let mut bounds = []; loop { bounds += [alt check next(st) { 'S' { ty::bound_send } 'C' { ty::bound_copy } 'I' { ty::bound_iface(parse_ty(st, conv)) } '.' { break; } }]; } @bounds } // // Local Variables: // mode: rust // fill-column: 78; // indent-tabs-mode: nil // c-basic-offset: 4 // buffer-file-coding-system: utf-8-unix // End: //