// Copyright 2012-2014 The Rust Project Developers. See the COPYRIGHT // file at the top-level directory of this distribution and at // http://rust-lang.org/COPYRIGHT. // // Licensed under the Apache License, Version 2.0 or the MIT license // , at your // option. This file may not be copied, modified, or distributed // except according to those terms. // Type decoding // tjc note: Would be great to have a `match check` macro equivalent // for some of these #![allow(non_camel_case_types)] use middle::subst; use middle::subst::VecPerParamSpace; use middle::ty; use std::rc::Rc; use std::str; use std::string::String; use std::uint; use syntax::abi; use syntax::ast; use syntax::ast::*; use syntax::parse::token; // Compact string representation for ty::t values. API ty_str & // parse_from_str. Extra parameters are for converting to/from def_ids in the // data buffer. Whatever format you choose should not contain pipe characters. // Def id conversion: when we encounter def-ids, they have to be translated. // For example, the crate number must be converted from the crate number used // in the library we are reading from into the local crate numbers in use // here. To perform this translation, the type decoder is supplied with a // conversion function of type `conv_did`. // // Sometimes, particularly when inlining, the correct translation of the // def-id will depend on where it originated from. Therefore, the conversion // function is given an indicator of the source of the def-id. See // astencode.rs for more information. pub enum DefIdSource { // Identifies a struct, trait, enum, etc. NominalType, // Identifies a type alias (`type X = ...`). TypeWithId, // Identifies a type parameter (`fn foo() { ... }`). TypeParameter, // Identifies a region parameter (`fn foo<'X>() { ... }`). RegionParameter, } pub type conv_did<'a> = |source: DefIdSource, ast::DefId|: 'a -> ast::DefId; pub struct PState<'a> { data: &'a [u8], krate: ast::CrateNum, pos: uint, tcx: &'a ty::ctxt } fn peek(st: &PState) -> char { st.data[st.pos] as char } fn next(st: &mut PState) -> char { let ch = st.data[st.pos] as char; st.pos = st.pos + 1u; return ch; } fn next_byte(st: &mut PState) -> u8 { let b = st.data[st.pos]; st.pos = st.pos + 1u; return b; } fn scan(st: &mut PState, is_last: |char| -> bool, op: |&[u8]| -> R) -> R { let start_pos = st.pos; debug!("scan: '{}' (start)", st.data[st.pos] as char); while !is_last(st.data[st.pos] as char) { st.pos += 1; debug!("scan: '{}'", st.data[st.pos] as char); } let end_pos = st.pos; st.pos += 1; return op(st.data.slice(start_pos, end_pos)); } pub fn parse_ident(st: &mut PState, last: char) -> ast::Ident { fn is_last(b: char, c: char) -> bool { return c == b; } return parse_ident_(st, |a| is_last(last, a) ); } fn parse_ident_(st: &mut PState, is_last: |char| -> bool) -> ast::Ident { scan(st, is_last, |bytes| { token::str_to_ident(str::from_utf8(bytes).unwrap()) }) } pub fn parse_state_from_data<'a>(data: &'a [u8], crate_num: ast::CrateNum, pos: uint, tcx: &'a ty::ctxt) -> PState<'a> { PState { data: data, krate: crate_num, pos: pos, tcx: tcx } } fn data_log_string(data: &[u8], pos: uint) -> String { let mut buf = String::new(); buf.push_str("<<"); for i in range(pos, data.len()) { let c = data[i]; if c > 0x20 && c <= 0x7F { buf.push_char(c as char); } else { buf.push_char('.'); } } buf.push_str(">>"); buf } pub fn parse_ty_data(data: &[u8], crate_num: ast::CrateNum, pos: uint, tcx: &ty::ctxt, conv: conv_did) -> ty::t { debug!("parse_ty_data {}", data_log_string(data, pos)); let mut st = parse_state_from_data(data, crate_num, pos, tcx); parse_ty(&mut st, conv) } pub fn parse_bare_fn_ty_data(data: &[u8], crate_num: ast::CrateNum, pos: uint, tcx: &ty::ctxt, conv: conv_did) -> ty::BareFnTy { debug!("parse_bare_fn_ty_data {}", data_log_string(data, pos)); let mut st = parse_state_from_data(data, crate_num, pos, tcx); parse_bare_fn_ty(&mut st, conv) } pub fn parse_trait_ref_data(data: &[u8], crate_num: ast::CrateNum, pos: uint, tcx: &ty::ctxt, conv: conv_did) -> ty::TraitRef { debug!("parse_trait_ref_data {}", data_log_string(data, pos)); let mut st = parse_state_from_data(data, crate_num, pos, tcx); parse_trait_ref(&mut st, conv) } pub fn parse_substs_data(data: &[u8], crate_num: ast::CrateNum, pos: uint, tcx: &ty::ctxt, conv: conv_did) -> subst::Substs { debug!("parse_substs_data {}", data_log_string(data, pos)); let mut st = parse_state_from_data(data, crate_num, pos, tcx); parse_substs(&mut st, conv) } fn parse_size(st: &mut PState) -> Option { assert_eq!(next(st), '/'); if peek(st) == '|' { assert_eq!(next(st), '|'); None } else { let n = parse_uint(st); assert_eq!(next(st), '|'); Some(n) } } fn parse_trait_store(st: &mut PState, conv: conv_did) -> ty::TraitStore { match next(st) { '~' => ty::UniqTraitStore, '&' => ty::RegionTraitStore(parse_region(st, conv), parse_mutability(st)), c => { st.tcx.sess.bug(format!("parse_trait_store(): bad input '{}'", c).as_slice()) } } } fn parse_vec_per_param_space(st: &mut PState, f: |&mut PState| -> T) -> VecPerParamSpace { let mut r = VecPerParamSpace::empty(); for &space in subst::ParamSpace::all().iter() { assert_eq!(next(st), '['); while peek(st) != ']' { r.push(space, f(st)); } assert_eq!(next(st), ']'); } r } fn parse_substs(st: &mut PState, conv: conv_did) -> subst::Substs { let regions = parse_region_substs(st, |x,y| conv(x,y)); let types = parse_vec_per_param_space(st, |st| parse_ty(st, |x,y| conv(x,y))); return subst::Substs { types: types, regions: regions }; } fn parse_region_substs(st: &mut PState, conv: conv_did) -> subst::RegionSubsts { match next(st) { 'e' => subst::ErasedRegions, 'n' => { subst::NonerasedRegions( parse_vec_per_param_space( st, |st| parse_region(st, |x,y| conv(x,y)))) } _ => fail!("parse_bound_region: bad input") } } fn parse_bound_region(st: &mut PState, conv: conv_did) -> ty::BoundRegion { match next(st) { 'a' => { let id = parse_uint(st); assert_eq!(next(st), '|'); ty::BrAnon(id) } '[' => { let def = parse_def(st, RegionParameter, |x,y| conv(x,y)); let ident = token::str_to_ident(parse_str(st, ']').as_slice()); ty::BrNamed(def, ident.name) } 'f' => { let id = parse_uint(st); assert_eq!(next(st), '|'); ty::BrFresh(id) } _ => fail!("parse_bound_region: bad input") } } fn parse_region(st: &mut PState, conv: conv_did) -> ty::Region { match next(st) { 'b' => { assert_eq!(next(st), '['); let id = parse_uint(st) as ast::NodeId; assert_eq!(next(st), '|'); let br = parse_bound_region(st, |x,y| conv(x,y)); assert_eq!(next(st), ']'); ty::ReLateBound(id, br) } 'B' => { assert_eq!(next(st), '['); let node_id = parse_uint(st) as ast::NodeId; assert_eq!(next(st), '|'); let space = parse_param_space(st); assert_eq!(next(st), '|'); let index = parse_uint(st); assert_eq!(next(st), '|'); let nm = token::str_to_ident(parse_str(st, ']').as_slice()); ty::ReEarlyBound(node_id, space, index, nm.name) } 'f' => { assert_eq!(next(st), '['); let id = parse_uint(st) as ast::NodeId; assert_eq!(next(st), '|'); let br = parse_bound_region(st, |x,y| conv(x,y)); assert_eq!(next(st), ']'); ty::ReFree(ty::FreeRegion {scope_id: id, bound_region: br}) } 's' => { let id = parse_uint(st) as ast::NodeId; assert_eq!(next(st), '|'); ty::ReScope(id) } 't' => { ty::ReStatic } 'e' => { ty::ReStatic } _ => fail!("parse_region: bad input") } } fn parse_opt(st: &mut PState, f: |&mut PState| -> T) -> Option { match next(st) { 'n' => None, 's' => Some(f(st)), _ => fail!("parse_opt: bad input") } } fn parse_str(st: &mut PState, term: char) -> String { let mut result = String::new(); while peek(st) != term { unsafe { result.push_bytes([next_byte(st)]) } } next(st); result } fn parse_trait_ref(st: &mut PState, conv: conv_did) -> ty::TraitRef { let def = parse_def(st, NominalType, |x,y| conv(x,y)); let substs = parse_substs(st, |x,y| conv(x,y)); ty::TraitRef {def_id: def, substs: substs} } fn parse_ty(st: &mut PState, conv: conv_did) -> ty::t { match next(st) { 'n' => return ty::mk_nil(), 'z' => return ty::mk_bot(), 'b' => return ty::mk_bool(), 'i' => return ty::mk_int(), 'u' => return ty::mk_uint(), 'M' => { match next(st) { 'b' => return ty::mk_mach_uint(ast::TyU8), 'w' => return ty::mk_mach_uint(ast::TyU16), 'l' => return ty::mk_mach_uint(ast::TyU32), 'd' => return ty::mk_mach_uint(ast::TyU64), 'B' => return ty::mk_mach_int(ast::TyI8), 'W' => return ty::mk_mach_int(ast::TyI16), 'L' => return ty::mk_mach_int(ast::TyI32), 'D' => return ty::mk_mach_int(ast::TyI64), 'f' => return ty::mk_mach_float(ast::TyF32), 'F' => return ty::mk_mach_float(ast::TyF64), _ => fail!("parse_ty: bad numeric type") } } 'c' => return ty::mk_char(), 't' => { assert_eq!(next(st), '['); let def = parse_def(st, NominalType, |x,y| conv(x,y)); let substs = parse_substs(st, |x,y| conv(x,y)); assert_eq!(next(st), ']'); return ty::mk_enum(st.tcx, def, substs); } 'x' => { assert_eq!(next(st), '['); let def = parse_def(st, NominalType, |x,y| conv(x,y)); let substs = parse_substs(st, |x,y| conv(x,y)); let bounds = parse_bounds(st, |x,y| conv(x,y)); assert_eq!(next(st), ']'); return ty::mk_trait(st.tcx, def, substs, bounds.builtin_bounds); } 'p' => { let did = parse_def(st, TypeParameter, |x,y| conv(x,y)); debug!("parsed ty_param: did={:?}", did); let index = parse_uint(st); assert_eq!(next(st), '|'); let space = parse_param_space(st); assert_eq!(next(st), '|'); return ty::mk_param(st.tcx, space, index, did); } '@' => return ty::mk_box(st.tcx, parse_ty(st, |x,y| conv(x,y))), '~' => return ty::mk_uniq(st.tcx, parse_ty(st, |x,y| conv(x,y))), '*' => return ty::mk_ptr(st.tcx, parse_mt(st, |x,y| conv(x,y))), '&' => { let r = parse_region(st, |x,y| conv(x,y)); let mt = parse_mt(st, |x,y| conv(x,y)); return ty::mk_rptr(st.tcx, r, mt); } 'V' => { let mt = parse_mt(st, |x,y| conv(x,y)); let sz = parse_size(st); return ty::mk_vec(st.tcx, mt, sz); } 'v' => { return ty::mk_str(st.tcx); } 'T' => { assert_eq!(next(st), '['); let mut params = Vec::new(); while peek(st) != ']' { params.push(parse_ty(st, |x,y| conv(x,y))); } st.pos = st.pos + 1u; return ty::mk_tup(st.tcx, params); } 'f' => { return ty::mk_closure(st.tcx, parse_closure_ty(st, |x,y| conv(x,y))); } 'F' => { return ty::mk_bare_fn(st.tcx, parse_bare_fn_ty(st, |x,y| conv(x,y))); } '#' => { let pos = parse_hex(st); assert_eq!(next(st), ':'); let len = parse_hex(st); assert_eq!(next(st), '#'); let key = ty::creader_cache_key {cnum: st.krate, pos: pos, len: len }; match st.tcx.rcache.borrow().find_copy(&key) { Some(tt) => return tt, None => {} } let mut ps = PState { pos: pos, .. *st }; let tt = parse_ty(&mut ps, |x,y| conv(x,y)); st.tcx.rcache.borrow_mut().insert(key, tt); return tt; } '"' => { let _ = parse_def(st, TypeWithId, |x,y| conv(x,y)); let inner = parse_ty(st, |x,y| conv(x,y)); inner } 'a' => { assert_eq!(next(st), '['); let did = parse_def(st, NominalType, |x,y| conv(x,y)); let substs = parse_substs(st, |x,y| conv(x,y)); assert_eq!(next(st), ']'); return ty::mk_struct(st.tcx, did, substs); } 'e' => { return ty::mk_err(); } c => { fail!("unexpected char in type string: {}", c);} } } fn parse_mutability(st: &mut PState) -> ast::Mutability { match peek(st) { 'm' => { next(st); ast::MutMutable } _ => { ast::MutImmutable } } } fn parse_mt(st: &mut PState, conv: conv_did) -> ty::mt { let m = parse_mutability(st); ty::mt { ty: parse_ty(st, |x,y| conv(x,y)), mutbl: m } } fn parse_def(st: &mut PState, source: DefIdSource, conv: conv_did) -> ast::DefId { return conv(source, scan(st, |c| { c == '|' }, parse_def_id)); } fn parse_uint(st: &mut PState) -> uint { let mut n = 0; loop { let cur = peek(st); if cur < '0' || cur > '9' { return n; } st.pos = st.pos + 1u; n *= 10; n += (cur as uint) - ('0' as uint); }; } fn parse_param_space(st: &mut PState) -> subst::ParamSpace { subst::ParamSpace::from_uint(parse_uint(st)) } fn parse_hex(st: &mut PState) -> uint { let mut n = 0u; loop { let cur = peek(st); if (cur < '0' || cur > '9') && (cur < 'a' || cur > 'f') { return n; } st.pos = st.pos + 1u; n *= 16u; if '0' <= cur && cur <= '9' { n += (cur as uint) - ('0' as uint); } else { n += 10u + (cur as uint) - ('a' as uint); } }; } fn parse_fn_style(c: char) -> FnStyle { match c { 'u' => UnsafeFn, 'n' => NormalFn, _ => fail!("parse_fn_style: bad fn_style {}", c) } } fn parse_abi_set(st: &mut PState) -> abi::Abi { assert_eq!(next(st), '['); scan(st, |c| c == ']', |bytes| { let abi_str = str::from_utf8(bytes).unwrap(); abi::lookup(abi_str.as_slice()).expect(abi_str) }) } fn parse_onceness(c: char) -> ast::Onceness { match c { 'o' => ast::Once, 'm' => ast::Many, _ => fail!("parse_onceness: bad onceness") } } fn parse_closure_ty(st: &mut PState, conv: conv_did) -> ty::ClosureTy { let fn_style = parse_fn_style(next(st)); let onceness = parse_onceness(next(st)); let store = parse_trait_store(st, |x,y| conv(x,y)); let bounds = parse_bounds(st, |x,y| conv(x,y)); let sig = parse_sig(st, |x,y| conv(x,y)); ty::ClosureTy { fn_style: fn_style, onceness: onceness, store: store, bounds: bounds.builtin_bounds, sig: sig } } fn parse_bare_fn_ty(st: &mut PState, conv: conv_did) -> ty::BareFnTy { let fn_style = parse_fn_style(next(st)); let abi = parse_abi_set(st); let sig = parse_sig(st, |x,y| conv(x,y)); ty::BareFnTy { fn_style: fn_style, abi: abi, sig: sig } } fn parse_sig(st: &mut PState, conv: conv_did) -> ty::FnSig { assert_eq!(next(st), '['); let id = parse_uint(st) as ast::NodeId; assert_eq!(next(st), '|'); let mut inputs = Vec::new(); while peek(st) != ']' { inputs.push(parse_ty(st, |x,y| conv(x,y))); } st.pos += 1u; // eat the ']' let variadic = match next(st) { 'V' => true, 'N' => false, r => fail!(format!("bad variadic: {}", r)), }; let ret_ty = parse_ty(st, |x,y| conv(x,y)); ty::FnSig {binder_id: id, inputs: inputs, output: ret_ty, variadic: variadic} } // Rust metadata parsing pub fn parse_def_id(buf: &[u8]) -> ast::DefId { let mut colon_idx = 0u; let len = buf.len(); while colon_idx < len && buf[colon_idx] != ':' as u8 { colon_idx += 1u; } if colon_idx == len { error!("didn't find ':' when parsing def id"); fail!(); } let crate_part = buf.slice(0u, colon_idx); let def_part = buf.slice(colon_idx + 1u, len); let crate_num = match uint::parse_bytes(crate_part, 10u) { Some(cn) => cn as ast::CrateNum, None => fail!("internal error: parse_def_id: crate number expected, but found {:?}", crate_part) }; let def_num = match uint::parse_bytes(def_part, 10u) { Some(dn) => dn as ast::NodeId, None => fail!("internal error: parse_def_id: id expected, but found {:?}", def_part) }; ast::DefId { krate: crate_num, node: def_num } } pub fn parse_type_param_def_data(data: &[u8], start: uint, crate_num: ast::CrateNum, tcx: &ty::ctxt, conv: conv_did) -> ty::TypeParameterDef { let mut st = parse_state_from_data(data, crate_num, start, tcx); parse_type_param_def(&mut st, conv) } fn parse_type_param_def(st: &mut PState, conv: conv_did) -> ty::TypeParameterDef { let ident = parse_ident(st, ':'); let def_id = parse_def(st, NominalType, |x,y| conv(x,y)); let space = parse_param_space(st); assert_eq!(next(st), '|'); let index = parse_uint(st); assert_eq!(next(st), '|'); let bounds = Rc::new(parse_bounds(st, |x,y| conv(x,y))); let default = parse_opt(st, |st| parse_ty(st, |x,y| conv(x,y))); ty::TypeParameterDef { ident: ident, def_id: def_id, space: space, index: index, bounds: bounds, default: default } } fn parse_bounds(st: &mut PState, conv: conv_did) -> ty::ParamBounds { let mut param_bounds = ty::ParamBounds { builtin_bounds: ty::empty_builtin_bounds(), trait_bounds: Vec::new() }; loop { match next(st) { 'S' => { param_bounds.builtin_bounds.add(ty::BoundSend); } 'O' => { param_bounds.builtin_bounds.add(ty::BoundStatic); } 'Z' => { param_bounds.builtin_bounds.add(ty::BoundSized); } 'P' => { param_bounds.builtin_bounds.add(ty::BoundCopy); } 'T' => { param_bounds.builtin_bounds.add(ty::BoundShare); } 'I' => { param_bounds.trait_bounds.push(Rc::new(parse_trait_ref(st, |x,y| conv(x,y)))); } '.' => { return param_bounds; } c => { fail!("parse_bounds: bad bounds ('{}')", c) } } } }