rust/src/rustc/metadata/decoder.rs

579 lines
19 KiB
Rust
Raw Normal View History

2011-07-08 01:29:09 -05:00
// Decoding metadata from a single crate's metadata
2011-06-27 18:03:01 -05:00
import std::{ebml, map, io};
import std::map::hashmap;
import io::writer_util;
2011-09-12 18:13:28 -05:00
import syntax::{ast, ast_util};
import driver::session::session;
2011-06-30 19:03:08 -05:00
import front::attr;
import middle::ty;
import middle::ast_map;
import common::*;
import tydecode::{parse_ty_data, parse_def_id, parse_bounds_data};
import syntax::print::pprust;
import cmd=cstore::crate_metadata;
import middle::trans::common::maps;
export get_symbol;
export get_enum_variants;
export get_type;
export get_type_param_count;
export get_impl_iface;
export lookup_def;
export lookup_item_name;
export get_impl_iface;
export resolve_path;
export get_crate_attributes;
export list_crate_metadata;
export crate_dep;
export get_crate_deps;
2011-12-11 09:23:38 -06:00
export get_crate_hash;
export get_impls_for_mod;
export get_iface_methods;
export get_crate_module_paths;
export get_item_path;
export maybe_get_item_ast;
// Used internally by astencode:
export translate_def_id;
// Note on def_id translation: the closures this module hands to the type
// decoder take a def_id relative to the crate being searched and return a
// def_id relative to the compilation environment, i.e. if we hit a def_id
// for an item defined in another crate, somebody needs to figure out what
// crate that's in and give us a def_id that makes sense for the current
// build (see translate_def_id).
2011-07-27 07:19:39 -05:00
fn lookup_hash(d: ebml::doc, eq_fn: fn@([u8]) -> bool, hash: uint) ->
2011-08-12 00:58:14 -05:00
[ebml::doc] {
let index = ebml::get_doc(d, tag_index);
let table = ebml::get_doc(index, tag_index_table);
2011-07-27 07:19:39 -05:00
let hash_pos = table.start + hash % 256u * 4u;
let pos = io::u64_from_be_bytes(*d.data, hash_pos, 4u) as uint;
let {tag:_, doc:bucket} = ebml::doc_at(d.data, pos);
// Awkward logic because we can't ret from foreach yet
let result: [ebml::doc] = [];
2011-07-27 07:19:39 -05:00
let belt = tag_index_buckets_bucket_elt;
ebml::tagged_docs(bucket, belt) {|elt|
let pos = io::u64_from_be_bytes(*elt.data, elt.start, 4u) as uint;
if eq_fn(vec::slice::<u8>(*elt.data, elt.start + 4u, elt.end)) {
result += [ebml::doc_at(d.data, pos).doc];
}
};
ret result;
}
fn maybe_find_item(item_id: int, items: ebml::doc) -> option<ebml::doc> {
fn eq_item(bytes: [u8], item_id: int) -> bool {
ret io::u64_from_be_bytes(bytes, 0u, 4u) as int == item_id;
}
2011-07-27 07:19:39 -05:00
let eqer = bind eq_item(_, item_id);
let found = lookup_hash(items, eqer, hash_node_id(item_id));
2011-08-15 18:38:23 -05:00
if vec::len(found) == 0u {
ret option::none::<ebml::doc>;
} else { ret option::some::<ebml::doc>(found[0]); }
}
fn find_item(item_id: int, items: ebml::doc) -> ebml::doc {
ret option::get(maybe_find_item(item_id, items));
}
2011-08-12 00:58:14 -05:00
// Looks up an item in the given metadata and returns an ebml doc pointing
// to the item data.
fn lookup_item(item_id: int, data: @[u8]) -> ebml::doc {
2011-08-12 00:58:14 -05:00
let items = ebml::get_doc(ebml::new_doc(data), tag_items);
ret find_item(item_id, items);
}
fn item_family(item: ebml::doc) -> char {
2011-08-12 00:58:14 -05:00
let fam = ebml::get_doc(item, tag_items_data_item_family);
ebml::doc_as_u8(fam) as char
}
fn item_symbol(item: ebml::doc) -> str {
2011-08-12 00:58:14 -05:00
let sym = ebml::get_doc(item, tag_items_data_item_symbol);
ret str::from_bytes(ebml::doc_data(sym));
}
fn variant_enum_id(d: ebml::doc) -> ast::def_id {
let tagdoc = ebml::get_doc(d, tag_items_data_item_enum_id);
2011-08-12 00:58:14 -05:00
ret parse_def_id(ebml::doc_data(tagdoc));
}
fn variant_disr_val(d: ebml::doc) -> option<int> {
option::chain(ebml::maybe_get_doc(d, tag_disr_val)) {|val_doc|
int::parse_buf(ebml::doc_data(val_doc), 10u)
}
}
fn doc_type(doc: ebml::doc, tcx: ty::ctxt, cdata: cmd) -> ty::t {
let tp = ebml::get_doc(doc, tag_items_data_item_type);
parse_ty_data(tp.data, cdata.cnum, tp.start, tcx, {|did|
translate_def_id(cdata, did)
})
}
fn item_type(item_id: ast::def_id, item: ebml::doc,
tcx: ty::ctxt, cdata: cmd) -> ty::t {
let t = doc_type(item, tcx, cdata);
if family_names_type(item_family(item)) {
ty::mk_with_id(tcx, t, item_id)
} else { t }
}
// Decodes the iface type recorded on an impl item under tag_impl_iface.
// Returns none when no such document exists; if several exist, the last
// one decoded is returned.
fn item_impl_iface(item: ebml::doc, tcx: ty::ctxt, cdata: cmd)
    -> option<ty::t> {
    let iface = none;
    ebml::tagged_docs(item, tag_impl_iface) {|iface_doc|
        iface = some(parse_ty_data(iface_doc.data, cdata.cnum,
                                   iface_doc.start, tcx, {|did|
            translate_def_id(cdata, did)
        }));
    }
    ret iface;
}
2012-01-30 04:36:18 -06:00
// Decodes the bounds of every type parameter of `item`: one entry per
// tag_items_data_item_ty_param_bounds document, in stored order.
fn item_ty_param_bounds(item: ebml::doc, tcx: ty::ctxt, cdata: cmd)
    -> @[ty::param_bounds] {
    let all_bounds = [];
    ebml::tagged_docs(item, tag_items_data_item_ty_param_bounds) {|bdoc|
        all_bounds += [parse_bounds_data(bdoc.data, bdoc.start, cdata.cnum,
                                         tcx, {|did|
            translate_def_id(cdata, did)
        })];
    }
    ret @all_bounds;
}
fn item_ty_param_count(item: ebml::doc) -> uint {
let n = 0u;
ebml::tagged_docs(item, tag_items_data_item_ty_param_bounds,
{|_p| n += 1u; });
n
}
fn enum_variant_ids(item: ebml::doc, cdata: cmd) -> [ast::def_id] {
let ids: [ast::def_id] = [];
2011-07-27 07:19:39 -05:00
let v = tag_items_data_item_variant;
ebml::tagged_docs(item, v) {|p|
2011-08-12 00:58:14 -05:00
let ext = parse_def_id(ebml::doc_data(p));
ids += [{crate: cdata.cnum, node: ext.node}];
};
ret ids;
}
// Given a path and serialized crate metadata, returns the ID of the
// definition the path refers to.
fn resolve_path(path: [ast::ident], data: @[u8]) -> [ast::def_id] {
fn eq_item(data: [u8], s: str) -> bool {
ret str::eq(str::from_bytes(data), s);
}
2011-09-02 17:34:58 -05:00
let s = str::connect(path, "::");
2011-08-12 00:58:14 -05:00
let md = ebml::new_doc(data);
let paths = ebml::get_doc(md, tag_paths);
2011-07-27 07:19:39 -05:00
let eqer = bind eq_item(_, s);
let result: [ast::def_id] = [];
2011-09-02 17:34:58 -05:00
for doc: ebml::doc in lookup_hash(paths, eqer, hash_path(s)) {
2011-08-12 00:58:14 -05:00
let did_doc = ebml::get_doc(doc, tag_def_id);
result += [parse_def_id(ebml::doc_data(did_doc))];
}
ret result;
}
// Decodes the path stored under tag_path in `item_doc` into a sequence of
// module and name elements, in stored order.
fn item_path(item_doc: ebml::doc) -> ast_map::path {
    let path_doc = ebml::get_doc(item_doc, tag_path);
    let len_doc = ebml::get_doc(path_doc, tag_path_len);
    let n_elts = ebml::doc_as_u32(len_doc) as uint;
    let elts = [];
    // The stored length is only used to pre-size the vector.
    vec::reserve(elts, n_elts);
    ebml::docs(path_doc) {|tag, elt_doc|
        // Any other tag (the tag_path_len element) is skipped.
        if tag == tag_path_elt_mod {
            elts += [ast_map::path_mod(ebml::doc_as_str(elt_doc))];
        } else if tag == tag_path_elt_name {
            elts += [ast_map::path_name(ebml::doc_as_str(elt_doc))];
        }
    }
    ret elts;
}
fn item_name(item: ebml::doc) -> ast::ident {
let name = ebml::get_doc(item, tag_paths_data_name);
str::from_bytes(ebml::doc_data(name))
}
fn lookup_item_name(data: @[u8], id: ast::node_id) -> ast::ident {
item_name(lookup_item(id, data))
}
fn lookup_def(cnum: ast::crate_num, data: @[u8], did_: ast::def_id) ->
2011-07-27 07:19:39 -05:00
ast::def {
let item = lookup_item(did_.node, data);
let fam_ch = item_family(item);
2011-07-27 07:19:39 -05:00
let did = {crate: cnum, node: did_.node};
// We treat references to enums as references to types.
alt check fam_ch {
'c' { ast::def_const(did) }
'u' { ast::def_fn(did, ast::unsafe_fn) }
'f' { ast::def_fn(did, ast::impure_fn) }
'p' { ast::def_fn(did, ast::pure_fn) }
'y' { ast::def_ty(did) }
't' { ast::def_ty(did) }
'm' { ast::def_mod(did) }
'n' { ast::def_native_mod(did) }
'v' {
let tid = variant_enum_id(item);
tid = {crate: cnum, node: tid.node};
ast::def_variant(tid, did)
}
'I' { ast::def_ty(did) }
}
}
fn get_type(cdata: cmd, id: ast::node_id, tcx: ty::ctxt)
-> ty::ty_param_bounds_and_ty {
let item = lookup_item(id, cdata.data);
let t = item_type({crate: cdata.cnum, node: id}, item, tcx, cdata);
2012-01-30 04:36:18 -06:00
let tp_bounds = if family_has_type_params(item_family(item)) {
item_ty_param_bounds(item, tcx, cdata)
2012-01-02 05:09:26 -06:00
} else { @[] };
ret {bounds: tp_bounds, ty: t};
}
fn get_type_param_count(data: @[u8], id: ast::node_id) -> uint {
item_ty_param_count(lookup_item(id, data))
}
fn get_impl_iface(cdata: cmd, id: ast::node_id, tcx: ty::ctxt)
-> option<ty::t> {
item_impl_iface(lookup_item(id, cdata.data), tcx, cdata)
}
2011-09-02 17:34:58 -05:00
fn get_symbol(data: @[u8], id: ast::node_id) -> str {
ret item_symbol(lookup_item(id, data));
}
fn get_item_path(cdata: cmd, id: ast::node_id) -> ast_map::path {
item_path(lookup_item(id, cdata.data))
}
fn maybe_get_item_ast(cdata: cmd, tcx: ty::ctxt, maps: maps,
id: ast::node_id) -> option<ast::inlined_item> {
let item_doc = lookup_item(id, cdata.data);
let path = vec::init(item_path(item_doc));
astencode::decode_inlined_item(cdata, tcx, maps, path, item_doc)
}
fn get_enum_variants(cdata: cmd, id: ast::node_id, tcx: ty::ctxt)
-> [ty::variant_info] {
let data = cdata.data;
2011-08-12 00:58:14 -05:00
let items = ebml::get_doc(ebml::new_doc(data), tag_items);
let item = find_item(id, items);
let infos: [ty::variant_info] = [];
let variant_ids = enum_variant_ids(item, cdata);
let disr_val = 0;
for did: ast::def_id in variant_ids {
2011-07-27 07:19:39 -05:00
let item = find_item(did.node, items);
let ctor_ty = item_type({crate: cdata.cnum, node: id}, item,
tcx, cdata);
let name = item_name(item);
let arg_tys: [ty::t] = [];
alt ty::get(ctor_ty).struct {
ty::ty_fn(f) {
for a: ty::arg in f.inputs { arg_tys += [a.ty]; }
2011-07-27 07:19:39 -05:00
}
2012-01-19 16:24:03 -06:00
_ { /* Nullary enum variant. */ }
}
alt variant_disr_val(item) {
some(val) { disr_val = val; }
_ { /* empty */ }
}
infos += [@{args: arg_tys, ctor_ty: ctor_ty, name: name,
id: did, disr_val: disr_val}];
disr_val += 1;
}
ret infos;
}
// Lists the methods recorded on impl `item`. `base_tps` is subtracted from
// each method's type parameter count to give the method's own n_tps.
fn item_impl_methods(cdata: cmd, item: ebml::doc, base_tps: uint)
    -> [@middle::resolve::method_info] {
    let methods = [];
    ebml::tagged_docs(item, tag_item_method) {|mdoc|
        let raw_did = parse_def_id(ebml::doc_data(mdoc));
        // The method item is looked up by the id as encoded in this crate.
        let m_item = lookup_item(raw_did.node, cdata.data);
        let did = translate_def_id(cdata, raw_did);
        let own_tps = item_ty_param_count(m_item) - base_tps;
        methods += [@{did: did, n_tps: own_tps, ident: item_name(m_item)}];
    }
    ret methods;
}
// Lists the impls recorded on module `m_id`. When `name` is some(n), only
// impls whose name equals n are returned; with none, all are returned.
fn get_impls_for_mod(cdata: cmd, m_id: ast::node_id,
                     name: option<ast::ident>)
    -> @[@middle::resolve::_impl] {
    let data = cdata.data;
    let mod_item = lookup_item(m_id, data);
    let impls = [];
    ebml::tagged_docs(mod_item, tag_mod_impl) {|doc|
        let did = translate_def_id(cdata, parse_def_id(ebml::doc_data(doc)));
        let item = lookup_item(did.node, data);
        let nm = item_name(item);
        let wanted = alt name { some(n) { n == nm } none { true } };
        if wanted {
            // The impl's own type parameters are the base that
            // item_impl_methods subtracts from each method's count.
            let base_tps = item_ty_param_count(item);
            impls += [@{did: did, ident: nm,
                        methods: item_impl_methods(cdata, item, base_tps)}];
        }
    }
    ret @impls;
}
// Decodes the methods recorded on iface `id`: name, type parameter bounds,
// function type and purity. Reports a compiler bug through tcx.sess.bug if
// a method's type is not a function type.
fn get_iface_methods(cdata: cmd, id: ast::node_id, tcx: ty::ctxt)
    -> @[ty::method] {
    let iface_item = lookup_item(id, cdata.data);
    let methods = [];
    ebml::tagged_docs(iface_item, tag_item_method) {|mth|
        let bounds = item_ty_param_bounds(mth, tcx, cdata);
        let name = item_name(mth);
        let mth_ty = doc_type(mth, tcx, cdata);
        let fty = alt ty::get(mth_ty).struct {
          ty::ty_fn(f) { f }
          _ {
            tcx.sess.bug("get_iface_methods: id has non-function type");
          }
        };
        // Only the three fn families are expected on iface methods.
        let purity = alt check item_family(mth) {
          'u' { ast::unsafe_fn }
          'f' { ast::impure_fn }
          'p' { ast::pure_fn }
        };
        methods += [{ident: name, tps: bounds, fty: fty, purity: purity}];
    }
    ret @methods;
}
// Says whether items of family `fam_ch` record type parameter bounds.
// Family characters outside the listed set make the `alt check` fail.
fn family_has_type_params(fam_ch: char) -> bool {
    alt check fam_ch {
      'f' | 'u' | 'p' | 'F' | 'U' | 'P' { true }
      'y' | 't' | 'v' | 'i' | 'I' { true }
      'c' | 'T' | 'm' | 'n' { false }
    }
}
// True for the families 'y', 't' and 'I', whose decoded types item_type
// tags with the item's def_id; false for every other character.
fn family_names_type(fam_ch: char) -> bool {
    ret fam_ch == 'y' || fam_ch == 't' || fam_ch == 'I';
}
// Splits a path index element into its two parts: a 4-byte big-endian
// position followed by the path string, which takes up the rest of the
// element's data.
fn read_path(d: ebml::doc) -> {path: str, pos: uint} {
    let bytes = ebml::doc_data(d);
    let pos = io::u64_from_be_bytes(bytes, 0u, 4u) as uint;
    let path_bytes = vec::slice::<u8>(bytes, 4u, vec::len::<u8>(bytes));
    ret {path: str::from_bytes(path_bytes), pos: pos};
}
fn describe_def(items: ebml::doc, id: ast::def_id) -> str {
2011-09-02 17:34:58 -05:00
if id.crate != ast::local_crate { ret "external"; }
ret item_family_to_str(item_family(find_item(id.node, items)));
}
// Maps an item family character to a human-readable name. Characters
// outside the listed set make the `alt check` fail.
fn item_family_to_str(fam: char) -> str {
    alt check fam {
      'c' { "const" }
      'f' { "fn" }
      'u' { "unsafe fn" }
      'p' { "pure fn" }
      'F' { "native fn" }
      'U' { "unsafe native fn" }
      'P' { "pure native fn" }
      'y' | 't' { "type" }
      'T' { "native type" }
      'm' { "mod" }
      'n' { "native mod" }
      'v' { "enum" }
      'i' { "impl" }
      'I' { "iface" }
    }
}
// Decodes the meta items stored directly under `md`. Three passes are
// made, so the result holds all word items first, then all name/value
// items, then all list items, rather than the stored interleaving. List
// items are decoded recursively.
fn get_meta_items(md: ebml::doc) -> [@ast::meta_item] {
    let decoded: [@ast::meta_item] = [];
    ebml::tagged_docs(md, tag_meta_item_word) {|word_doc|
        let name_doc = ebml::get_doc(word_doc, tag_meta_item_name);
        let name = str::from_bytes(ebml::doc_data(name_doc));
        decoded += [attr::mk_word_item(name)];
    };
    ebml::tagged_docs(md, tag_meta_item_name_value) {|nv_doc|
        let name_doc = ebml::get_doc(nv_doc, tag_meta_item_name);
        let value_doc = ebml::get_doc(nv_doc, tag_meta_item_value);
        let name = str::from_bytes(ebml::doc_data(name_doc));
        let value = str::from_bytes(ebml::doc_data(value_doc));
        // FIXME (#611): Should be able to decode meta_name_value variants,
        // but currently they can't be encoded
        decoded += [attr::mk_name_value_item_str(name, value)];
    };
    ebml::tagged_docs(md, tag_meta_item_list) {|list_doc|
        let name_doc = ebml::get_doc(list_doc, tag_meta_item_name);
        let name = str::from_bytes(ebml::doc_data(name_doc));
        let children = get_meta_items(list_doc);
        decoded += [attr::mk_list_item(name, children)];
    };
    ret decoded;
}
fn get_attributes(md: ebml::doc) -> [ast::attribute] {
let attrs: [ast::attribute] = [];
2011-08-12 00:58:14 -05:00
alt ebml::maybe_get_doc(md, tag_attributes) {
2011-07-27 07:19:39 -05:00
option::some(attrs_d) {
ebml::tagged_docs(attrs_d, tag_attribute) {|attr_doc|
2011-07-27 07:19:39 -05:00
let meta_items = get_meta_items(attr_doc);
// Currently it's only possible to have a single meta item on
// an attribute
2011-08-15 18:38:23 -05:00
assert (vec::len(meta_items) == 1u);
let meta_item = meta_items[0];
2011-07-27 07:19:39 -05:00
attrs +=
[{node: {style: ast::attr_outer, value: *meta_item},
span: ast_util::dummy_sp()}];
};
2011-07-27 07:19:39 -05:00
}
option::none { }
}
ret attrs;
}
// Writes each meta item found under `meta_items` to `out`, pretty-printed,
// one per line.
fn list_meta_items(meta_items: ebml::doc, out: io::writer) {
    for mi: @ast::meta_item in get_meta_items(meta_items) {
        let line = #fmt["%s\n", pprust::meta_item_to_str(*mi)];
        out.write_str(line);
    }
}
2011-12-11 09:23:38 -06:00
// Writes the "Crate Attributes" section to `out`: a header line that
// includes `hash`, one pretty-printed attribute per line, and two
// trailing newlines.
fn list_crate_attributes(md: ebml::doc, hash: str, out: io::writer) {
    out.write_str(#fmt("=Crate Attributes (%s)=\n", hash));
    for attr: ast::attribute in get_attributes(md) {
        let line = #fmt["%s\n", pprust::attribute_to_str(attr)];
        out.write_str(line);
    }
    out.write_str("\n\n");
}
fn get_crate_attributes(data: @[u8]) -> [ast::attribute] {
2011-08-12 00:58:14 -05:00
ret get_attributes(ebml::new_doc(data));
}
2011-09-02 17:34:58 -05:00
// A crate dependency as listed in crate metadata: `cnum` is the crate
// number used for the dependency and `ident` is the stored dependency name.
type crate_dep = {cnum: ast::crate_num, ident: str};
2011-07-27 07:19:39 -05:00
fn get_crate_deps(data: @[u8]) -> [crate_dep] {
let deps: [crate_dep] = [];
2011-08-12 00:58:14 -05:00
let cratedoc = ebml::new_doc(data);
let depsdoc = ebml::get_doc(cratedoc, tag_crate_deps);
2011-07-27 07:19:39 -05:00
let crate_num = 1;
ebml::tagged_docs(depsdoc, tag_crate_dep) {|depdoc|
let depname = str::from_bytes(ebml::doc_data(depdoc));
deps += [{cnum: crate_num, ident: depname}];
crate_num += 1;
};
ret deps;
}
2011-08-11 21:14:38 -05:00
fn list_crate_deps(data: @[u8], out: io::writer) {
2011-09-02 17:34:58 -05:00
out.write_str("=External Dependencies=\n");
for dep: crate_dep in get_crate_deps(data) {
2011-09-02 17:34:58 -05:00
out.write_str(#fmt["%d %s\n", dep.cnum, dep.ident]);
}
2011-09-02 17:34:58 -05:00
out.write_str("\n");
}
2011-12-11 09:23:38 -06:00
fn get_crate_hash(data: @[u8]) -> str {
let cratedoc = ebml::new_doc(data);
let hashdoc = ebml::get_doc(cratedoc, tag_crate_hash);
ret str::from_bytes(ebml::doc_data(hashdoc));
2011-12-11 09:23:38 -06:00
}
fn list_crate_items(bytes: @[u8], md: ebml::doc, out: io::writer) {
2011-09-02 17:34:58 -05:00
out.write_str("=Items=\n");
2011-08-12 00:58:14 -05:00
let items = ebml::get_doc(md, tag_items);
iter_crate_items(bytes) {|path, did|
out.write_str(#fmt["%s (%s)\n", path, describe_def(items, did)]);
}
out.write_str("\n");
}
2012-01-23 16:59:00 -06:00
fn iter_crate_items(bytes: @[u8], proc: fn(str, ast::def_id)) {
let md = ebml::new_doc(bytes);
let paths = ebml::get_doc(md, tag_paths);
2011-08-12 00:58:14 -05:00
let index = ebml::get_doc(paths, tag_index);
let bs = ebml::get_doc(index, tag_index_buckets);
ebml::tagged_docs(bs, tag_index_buckets_bucket) {|bucket|
2011-07-27 07:19:39 -05:00
let et = tag_index_buckets_bucket_elt;
ebml::tagged_docs(bucket, et) {|elt|
2011-07-27 07:19:39 -05:00
let data = read_path(elt);
let {tag:_, doc:def} = ebml::doc_at(bytes, data.pos);
2011-08-12 00:58:14 -05:00
let did_doc = ebml::get_doc(def, tag_def_id);
let did = parse_def_id(ebml::doc_data(did_doc));
proc(data.path, did);
};
};
}
fn get_crate_module_paths(bytes: @[u8]) -> [(ast::def_id, str)] {
fn mod_of_path(p: str) -> str {
str::connect(vec::init(str::split_str(p, "::")), "::")
}
// find all module (path, def_ids), which are not
// fowarded path due to renamed import or reexport
let res = [];
let mods = map::new_str_hash();
iter_crate_items(bytes) {|path, did|
let m = mod_of_path(path);
if str::is_not_empty(m) {
// if m has a sub-item, it must be a module
mods.insert(m, true);
}
// Collect everything by now. There might be multiple
// paths pointing to the same did. Those will be
// unified later by using the mods map
res += [(did, path)];
}
ret vec::filter(res) {|x|
let (_, xp) = x;
mods.contains_key(xp)
}
}
fn list_crate_metadata(bytes: @[u8], out: io::writer) {
2011-12-11 09:23:38 -06:00
let hash = get_crate_hash(bytes);
2011-08-12 00:58:14 -05:00
let md = ebml::new_doc(bytes);
2011-12-11 09:23:38 -06:00
list_crate_attributes(md, hash, out);
list_crate_deps(bytes, out);
list_crate_items(bytes, md, out);
}
// Translates a def_id from an external crate to a def_id for the current
// compilation environment. We use this when trying to load types from
// external crates - if those types further refer to types in other crates
// then we must translate the crate number from that encoded in the external
// crate to the correct local crate number.
fn translate_def_id(cdata: cmd, did: ast::def_id) -> ast::def_id {
if did.crate == ast::local_crate {
ret {crate: cdata.cnum, node: did.node};
}
alt cdata.cnum_map.find(did.crate) {
option::some(n) { ret {crate: n, node: did.node}; }
option::none { fail "didn't find a crate in the cnum_map"; }
}
}
// Local Variables:
// mode: rust
// fill-column: 78;
// indent-tabs-mode: nil
// c-basic-offset: 4
// buffer-file-coding-system: utf-8-unix
// End: