rust/src/comp/metadata/decoder.rs

441 lines
14 KiB
Rust
Raw Normal View History

2011-07-08 01:29:09 -05:00
// Decoding metadata from a single crate's metadata
2011-06-27 18:03:01 -05:00
2011-08-12 00:58:14 -05:00
import std::ebml;
2011-08-15 18:38:23 -05:00
import std::vec;
import std::option;
import std::str;
2011-08-24 23:26:19 -05:00
import std::istr;
2011-08-11 21:14:38 -05:00
import std::io;
import std::map::hashmap;
import syntax::ast;
import syntax::ast_util;
2011-06-30 19:03:08 -05:00
import front::attr;
import middle::ty;
import common::*;
import tydecode::parse_def_id;
import tydecode::parse_ty_data;
import driver::session;
import syntax::print::pprust;
import cstore;
export get_symbol;
export get_tag_variants;
export get_type;
export get_type_param_count;
export get_type_param_kinds;
export lookup_defs;
export get_crate_attributes;
export list_crate_metadata;
export crate_dep;
export get_crate_deps;
export external_resolver;
// A function that takes a def_id relative to the crate being searched and
// returns a def_id relative to the compilation environment. That is, if we
// hit a def_id for an item defined in another crate, somebody needs to
// figure out what crate that's in and give us a def_id that makes sense for
// the current build.
type external_resolver = fn(&ast::def_id) -> ast::def_id;
2011-07-27 07:19:39 -05:00
fn lookup_hash(d: &ebml::doc, eq_fn: fn(&[u8]) -> bool, hash: uint) ->
2011-08-12 00:58:14 -05:00
[ebml::doc] {
let index = ebml::get_doc(d, tag_index);
let table = ebml::get_doc(index, tag_index_table);
2011-07-27 07:19:39 -05:00
let hash_pos = table.start + hash % 256u * 4u;
2011-08-12 00:58:14 -05:00
let pos = ebml::be_uint_from_bytes(d.data, hash_pos, 4u);
let bucket = ebml::doc_at(d.data, pos);
// Awkward logic because we can't ret from foreach yet
let result: [ebml::doc] = [];
2011-07-27 07:19:39 -05:00
let belt = tag_index_buckets_bucket_elt;
for each elt: ebml::doc in ebml::tagged_docs(bucket, belt) {
2011-08-12 00:58:14 -05:00
let pos = ebml::be_uint_from_bytes(elt.data, elt.start, 4u);
if eq_fn(vec::slice::<u8>(*elt.data, elt.start + 4u, elt.end)) {
result += [ebml::doc_at(d.data, pos)];
}
}
ret result;
}
fn maybe_find_item(item_id: int, items: &ebml::doc) -> option::t<ebml::doc> {
fn eq_item(bytes: &[u8], item_id: int) -> bool {
2011-08-12 00:58:14 -05:00
ret ebml::be_uint_from_bytes(@bytes, 0u, 4u) as int == item_id;
}
2011-07-27 07:19:39 -05:00
let eqer = bind eq_item(_, item_id);
let found = lookup_hash(items, eqer, hash_node_id(item_id));
2011-08-15 18:38:23 -05:00
if vec::len(found) == 0u {
ret option::none::<ebml::doc>;
} else { ret option::some::<ebml::doc>(found[0]); }
}
2011-08-12 00:58:14 -05:00
fn find_item(item_id: int, items: &ebml::doc) -> ebml::doc {
ret option::get(maybe_find_item(item_id, items));
}
2011-08-12 00:58:14 -05:00
// Looks up an item in the given metadata and returns an ebml doc pointing
// to the item data.
2011-08-12 00:58:14 -05:00
fn lookup_item(item_id: int, data: &@[u8]) -> ebml::doc {
let items = ebml::get_doc(ebml::new_doc(data), tag_items);
ret find_item(item_id, items);
}
2011-08-12 00:58:14 -05:00
fn item_family(item: &ebml::doc) -> u8 {
let fam = ebml::get_doc(item, tag_items_data_item_family);
ret ebml::doc_as_uint(fam) as u8;
}
fn item_symbol(item: &ebml::doc) -> istr {
2011-08-12 00:58:14 -05:00
let sym = ebml::get_doc(item, tag_items_data_item_symbol);
ret istr::unsafe_from_bytes(ebml::doc_data(sym));
}
2011-08-12 00:58:14 -05:00
// Parses the def_id stored under the tag-id entry of the item `d`. lookup_def
// uses it to find the tag that a variant belongs to.
fn variant_tag_id(d: &ebml::doc) -> ast::def_id {
    let tag_id_doc = ebml::get_doc(d, tag_items_data_item_tag_id);
    let raw = ebml::doc_data(tag_id_doc);
    ret parse_def_id(raw);
}
2011-08-12 00:58:14 -05:00
fn item_type(item: &ebml::doc, this_cnum: ast::crate_num, tcx: ty::ctxt,
2011-07-27 07:19:39 -05:00
extres: &external_resolver) -> ty::t {
fn parse_external_def_id(this_cnum: ast::crate_num,
extres: &external_resolver, s: &istr) ->
2011-07-27 07:19:39 -05:00
ast::def_id {
let buf = istr::bytes(s);
2011-07-27 07:19:39 -05:00
let external_def_id = parse_def_id(buf);
2011-07-08 01:29:09 -05:00
// This item was defined in the crate we're searching if it's has the
// local crate number, otherwise we need to search a different crate
2011-07-27 07:19:39 -05:00
if external_def_id.crate == ast::local_crate {
ret {crate: this_cnum, node: external_def_id.node};
} else { ret extres(external_def_id); }
}
2011-08-12 00:58:14 -05:00
let tp = ebml::get_doc(item, tag_items_data_item_type);
2011-07-27 07:19:39 -05:00
let def_parser = bind parse_external_def_id(this_cnum, extres, _);
ret parse_ty_data(item.data, this_cnum, tp.start, tp.end - tp.start,
def_parser, tcx);
}
2011-08-12 00:58:14 -05:00
fn item_ty_param_kinds(item: &ebml::doc) -> [ast::kind] {
let ks: [ast::kind] = [];
let tp = tag_items_data_item_ty_param_kinds;
2011-08-12 00:58:14 -05:00
for each p: ebml::doc in ebml::tagged_docs(item, tp) {
let dat: [u8] = ebml::doc_data(p);
2011-08-12 00:58:14 -05:00
let vi = ebml::vint_at(dat, 0u);
let i = 0u;
while i < vi.val {
let k =
alt dat[vi.next + i] as char {
'u' { ast::kind_unique }
's' { ast::kind_shared }
'p' { ast::kind_pinned }
};
ks += [k];
i += 1u;
}
}
ret ks;
}
2011-08-12 00:58:14 -05:00
fn tag_variant_ids(item: &ebml::doc, this_cnum: ast::crate_num) ->
[ast::def_id] {
let ids: [ast::def_id] = [];
2011-07-27 07:19:39 -05:00
let v = tag_items_data_item_variant;
for each p: ebml::doc in ebml::tagged_docs(item, v) {
2011-08-12 00:58:14 -05:00
let ext = parse_def_id(ebml::doc_data(p));
ids += [{crate: this_cnum, node: ext.node}];
}
ret ids;
}
// Given a path and serialized crate metadata, returns the ID of the
// definition the path refers to.
fn resolve_path(path: &[ast::ident], data: @[u8]) -> [ast::def_id] {
fn eq_item(data: &[u8], s: &istr) -> bool {
ret istr::eq(istr::unsafe_from_bytes(data), s);
}
let s = istr::connect(path, ~"::");
2011-08-12 00:58:14 -05:00
let md = ebml::new_doc(data);
let paths = ebml::get_doc(md, tag_paths);
2011-07-27 07:19:39 -05:00
let eqer = bind eq_item(_, s);
let result: [ast::def_id] = [];
for doc: ebml::doc in lookup_hash(paths, eqer,
hash_path(s)) {
2011-08-12 00:58:14 -05:00
let did_doc = ebml::get_doc(doc, tag_def_id);
result += [parse_def_id(ebml::doc_data(did_doc))];
}
ret result;
}
// Crate metadata queries
fn lookup_defs(data: &@[u8], cnum: ast::crate_num, path: &[ast::ident]) ->
[ast::def] {
2011-08-15 18:38:23 -05:00
ret vec::map(bind lookup_def(cnum, data, _), resolve_path(path, data));
}
// FIXME doesn't yet handle re-exported externals
fn lookup_def(cnum: ast::crate_num, data: @[u8], did_: &ast::def_id) ->
2011-07-27 07:19:39 -05:00
ast::def {
let item = lookup_item(did_.node, data);
let fam_ch = item_family(item);
2011-07-27 07:19:39 -05:00
let did = {crate: cnum, node: did_.node};
2011-07-27 07:48:34 -05:00
// We treat references to tags as references to types.
let def =
alt fam_ch as char {
2011-07-27 07:19:39 -05:00
'c' { ast::def_const(did) }
'f' { ast::def_fn(did, ast::impure_fn) }
'p' { ast::def_fn(did, ast::pure_fn) }
'F' { ast::def_native_fn(did) }
'y' { ast::def_ty(did) }
'T' { ast::def_native_ty(did) }
't' { ast::def_ty(did) }
'm' { ast::def_mod(did) }
'n' { ast::def_native_mod(did) }
'v' {
let tid = variant_tag_id(item);
tid = {crate: cnum, node: tid.node};
ast::def_variant(tid, did)
}
};
ret def;
}
fn get_type(data: @[u8], def: ast::def_id, tcx: &ty::ctxt,
extres: &external_resolver) -> ty::ty_param_kinds_and_ty {
2011-07-27 07:19:39 -05:00
let this_cnum = def.crate;
let node_id = def.node;
let item = lookup_item(node_id, data);
let t = item_type(item, this_cnum, tcx, extres);
let tp_kinds: [ast::kind];
let fam_ch = item_family(item);
let has_ty_params = family_has_type_params(fam_ch);
2011-07-27 07:19:39 -05:00
if has_ty_params {
tp_kinds = item_ty_param_kinds(item);
} else { tp_kinds = []; }
ret {kinds: tp_kinds, ty: t};
}
fn get_type_param_count(data: @[u8], id: ast::node_id) -> uint {
2011-08-15 18:38:23 -05:00
ret vec::len(get_type_param_kinds(data, id));
}
fn get_type_param_kinds(data: @[u8], id: ast::node_id) -> [ast::kind] {
ret item_ty_param_kinds(lookup_item(id, data));
}
fn get_symbol(data: @[u8], id: ast::node_id) -> istr {
ret item_symbol(lookup_item(id, data));
}
fn get_tag_variants(_data: &@[u8], def: ast::def_id, tcx: &ty::ctxt,
extres: &external_resolver) -> [ty::variant_info] {
2011-07-27 07:19:39 -05:00
let external_crate_id = def.crate;
let data =
cstore::get_crate_data(tcx.sess.get_cstore(), external_crate_id).data;
2011-08-12 00:58:14 -05:00
let items = ebml::get_doc(ebml::new_doc(data), tag_items);
2011-07-27 07:19:39 -05:00
let item = find_item(def.node, items);
let infos: [ty::variant_info] = [];
2011-07-27 07:19:39 -05:00
let variant_ids = tag_variant_ids(item, external_crate_id);
for did: ast::def_id in variant_ids {
2011-07-27 07:19:39 -05:00
let item = find_item(did.node, items);
let ctor_ty = item_type(item, external_crate_id, tcx, extres);
let arg_tys: [ty::t] = [];
2011-07-27 07:19:39 -05:00
alt ty::struct(tcx, ctor_ty) {
ty::ty_fn(_, args, _, _, _) {
for a: ty::arg in args { arg_tys += [a.ty]; }
2011-07-27 07:19:39 -05:00
}
_ {
// Nullary tag variant.
}
}
infos += [{args: arg_tys, ctor_ty: ctor_ty, id: did}];
}
ret infos;
}
fn family_has_type_params(fam_ch: u8) -> bool {
ret alt fam_ch as char {
2011-07-27 07:19:39 -05:00
'c' { false }
'f' { true }
'p' { true }
'F' { true }
'y' { true }
't' { true }
'T' { false }
'm' { false }
'n' { false }
'v' { true }
};
}
// Splits a path index entry into its two parts: a four-byte position at
// the front and the path text that makes up the rest of the entry.
fn read_path(d: &ebml::doc) -> {path: istr, pos: uint} {
    let bytes = ebml::doc_data(d);
    let target = ebml::be_uint_from_bytes(@bytes, 0u, 4u);
    let total = vec::len::<u8>(bytes);
    let name = istr::unsafe_from_bytes(vec::slice::<u8>(bytes, 4u, total));
    ret {path: name, pos: target};
}
fn describe_def(items: &ebml::doc, id: ast::def_id) -> istr {
if id.crate != ast::local_crate { ret ~"external"; }
ret item_family_to_str(item_family(find_item(id.node, items)));
}
fn item_family_to_str(fam: u8) -> istr {
alt fam as char {
'c' { ret ~"const"; }
'f' { ret ~"fn"; }
'p' { ret ~"pure fn"; }
'F' { ret ~"native fn"; }
'y' { ret ~"type"; }
'T' { ret ~"native type"; }
't' { ret ~"type"; }
'm' { ret ~"mod"; }
'n' { ret ~"native mod"; }
'v' { ret ~"tag"; }
}
}
2011-08-12 00:58:14 -05:00
// Decodes the meta items stored directly under `md`. All word items come
// first in the result, then all name/value items, then all list items;
// list items are decoded recursively.
fn get_meta_items(md: &ebml::doc) -> [@ast::meta_item] {
    let decoded: [@ast::meta_item] = [];
    for each word_doc: ebml::doc in
        ebml::tagged_docs(md, tag_meta_item_word) {
        let name_doc = ebml::get_doc(word_doc, tag_meta_item_name);
        let name = istr::unsafe_from_bytes(ebml::doc_data(name_doc));
        decoded += [attr::mk_word_item(name)];
    }
    for each pair_doc: ebml::doc in
        ebml::tagged_docs(md, tag_meta_item_name_value) {
        let name_doc = ebml::get_doc(pair_doc, tag_meta_item_name);
        let value_doc = ebml::get_doc(pair_doc, tag_meta_item_value);
        let name = istr::unsafe_from_bytes(ebml::doc_data(name_doc));
        let value = istr::unsafe_from_bytes(ebml::doc_data(value_doc));
        // FIXME (#611): Should be able to decode meta_name_value variants,
        // but currently they can't be encoded
        decoded += [attr::mk_name_value_item_str(name, value)];
    }
    for each list_doc: ebml::doc in
        ebml::tagged_docs(md, tag_meta_item_list) {
        let name_doc = ebml::get_doc(list_doc, tag_meta_item_name);
        let name = istr::unsafe_from_bytes(ebml::doc_data(name_doc));
        let children = get_meta_items(list_doc);
        decoded += [attr::mk_list_item(name, children)];
    }
    ret decoded;
}
2011-08-12 00:58:14 -05:00
fn get_attributes(md: &ebml::doc) -> [ast::attribute] {
let attrs: [ast::attribute] = [];
2011-08-12 00:58:14 -05:00
alt ebml::maybe_get_doc(md, tag_attributes) {
2011-07-27 07:19:39 -05:00
option::some(attrs_d) {
for each attr_doc: ebml::doc in
2011-08-12 00:58:14 -05:00
ebml::tagged_docs(attrs_d, tag_attribute) {
2011-07-27 07:19:39 -05:00
let meta_items = get_meta_items(attr_doc);
// Currently it's only possible to have a single meta item on
// an attribute
2011-08-15 18:38:23 -05:00
assert (vec::len(meta_items) == 1u);
let meta_item = meta_items[0];
2011-07-27 07:19:39 -05:00
attrs +=
[{node: {style: ast::attr_outer, value: *meta_item},
span: ast_util::dummy_sp()}];
}
2011-07-27 07:19:39 -05:00
}
option::none. { }
}
ret attrs;
}
2011-08-12 00:58:14 -05:00
// Writes each meta item found under `meta_items` to `out`, pretty-printed,
// one per line.
fn list_meta_items(meta_items: &ebml::doc, out: io::writer) {
    for mi: @ast::meta_item in get_meta_items(meta_items) {
        let text = istr::to_estr(pprust::meta_item_to_str(*mi));
        out.write_str(istr::from_estr(#fmt["%s\n", text]));
    }
}
2011-08-12 00:58:14 -05:00
fn list_crate_attributes(md: &ebml::doc, out: io::writer) {
2011-08-24 23:26:19 -05:00
out.write_str(~"=Crate Attributes=\n");
for attr: ast::attribute in get_attributes(md) {
2011-08-24 23:26:19 -05:00
out.write_str(
istr::from_estr(
#fmt["%s\n",
istr::to_estr(pprust::attribute_to_str(attr))]));
}
2011-08-24 23:26:19 -05:00
out.write_str(~"\n\n");
}
fn get_crate_attributes(data: @[u8]) -> [ast::attribute] {
2011-08-12 00:58:14 -05:00
ret get_attributes(ebml::new_doc(data));
}
// A dependency recorded in a crate's metadata: the crate number that
// get_crate_deps assigns to it and the name decoded from the metadata.
type crate_dep = {cnum: ast::crate_num, ident: istr};
2011-07-27 07:19:39 -05:00
fn get_crate_deps(data: @[u8]) -> [crate_dep] {
let deps: [crate_dep] = [];
2011-08-12 00:58:14 -05:00
let cratedoc = ebml::new_doc(data);
let depsdoc = ebml::get_doc(cratedoc, tag_crate_deps);
2011-07-27 07:19:39 -05:00
let crate_num = 1;
for each depdoc: ebml::doc in ebml::tagged_docs(depsdoc, tag_crate_dep) {
let depname = istr::unsafe_from_bytes(ebml::doc_data(depdoc));
deps += [{cnum: crate_num, ident: depname}];
crate_num += 1;
}
ret deps;
}
2011-08-11 21:14:38 -05:00
fn list_crate_deps(data: @[u8], out: io::writer) {
2011-08-24 23:26:19 -05:00
out.write_str(~"=External Dependencies=\n");
for dep: crate_dep in get_crate_deps(data) {
2011-08-24 23:26:19 -05:00
out.write_str(
istr::from_estr(#fmt["%d %s\n", dep.cnum,
istr::to_estr(dep.ident)]));
}
2011-08-24 23:26:19 -05:00
out.write_str(~"\n");
}
2011-08-12 00:58:14 -05:00
fn list_crate_items(bytes: &@[u8], md: &ebml::doc, out: io::writer) {
2011-08-24 23:26:19 -05:00
out.write_str(~"=Items=\n");
2011-08-12 00:58:14 -05:00
let paths = ebml::get_doc(md, tag_paths);
let items = ebml::get_doc(md, tag_items);
let index = ebml::get_doc(paths, tag_index);
let bs = ebml::get_doc(index, tag_index_buckets);
for each bucket: ebml::doc in
2011-08-12 00:58:14 -05:00
ebml::tagged_docs(bs, tag_index_buckets_bucket) {
2011-07-27 07:19:39 -05:00
let et = tag_index_buckets_bucket_elt;
for each elt: ebml::doc in ebml::tagged_docs(bucket, et) {
2011-07-27 07:19:39 -05:00
let data = read_path(elt);
2011-08-12 00:58:14 -05:00
let def = ebml::doc_at(bytes, data.pos);
let did_doc = ebml::get_doc(def, tag_def_id);
let did = parse_def_id(ebml::doc_data(did_doc));
2011-08-24 23:26:19 -05:00
out.write_str(
istr::from_estr(
#fmt["%s (%s)\n",
istr::to_estr(data.path),
istr::to_estr(describe_def(items, did))]));
}
}
2011-08-24 23:26:19 -05:00
out.write_str(~"\n");
}
2011-08-11 21:14:38 -05:00
fn list_crate_metadata(bytes: &@[u8], out: io::writer) {
2011-08-12 00:58:14 -05:00
let md = ebml::new_doc(bytes);
list_crate_attributes(md, out);
list_crate_deps(bytes, out);
list_crate_items(bytes, md, out);
}
// Local Variables:
// mode: rust
// fill-column: 78;
// indent-tabs-mode: nil
// c-basic-offset: 4
// buffer-file-coding-system: utf-8-unix
// compile-command: "make -k -C $RBUILD 2>&1 | sed -e 's/\\/x\\//x:\\//g'";
// End: