improve the tyencode abbrev format
3% win on libcore

528828 liballoc-bb943c5a.rlib
1425126 liballoc_jemalloc-bb943c5a.rlib
10090 liballoc_system-bb943c5a.rlib
144904 libarena-bb943c5a.rlib
3773896 libcollections-bb943c5a.rlib
17075242 libcore-bb943c5a.rlib
195770 libflate-bb943c5a.rlib
234702 libfmt_macros-bb943c5a.rlib
536342 libgetopts-bb943c5a.rlib
212028 libgraphviz-bb943c5a.rlib
397068 liblibc-bb943c5a.rlib
185038 liblog-bb943c5a.rlib
680782 librand-bb943c5a.rlib
577574 librbml-bb943c5a.rlib
1381992 librustc_back-bb943c5a.rlib
37554736 librustc-bb943c5a.rlib
12826 librustc_bitflags-bb943c5a.rlib
2257392 librustc_borrowck-bb943c5a.rlib
533858 librustc_data_structures-bb943c5a.rlib
9338878 librustc_driver-bb943c5a.rlib
8960016 librustc_front-bb943c5a.rlib
1594212 librustc_lint-bb943c5a.rlib
79159342 librustc_llvm-bb943c5a.rlib
4590656 librustc_mir-bb943c5a.rlib
3529292 librustc_platform_intrinsics-bb943c5a.rlib
590688 librustc_privacy-bb943c5a.rlib
3084134 librustc_resolve-bb943c5a.rlib
14032890 librustc_trans-bb943c5a.rlib
11833852 librustc_typeck-bb943c5a.rlib
1641496 librustc_unicode-bb943c5a.rlib
15611582 librustdoc-bb943c5a.rlib
2693764 libserialize-bb943c5a.rlib
8266920 libstd-bb943c5a.rlib
29573790 libsyntax-bb943c5a.rlib
895484 libterm-bb943c5a.rlib
This commit is contained in:
parent
ce02aa4942
commit
b74219964c
@ -914,7 +914,7 @@ fn write_sized_vuint<W: Write>(w: &mut W, n: usize, size: usize) -> EncodeResult
|
||||
}
|
||||
}
|
||||
|
||||
fn write_vuint<W: Write>(w: &mut W, n: usize) -> EncodeResult {
|
||||
pub fn write_vuint<W: Write>(w: &mut W, n: usize) -> EncodeResult {
|
||||
if n < 0x7f { return write_sized_vuint(w, n, 1); }
|
||||
if n < 0x4000 { return write_sized_vuint(w, n, 2); }
|
||||
if n < 0x200000 { return write_sized_vuint(w, n, 3); }
|
||||
|
@ -2150,7 +2150,7 @@ struct Stats {
|
||||
}
|
||||
|
||||
// Get the encoded string for a type
|
||||
pub fn encoded_ty<'tcx>(tcx: &ty::ctxt<'tcx>, t: Ty<'tcx>) -> String {
|
||||
pub fn encoded_ty<'tcx>(tcx: &ty::ctxt<'tcx>, t: Ty<'tcx>) -> Vec<u8> {
|
||||
let mut wr = Cursor::new(Vec::new());
|
||||
tyencode::enc_ty(&mut Encoder::new(&mut wr), &tyencode::ctxt {
|
||||
diag: tcx.sess.diagnostic(),
|
||||
@ -2158,5 +2158,5 @@ pub fn encoded_ty<'tcx>(tcx: &ty::ctxt<'tcx>, t: Ty<'tcx>) -> String {
|
||||
tcx: tcx,
|
||||
abbrevs: &RefCell::new(FnvHashMap())
|
||||
}, t);
|
||||
String::from_utf8(wr.into_inner()).unwrap()
|
||||
wr.into_inner()
|
||||
}
|
||||
|
@ -125,6 +125,12 @@ fn scan<F>(&mut self, mut is_last: F) -> &'a [u8]
|
||||
return &self.data[start_pos..end_pos];
|
||||
}
|
||||
|
||||
fn parse_vuint(&mut self) -> usize {
|
||||
let res = rbml::reader::vuint_at(self.data, self.pos).unwrap();
|
||||
self.pos = res.next;
|
||||
res.val
|
||||
}
|
||||
|
||||
fn parse_name(&mut self, last: char) -> ast::Name {
|
||||
fn is_last(b: char, c: char) -> bool { return c == b; }
|
||||
let bytes = self.scan(|a| is_last(last, a));
|
||||
@ -405,11 +411,8 @@ pub fn parse_ty(&mut self) -> Ty<'tcx> {
|
||||
// we return it (modulo closure types, see below). But if not, then we
|
||||
// jump to offset 123 and read the type from there.
|
||||
|
||||
let pos = self.parse_hex();
|
||||
assert_eq!(self.next(), ':');
|
||||
let len = self.parse_hex();
|
||||
assert_eq!(self.next(), '#');
|
||||
let key = ty::CReaderCacheKey {cnum: self.krate, pos: pos, len: len };
|
||||
let pos = self.parse_vuint();
|
||||
let key = ty::CReaderCacheKey { cnum: self.krate, pos: pos };
|
||||
match tcx.rcache.borrow().get(&key).cloned() {
|
||||
Some(tt) => {
|
||||
// If there is a closure buried in the type some where, then we
|
||||
@ -508,19 +511,6 @@ fn parse_param_space(&mut self) -> subst::ParamSpace {
|
||||
subst::ParamSpace::from_uint(self.parse_uint())
|
||||
}
|
||||
|
||||
fn parse_hex(&mut self) -> usize {
|
||||
let mut n = 0;
|
||||
loop {
|
||||
let cur = self.peek();
|
||||
if (cur < '0' || cur > '9') && (cur < 'a' || cur > 'f') { return n; }
|
||||
self.pos = self.pos + 1;
|
||||
n *= 16;
|
||||
if '0' <= cur && cur <= '9' {
|
||||
n += (cur as usize) - ('0' as usize);
|
||||
} else { n += 10 + (cur as usize) - ('a' as usize); }
|
||||
};
|
||||
}
|
||||
|
||||
fn parse_abi_set(&mut self) -> abi::Abi {
|
||||
assert_eq!(self.next(), '[');
|
||||
let bytes = self.scan(|c| c == ']');
|
||||
|
@ -14,7 +14,7 @@
|
||||
#![allow(non_camel_case_types)]
|
||||
|
||||
use std::cell::RefCell;
|
||||
use std::str;
|
||||
use std::io::Cursor;
|
||||
use std::io::prelude::*;
|
||||
|
||||
use middle::def_id::DefId;
|
||||
@ -31,7 +31,7 @@
|
||||
use syntax::ast;
|
||||
use syntax::diagnostic::SpanHandler;
|
||||
|
||||
use rbml::writer::Encoder;
|
||||
use rbml::writer::{self, Encoder};
|
||||
|
||||
macro_rules! mywrite { ($w:expr, $($arg:tt)*) => ({ write!($w.writer, $($arg)*); }) }
|
||||
|
||||
@ -48,14 +48,14 @@ pub struct ctxt<'a, 'tcx: 'a> {
|
||||
// Extra parameters are for converting to/from def_ids in the string rep.
|
||||
// Whatever format you choose should not contain pipe characters.
|
||||
pub struct ty_abbrev {
|
||||
s: String
|
||||
s: Vec<u8>
|
||||
}
|
||||
|
||||
pub type abbrev_map<'tcx> = RefCell<FnvHashMap<Ty<'tcx>, ty_abbrev>>;
|
||||
|
||||
pub fn enc_ty<'a, 'tcx>(w: &mut Encoder, cx: &ctxt<'a, 'tcx>, t: Ty<'tcx>) {
|
||||
match cx.abbrevs.borrow_mut().get(&t) {
|
||||
Some(a) => { w.writer.write_all(a.s.as_bytes()); return; }
|
||||
Some(a) => { w.writer.write_all(&a.s); return; }
|
||||
None => {}
|
||||
}
|
||||
|
||||
@ -167,23 +167,20 @@ pub fn enc_ty<'a, 'tcx>(w: &mut Encoder, cx: &ctxt<'a, 'tcx>, t: Ty<'tcx>) {
|
||||
|
||||
let end = w.mark_stable_position();
|
||||
let len = end - pos;
|
||||
fn estimate_sz(u: u64) -> u64 {
|
||||
let mut n = u;
|
||||
let mut len = 0;
|
||||
while n != 0 { len += 1; n = n >> 4; }
|
||||
return len;
|
||||
}
|
||||
let abbrev_len = 3 + estimate_sz(pos) + estimate_sz(len);
|
||||
|
||||
let buf: &mut [u8] = &mut [0; 16]; // vuint < 15 bytes
|
||||
let mut abbrev = Cursor::new(buf);
|
||||
abbrev.write_all(b"#");
|
||||
writer::write_vuint(&mut abbrev, pos as usize);
|
||||
|
||||
cx.abbrevs.borrow_mut().insert(t, ty_abbrev {
|
||||
s: if abbrev_len < len {
|
||||
format!("#{:x}:{:x}#", pos, len)
|
||||
s: if abbrev.position() < len {
|
||||
abbrev.get_ref()[..abbrev.position() as usize].to_owned()
|
||||
} else {
|
||||
// if the abbreviation is longer than the real type,
|
||||
// don't use #-notation. However, insert it here so
|
||||
// other won't have to `mark_stable_position`
|
||||
str::from_utf8(
|
||||
&w.writer.get_ref()[pos as usize..end as usize]
|
||||
).unwrap().to_owned()
|
||||
w.writer.get_ref()[pos as usize..end as usize].to_owned()
|
||||
}
|
||||
});
|
||||
}
|
||||
|
@ -366,7 +366,6 @@ pub fn autoderef(expr_id: NodeId, autoderef: u32) -> MethodCall {
|
||||
pub struct CReaderCacheKey {
|
||||
pub cnum: CrateNum,
|
||||
pub pos: usize,
|
||||
pub len: usize
|
||||
}
|
||||
|
||||
/// A restriction that certain types must be the same size. The use of
|
||||
|
@ -214,7 +214,7 @@ fn symbol_hash<'tcx>(tcx: &ty::ctxt<'tcx>,
|
||||
symbol_hasher.input_str(&meta[..]);
|
||||
}
|
||||
symbol_hasher.input_str("-");
|
||||
symbol_hasher.input_str(&encoder::encoded_ty(tcx, t));
|
||||
symbol_hasher.input(&encoder::encoded_ty(tcx, t));
|
||||
// Prefix with 'h' so that it never blends into adjacent digits
|
||||
let mut hash = String::from("h");
|
||||
hash.push_str(&truncated_hash_result(symbol_hasher));
|
||||
|
Loading…
Reference in New Issue
Block a user