2012-12-03 18:48:01 -06:00
|
|
|
// Copyright 2012 The Rust Project Developers. See the COPYRIGHT
|
|
|
|
// file at the top-level directory of this distribution and at
|
|
|
|
// http://rust-lang.org/COPYRIGHT.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
|
|
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
|
|
|
// option. This file may not be copied, modified, or distributed
|
|
|
|
// except according to those terms.
|
|
|
|
|
2014-03-21 20:05:05 -05:00
|
|
|
#![allow(non_camel_case_types)]
|
2013-05-17 17:28:44 -05:00
|
|
|
|
2014-08-27 20:46:52 -05:00
|
|
|
use std::hash::{Hash, Hasher};
|
|
|
|
use std::collections::HashMap;
|
2012-09-04 13:54:36 -05:00
|
|
|
use syntax::ast;
|
2013-08-14 08:54:35 -05:00
|
|
|
use syntax::visit;
|
|
|
|
use syntax::visit::Visitor;
|
2012-12-23 16:41:37 -06:00
|
|
|
|
2014-02-19 21:08:12 -06:00
|
|
|
use time;
|
2013-03-21 04:50:02 -05:00
|
|
|
|
2013-11-19 15:22:03 -06:00
|
|
|
pub fn time<T, U>(do_it: bool, what: &str, u: U, f: |U| -> T) -> T {
|
Implement LTO
This commit implements LTO for rust leveraging LLVM's passes. What this means
is:
* When compiling an rlib, in addition to insdering foo.o into the archive, also
insert foo.bc (the LLVM bytecode) of the optimized module.
* When the compiler detects the -Z lto option, it will attempt to perform LTO on
a staticlib or binary output. The compiler will emit an error if a dylib or
rlib output is being generated.
* The actual act of performing LTO is as follows:
1. Force all upstream libraries to have an rlib version available.
2. Load the bytecode of each upstream library from the rlib.
3. Link all this bytecode into the current LLVM module (just using llvm
apis)
4. Run an internalization pass which internalizes all symbols except those
found reachable for the local crate of compilation.
5. Run the LLVM LTO pass manager over this entire module
6a. If assembling an archive, then add all upstream rlibs into the output
archive. This ignores all of the object/bitcode/metadata files rust
generated and placed inside the rlibs.
6b. If linking a binary, create copies of all upstream rlibs, remove the
rust-generated object-file, and then link everything as usual.
As I have explained in #10741, this process is excruciatingly slow, so this is
*not* turned on by default, and it is also why I have decided to hide it behind
a -Z flag for now. The good news is that the binary sizes are about as small as
they can be as a result of LTO, so it's definitely working.
Closes #10741
Closes #10740
2013-12-03 01:19:29 -06:00
|
|
|
local_data_key!(depth: uint);
|
2013-09-27 21:46:09 -05:00
|
|
|
if !do_it { return f(u); }
|
Implement LTO
This commit implements LTO for rust leveraging LLVM's passes. What this means
is:
* When compiling an rlib, in addition to insdering foo.o into the archive, also
insert foo.bc (the LLVM bytecode) of the optimized module.
* When the compiler detects the -Z lto option, it will attempt to perform LTO on
a staticlib or binary output. The compiler will emit an error if a dylib or
rlib output is being generated.
* The actual act of performing LTO is as follows:
1. Force all upstream libraries to have an rlib version available.
2. Load the bytecode of each upstream library from the rlib.
3. Link all this bytecode into the current LLVM module (just using llvm
apis)
4. Run an internalization pass which internalizes all symbols except those
found reachable for the local crate of compilation.
5. Run the LLVM LTO pass manager over this entire module
6a. If assembling an archive, then add all upstream rlibs into the output
archive. This ignores all of the object/bitcode/metadata files rust
generated and placed inside the rlibs.
6b. If linking a binary, create copies of all upstream rlibs, remove the
rust-generated object-file, and then link everything as usual.
As I have explained in #10741, this process is excruciatingly slow, so this is
*not* turned on by default, and it is also why I have decided to hide it behind
a -Z flag for now. The good news is that the binary sizes are about as small as
they can be as a result of LTO, so it's definitely working.
Closes #10741
Closes #10740
2013-12-03 01:19:29 -06:00
|
|
|
|
2014-04-28 22:36:08 -05:00
|
|
|
let old = depth.get().map(|d| *d).unwrap_or(0);
|
|
|
|
depth.replace(Some(old + 1));
|
Implement LTO
This commit implements LTO for rust leveraging LLVM's passes. What this means
is:
* When compiling an rlib, in addition to insdering foo.o into the archive, also
insert foo.bc (the LLVM bytecode) of the optimized module.
* When the compiler detects the -Z lto option, it will attempt to perform LTO on
a staticlib or binary output. The compiler will emit an error if a dylib or
rlib output is being generated.
* The actual act of performing LTO is as follows:
1. Force all upstream libraries to have an rlib version available.
2. Load the bytecode of each upstream library from the rlib.
3. Link all this bytecode into the current LLVM module (just using llvm
apis)
4. Run an internalization pass which internalizes all symbols except those
found reachable for the local crate of compilation.
5. Run the LLVM LTO pass manager over this entire module
6a. If assembling an archive, then add all upstream rlibs into the output
archive. This ignores all of the object/bitcode/metadata files rust
generated and placed inside the rlibs.
6b. If linking a binary, create copies of all upstream rlibs, remove the
rust-generated object-file, and then link everything as usual.
As I have explained in #10741, this process is excruciatingly slow, so this is
*not* turned on by default, and it is also why I have decided to hide it behind
a -Z flag for now. The good news is that the binary sizes are about as small as
they can be as a result of LTO, so it's definitely working.
Closes #10741
Closes #10740
2013-12-03 01:19:29 -06:00
|
|
|
|
2014-02-13 21:51:26 -06:00
|
|
|
let start = time::precise_time_s();
|
2013-09-27 21:46:09 -05:00
|
|
|
let rv = f(u);
|
2014-02-13 21:51:26 -06:00
|
|
|
let end = time::precise_time_s();
|
Implement LTO
This commit implements LTO for rust leveraging LLVM's passes. What this means
is:
* When compiling an rlib, in addition to insdering foo.o into the archive, also
insert foo.bc (the LLVM bytecode) of the optimized module.
* When the compiler detects the -Z lto option, it will attempt to perform LTO on
a staticlib or binary output. The compiler will emit an error if a dylib or
rlib output is being generated.
* The actual act of performing LTO is as follows:
1. Force all upstream libraries to have an rlib version available.
2. Load the bytecode of each upstream library from the rlib.
3. Link all this bytecode into the current LLVM module (just using llvm
apis)
4. Run an internalization pass which internalizes all symbols except those
found reachable for the local crate of compilation.
5. Run the LLVM LTO pass manager over this entire module
6a. If assembling an archive, then add all upstream rlibs into the output
archive. This ignores all of the object/bitcode/metadata files rust
generated and placed inside the rlibs.
6b. If linking a binary, create copies of all upstream rlibs, remove the
rust-generated object-file, and then link everything as usual.
As I have explained in #10741, this process is excruciatingly slow, so this is
*not* turned on by default, and it is also why I have decided to hide it behind
a -Z flag for now. The good news is that the binary sizes are about as small as
they can be as a result of LTO, so it's definitely working.
Closes #10741
Closes #10740
2013-12-03 01:19:29 -06:00
|
|
|
|
|
|
|
println!("{}time: {:3.3f} s\t{}", " ".repeat(old), end - start, what);
|
2014-04-28 22:36:08 -05:00
|
|
|
depth.replace(Some(old));
|
Implement LTO
This commit implements LTO for rust leveraging LLVM's passes. What this means
is:
* When compiling an rlib, in addition to insdering foo.o into the archive, also
insert foo.bc (the LLVM bytecode) of the optimized module.
* When the compiler detects the -Z lto option, it will attempt to perform LTO on
a staticlib or binary output. The compiler will emit an error if a dylib or
rlib output is being generated.
* The actual act of performing LTO is as follows:
1. Force all upstream libraries to have an rlib version available.
2. Load the bytecode of each upstream library from the rlib.
3. Link all this bytecode into the current LLVM module (just using llvm
apis)
4. Run an internalization pass which internalizes all symbols except those
found reachable for the local crate of compilation.
5. Run the LLVM LTO pass manager over this entire module
6a. If assembling an archive, then add all upstream rlibs into the output
archive. This ignores all of the object/bitcode/metadata files rust
generated and placed inside the rlibs.
6b. If linking a binary, create copies of all upstream rlibs, remove the
rust-generated object-file, and then link everything as usual.
As I have explained in #10741, this process is excruciatingly slow, so this is
*not* turned on by default, and it is also why I have decided to hide it behind
a -Z flag for now. The good news is that the binary sizes are about as small as
they can be as a result of LTO, so it's definitely working.
Closes #10741
Closes #10740
2013-12-03 01:19:29 -06:00
|
|
|
|
2013-03-21 04:50:02 -05:00
|
|
|
rv
|
|
|
|
}
|
2011-06-15 13:19:50 -05:00
|
|
|
|
2013-11-19 15:22:03 -06:00
|
|
|
pub fn indent<R>(op: || -> R) -> R {
|
2012-04-05 22:59:07 -05:00
|
|
|
// Use in conjunction with the log post-processor like `src/etc/indenter`
|
|
|
|
// to make debug output more readable.
|
2013-10-21 15:08:31 -05:00
|
|
|
debug!(">>");
|
2012-10-23 13:28:20 -05:00
|
|
|
let r = op();
|
2013-10-21 15:08:31 -05:00
|
|
|
debug!("<< (Result = {:?})", r);
|
2013-02-15 03:14:34 -06:00
|
|
|
r
|
2012-04-05 22:59:07 -05:00
|
|
|
}
|
|
|
|
|
2014-06-06 08:51:42 -05:00
|
|
|
pub struct Indenter {
|
|
|
|
_cannot_construct_outside_of_this_module: ()
|
2013-02-27 18:13:53 -06:00
|
|
|
}
|
|
|
|
|
2014-06-06 08:51:42 -05:00
|
|
|
impl Drop for Indenter {
|
2013-10-21 15:08:31 -05:00
|
|
|
fn drop(&mut self) { debug!("<<"); }
|
2012-04-05 22:59:07 -05:00
|
|
|
}
|
|
|
|
|
2014-06-06 08:51:42 -05:00
|
|
|
pub fn indenter() -> Indenter {
|
2013-10-21 15:08:31 -05:00
|
|
|
debug!(">>");
|
2014-06-06 08:51:42 -05:00
|
|
|
Indenter { _cannot_construct_outside_of_this_module: () }
|
2012-04-05 22:59:07 -05:00
|
|
|
}
|
|
|
|
|
2013-12-10 01:16:18 -06:00
|
|
|
struct LoopQueryVisitor<'a> {
|
2014-04-07 15:30:48 -05:00
|
|
|
p: |&ast::Expr_|: 'a -> bool,
|
2013-09-25 03:55:04 -05:00
|
|
|
flag: bool,
|
2013-08-14 08:54:35 -05:00
|
|
|
}
|
|
|
|
|
2014-09-09 17:54:36 -05:00
|
|
|
impl<'a, 'v> Visitor<'v> for LoopQueryVisitor<'a> {
|
2014-09-12 05:10:30 -05:00
|
|
|
fn visit_expr(&mut self, e: &ast::Expr) {
|
2013-09-25 03:55:04 -05:00
|
|
|
self.flag |= (self.p)(&e.node);
|
2012-08-06 14:34:08 -05:00
|
|
|
match e.node {
|
2012-06-20 20:50:44 -05:00
|
|
|
// Skip inner loops, since a break in the inner loop isn't a
|
|
|
|
// break inside the outer loop
|
2014-07-21 22:54:28 -05:00
|
|
|
ast::ExprLoop(..) | ast::ExprWhile(..) | ast::ExprForLoop(..) => {}
|
2014-09-12 05:10:30 -05:00
|
|
|
_ => visit::walk_expr(self, e)
|
2012-06-20 20:50:44 -05:00
|
|
|
}
|
2013-08-14 08:54:35 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Takes a predicate p, returns true iff p is true for any subexpressions
|
|
|
|
// of b -- skipping any inner loops (loop, while, loop_body)
|
2014-01-06 06:00:46 -06:00
|
|
|
pub fn loop_query(b: &ast::Block, p: |&ast::Expr_| -> bool) -> bool {
|
2013-08-29 20:04:17 -05:00
|
|
|
let mut v = LoopQueryVisitor {
|
|
|
|
p: p,
|
2013-09-25 03:55:04 -05:00
|
|
|
flag: false,
|
2013-08-29 20:04:17 -05:00
|
|
|
};
|
2014-09-12 05:10:30 -05:00
|
|
|
visit::walk_block(&mut v, b);
|
2013-09-25 03:55:04 -05:00
|
|
|
return v.flag;
|
2012-06-14 14:24:56 -05:00
|
|
|
}
|
|
|
|
|
2013-12-10 01:16:18 -06:00
|
|
|
struct BlockQueryVisitor<'a> {
|
2014-04-07 15:30:48 -05:00
|
|
|
p: |&ast::Expr|: 'a -> bool,
|
2013-09-25 03:55:04 -05:00
|
|
|
flag: bool,
|
2013-08-14 08:54:35 -05:00
|
|
|
}
|
|
|
|
|
2014-09-09 17:54:36 -05:00
|
|
|
impl<'a, 'v> Visitor<'v> for BlockQueryVisitor<'a> {
|
2014-09-12 05:10:30 -05:00
|
|
|
fn visit_expr(&mut self, e: &ast::Expr) {
|
2013-09-25 03:55:04 -05:00
|
|
|
self.flag |= (self.p)(e);
|
2014-09-12 05:10:30 -05:00
|
|
|
visit::walk_expr(self, e)
|
2013-08-14 08:54:35 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-10-18 14:20:18 -05:00
|
|
|
// Takes a predicate p, returns true iff p is true for any subexpressions
|
|
|
|
// of b -- skipping any inner loops (loop, while, loop_body)
|
2014-09-07 12:09:06 -05:00
|
|
|
pub fn block_query(b: &ast::Block, p: |&ast::Expr| -> bool) -> bool {
|
2013-08-29 20:04:17 -05:00
|
|
|
let mut v = BlockQueryVisitor {
|
|
|
|
p: p,
|
2013-09-25 03:55:04 -05:00
|
|
|
flag: false,
|
2013-08-29 20:04:17 -05:00
|
|
|
};
|
2014-09-12 05:10:30 -05:00
|
|
|
visit::walk_block(&mut v, &*b);
|
2013-09-25 03:55:04 -05:00
|
|
|
return v.flag;
|
2012-03-10 22:34:57 -06:00
|
|
|
}
|
2014-08-27 20:46:52 -05:00
|
|
|
|
|
|
|
// K: Eq + Hash<S>, V, S, H: Hasher<S>
|
|
|
|
pub fn can_reach<S,H:Hasher<S>,T:Eq+Clone+Hash<S>>(
|
|
|
|
edges_map: &HashMap<T,Vec<T>,H>,
|
|
|
|
source: T,
|
|
|
|
destination: T)
|
|
|
|
-> bool
|
|
|
|
{
|
|
|
|
/*!
|
|
|
|
* Determines whether there exists a path from `source` to
|
|
|
|
* `destination`. The graph is defined by the `edges_map`, which
|
|
|
|
* maps from a node `S` to a list of its adjacent nodes `T`.
|
|
|
|
*
|
|
|
|
* Efficiency note: This is implemented in an inefficient way
|
|
|
|
* because it is typically invoked on very small graphs. If the graphs
|
|
|
|
* become larger, a more efficient graph representation and algorithm
|
|
|
|
* would probably be advised.
|
|
|
|
*/
|
|
|
|
|
|
|
|
if source == destination {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Do a little breadth-first-search here. The `queue` list
|
|
|
|
// doubles as a way to detect if we've seen a particular FR
|
|
|
|
// before. Note that we expect this graph to be an *extremely
|
|
|
|
// shallow* tree.
|
|
|
|
let mut queue = vec!(source);
|
|
|
|
let mut i = 0;
|
|
|
|
while i < queue.len() {
|
|
|
|
match edges_map.find(queue.get(i)) {
|
|
|
|
Some(edges) => {
|
|
|
|
for target in edges.iter() {
|
|
|
|
if *target == destination {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
if !queue.iter().any(|x| x == target) {
|
|
|
|
queue.push((*target).clone());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
None => {}
|
|
|
|
}
|
|
|
|
i += 1;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|