2012-12-13 13:05:22 -08:00
|
|
|
|
2014-02-07 20:08:32 +01:00
|
|
|
// Copyright 2012-2014 The Rust Project Developers. See the COPYRIGHT
|
2012-12-10 17:32:48 -08:00
|
|
|
// file at the top-level directory of this distribution and at
|
|
|
|
// http://rust-lang.org/COPYRIGHT.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
|
|
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
|
|
|
// option. This file may not be copied, modified, or distributed
|
|
|
|
// except according to those terms.
|
|
|
|
|
2013-12-11 23:17:54 -08:00
|
|
|
#[feature(managed_boxes)];
|
|
|
|
|
2014-02-19 19:29:58 -08:00
|
|
|
extern crate collections;
|
|
|
|
|
2014-03-05 15:28:08 -08:00
|
|
|
|
2011-07-12 14:19:38 -07:00
|
|
|
/**
|
|
|
|
A somewhat reduced test case to expose some Valgrind issues.
|
|
|
|
|
|
|
|
This originally came from the word-count benchmark.
|
|
|
|
*/
|
|
|
|
|
2013-01-08 19:37:25 -08:00
|
|
|
/// Mapper used by this test case: hands the file name to `emit` as the key,
/// paired with the constant value `~"1"`. `emit` is invoked exactly once.
pub fn map(filename: ~str, emit: map_reduce::putter) {
    emit(filename, ~"1");
}
|
2011-07-12 14:19:38 -07:00
|
|
|
|
|
|
|
mod map_reduce {
|
2014-02-19 19:29:58 -08:00
|
|
|
use collections::HashMap;
|
2013-05-24 19:35:29 -07:00
|
|
|
use std::str;
|
|
|
|
use std::task;
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2014-04-02 09:47:11 -07:00
|
|
|
pub type putter<'a> = |~str, ~str|: 'a;
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2012-12-28 17:17:05 -08:00
|
|
|
pub type mapper = extern fn(~str, putter);
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2014-03-05 14:02:44 -08:00
|
|
|
enum ctrl_proto { find_reducer(Vec<u8>, Sender<int>), mapper_done, }
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2014-03-05 14:02:44 -08:00
|
|
|
fn start_mappers(ctrl: Sender<ctrl_proto>, inputs: Vec<~str>) {
|
2013-08-03 12:45:23 -04:00
|
|
|
for i in inputs.iter() {
|
2013-01-28 23:54:39 -08:00
|
|
|
let ctrl = ctrl.clone();
|
2013-03-15 18:27:15 -04:00
|
|
|
let i = i.clone();
|
2013-11-21 23:36:52 -08:00
|
|
|
task::spawn(proc() map_task(ctrl.clone(), i.clone()) );
|
2012-01-04 21:14:53 -08:00
|
|
|
}
|
2011-07-12 14:19:38 -07:00
|
|
|
}
|
|
|
|
|
2014-03-09 14:58:32 -07:00
|
|
|
fn map_task(ctrl: Sender<ctrl_proto>, input: ~str) {
|
2013-12-31 15:46:27 -08:00
|
|
|
let mut intermediates = HashMap::new();
|
2013-03-23 21:22:00 -04:00
|
|
|
|
2013-12-05 18:19:06 -08:00
|
|
|
fn emit(im: &mut HashMap<~str, int>,
|
2014-03-09 14:58:32 -07:00
|
|
|
ctrl: Sender<ctrl_proto>, key: ~str,
|
2013-03-23 21:22:00 -04:00
|
|
|
_val: ~str) {
|
|
|
|
if im.contains_key(&key) {
|
|
|
|
return;
|
2011-07-12 14:19:38 -07:00
|
|
|
}
|
2014-03-09 14:58:32 -07:00
|
|
|
let (tx, rx) = channel();
|
log: Introduce liblog, the old std::logging
This commit moves all logging out of the standard library into an external
crate. This crate is the new crate which is responsible for all logging macros
and logging implementation. A few reasons for this change are:
* The crate map has always been a bit of a code smell among rust programs. It
has difficulty being loaded on almost all platforms, and it's used almost
exclusively for logging and only logging. Removing the crate map is one of the
end goals of this movement.
* The compiler has a fair bit of special support for logging. It has the
__log_level() expression as well as generating a global word per module
specifying the log level. This is unfairly favoring the built-in logging
system, and is much better done purely in libraries instead of the compiler
itself.
* Initialization of logging is much easier to do if there is no reliance on a
magical crate map being available to set module log levels.
* If the logging library can be written outside of the standard library, there's
no reason that it shouldn't be. It's likely that we're not going to build the
highest quality logging library of all time, so third-party libraries should
be able to provide just as high-quality logging systems as the default one
provided in the rust distribution.
With a migration such as this, the change does not come for free. There are some
subtle changes in the behavior of liblog vs the previous logging macros:
* The core change of this migration is that there is no longer a physical
log-level per module. This concept is still emulated (it is quite useful), but
there is now only a global log level, not a local one. This global log level
is a reflection of the maximum of all log levels specified. The previously
generated logging code looked like:
if specified_level <= __module_log_level() {
println!(...)
}
The newly generated code looks like:
if specified_level <= ::log::LOG_LEVEL {
if ::log::module_enabled(module_path!()) {
println!(...)
}
}
Notably, the first layer of checking is still intended to be "super fast" in
that it's just a load of a global word and a compare. The second layer of
checking is executed to determine if the current module does indeed have
logging turned on.
This means that if any module has a debug log level turned on, all modules
with debug log levels get a little bit slower (they all do more expensive
dynamic checks to determine if they're turned on or not).
Semantically, this migration brings no change in this respect, but
runtime-wise, this will have a perf impact on some code.
* A `RUST_LOG=::help` directive will no longer print out a list of all modules
that can be logged. This is because the crate map will no longer specify the
log levels of all modules, so the list of modules is not known. Additionally,
warnings can no longer be provided if a malformed logging directive was
supplied.
The new "hello world" for logging looks like:
#[phase(syntax, link)]
extern crate log;
fn main() {
debug!("Hello, world!");
}
2014-03-08 22:11:44 -08:00
|
|
|
println!("sending find_reducer");
|
2014-03-05 15:28:08 -08:00
|
|
|
ctrl.send(find_reducer(Vec::from_slice(key.as_bytes()), tx));
|
log: Introduce liblog, the old std::logging
This commit moves all logging out of the standard library into an external
crate. This crate is the new crate which is responsible for all logging macros
and logging implementation. A few reasons for this change are:
* The crate map has always been a bit of a code smell among rust programs. It
has difficulty being loaded on almost all platforms, and it's used almost
exclusively for logging and only logging. Removing the crate map is one of the
end goals of this movement.
* The compiler has a fair bit of special support for logging. It has the
__log_level() expression as well as generating a global word per module
specifying the log level. This is unfairly favoring the built-in logging
system, and is much better done purely in libraries instead of the compiler
itself.
* Initialization of logging is much easier to do if there is no reliance on a
magical crate map being available to set module log levels.
* If the logging library can be written outside of the standard library, there's
no reason that it shouldn't be. It's likely that we're not going to build the
highest quality logging library of all time, so third-party libraries should
be able to provide just as high-quality logging systems as the default one
provided in the rust distribution.
With a migration such as this, the change does not come for free. There are some
subtle changes in the behavior of liblog vs the previous logging macros:
* The core change of this migration is that there is no longer a physical
log-level per module. This concept is still emulated (it is quite useful), but
there is now only a global log level, not a local one. This global log level
is a reflection of the maximum of all log levels specified. The previously
generated logging code looked like:
if specified_level <= __module_log_level() {
println!(...)
}
The newly generated code looks like:
if specified_level <= ::log::LOG_LEVEL {
if ::log::module_enabled(module_path!()) {
println!(...)
}
}
Notably, the first layer of checking is still intended to be "super fast" in
that it's just a load of a global word and a compare. The second layer of
checking is executed to determine if the current module does indeed have
logging turned on.
This means that if any module has a debug log level turned on, all modules
with debug log levels get a little bit slower (they all do more expensive
dynamic checks to determine if they're turned on or not).
Semantically, this migration brings no change in this respect, but
runtime-wise, this will have a perf impact on some code.
* A `RUST_LOG=::help` directive will no longer print out a list of all modules
that can be logged. This is because the crate map will no longer specify the
log levels of all modules, so the list of modules is not known. Additionally,
warnings can no longer be provided if a malformed logging directive was
supplied.
The new "hello world" for logging looks like:
#[phase(syntax, link)]
extern crate log;
fn main() {
debug!("Hello, world!");
}
2014-03-08 22:11:44 -08:00
|
|
|
println!("receiving");
|
2014-03-09 14:58:32 -07:00
|
|
|
let c = rx.recv();
|
log: Introduce liblog, the old std::logging
This commit moves all logging out of the standard library into an external
crate. This crate is the new crate which is responsible for all logging macros
and logging implementation. A few reasons for this change are:
* The crate map has always been a bit of a code smell among rust programs. It
has difficulty being loaded on almost all platforms, and it's used almost
exclusively for logging and only logging. Removing the crate map is one of the
end goals of this movement.
* The compiler has a fair bit of special support for logging. It has the
__log_level() expression as well as generating a global word per module
specifying the log level. This is unfairly favoring the built-in logging
system, and is much better done purely in libraries instead of the compiler
itself.
* Initialization of logging is much easier to do if there is no reliance on a
magical crate map being available to set module log levels.
* If the logging library can be written outside of the standard library, there's
no reason that it shouldn't be. It's likely that we're not going to build the
highest quality logging library of all time, so third-party libraries should
be able to provide just as high-quality logging systems as the default one
provided in the rust distribution.
With a migration such as this, the change does not come for free. There are some
subtle changes in the behavior of liblog vs the previous logging macros:
* The core change of this migration is that there is no longer a physical
log-level per module. This concept is still emulated (it is quite useful), but
there is now only a global log level, not a local one. This global log level
is a reflection of the maximum of all log levels specified. The previously
generated logging code looked like:
if specified_level <= __module_log_level() {
println!(...)
}
The newly generated code looks like:
if specified_level <= ::log::LOG_LEVEL {
if ::log::module_enabled(module_path!()) {
println!(...)
}
}
Notably, the first layer of checking is still intended to be "super fast" in
that it's just a load of a global word and a compare. The second layer of
checking is executed to determine if the current module does indeed have
logging turned on.
This means that if any module has a debug log level turned on, all modules
with debug log levels get a little bit slower (they all do more expensive
dynamic checks to determine if they're turned on or not).
Semantically, this migration brings no change in this respect, but
runtime-wise, this will have a perf impact on some code.
* A `RUST_LOG=::help` directive will no longer print out a list of all modules
that can be logged. This is because the crate map will no longer specify the
log levels of all modules, so the list of modules is not known. Additionally,
warnings can no longer be provided if a malformed logging directive was
supplied.
The new "hello world" for logging looks like:
#[phase(syntax, link)]
extern crate log;
fn main() {
debug!("Hello, world!");
}
2014-03-08 22:11:44 -08:00
|
|
|
println!("{:?}", c);
|
2013-03-23 21:22:00 -04:00
|
|
|
im.insert(key, c);
|
2011-07-12 14:19:38 -07:00
|
|
|
}
|
|
|
|
|
2013-01-28 23:54:39 -08:00
|
|
|
let ctrl_clone = ctrl.clone();
|
2013-12-31 15:46:27 -08:00
|
|
|
::map(input, |a,b| emit(&mut intermediates, ctrl.clone(), a, b) );
|
2013-01-28 23:54:39 -08:00
|
|
|
ctrl_clone.send(mapper_done);
|
2011-07-12 14:19:38 -07:00
|
|
|
}
|
|
|
|
|
2014-03-05 14:02:44 -08:00
|
|
|
pub fn map_reduce(inputs: Vec<~str>) {
|
2014-03-09 14:58:32 -07:00
|
|
|
let (tx, rx) = channel();
|
2011-07-12 14:19:38 -07:00
|
|
|
|
|
|
|
// This task becomes the master control task. It spawns others
|
|
|
|
// to do the rest.
|
|
|
|
|
2013-04-03 09:28:36 -04:00
|
|
|
let mut reducers: HashMap<~str, int>;
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2013-04-03 09:28:36 -04:00
|
|
|
reducers = HashMap::new();
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2014-03-09 14:58:32 -07:00
|
|
|
start_mappers(tx, inputs.clone());
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2013-05-14 18:52:12 +09:00
|
|
|
let mut num_mappers = inputs.len() as int;
|
2011-07-12 14:19:38 -07:00
|
|
|
|
2011-07-27 14:19:39 +02:00
|
|
|
while num_mappers > 0 {
|
2014-03-09 14:58:32 -07:00
|
|
|
match rx.recv() {
|
2012-08-03 19:59:04 -07:00
|
|
|
mapper_done => { num_mappers -= 1; }
|
|
|
|
find_reducer(k, cc) => {
|
2013-12-05 18:19:06 -08:00
|
|
|
let mut c;
|
2014-03-05 15:28:08 -08:00
|
|
|
match reducers.find(&str::from_utf8(k.as_slice()).unwrap()
|
|
|
|
.to_owned()) {
|
2013-12-05 18:19:06 -08:00
|
|
|
Some(&_c) => { c = _c; }
|
|
|
|
None => { c = 0; }
|
|
|
|
}
|
2013-01-28 23:54:39 -08:00
|
|
|
cc.send(c);
|
2011-07-27 14:19:39 +02:00
|
|
|
}
|
2011-07-12 14:19:38 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-02-01 19:43:17 -08:00
|
|
|
pub fn main() {
|
2014-03-05 14:02:44 -08:00
|
|
|
map_reduce::map_reduce(vec!(~"../src/test/run-pass/hashmap-memory.rs"));
|
2011-08-15 21:54:52 -07:00
|
|
|
}
|