// Copyright 2016 The Rust Project Developers. See the COPYRIGHT // file at the top-level directory of this distribution and at // http://rust-lang.org/COPYRIGHT. // // Licensed under the Apache License, Version 2.0 or the MIT license // , at your // option. This file may not be copied, modified, or distributed // except according to those terms. //! This is the implementation of the pass which transforms generators into state machines. //! //! MIR generation for generators creates a function which has a self argument which //! passes by value. This argument is effectively a generator type which only contains upvars and //! is only used for this argument inside the MIR for the generator. //! It is passed by value to enable upvars to be moved out of it. Drop elaboration runs on that //! MIR before this pass and creates drop flags for MIR locals. //! It will also drop the generator argument (which only consists of upvars) if any of the upvars //! are moved out of. This pass elaborates the drops of upvars / generator argument in the case //! that none of the upvars were moved out of. This is because we cannot have any drops of this //! generator in the MIR, since it is used to create the drop glue for the generator. We'd get //! infinite recursion otherwise. //! //! This pass creates the implementation for the Generator::resume function and the drop shim //! for the generator based on the MIR input. It converts the generator argument from Self to //! &mut Self adding derefs in the MIR as needed. It computes the final layout of the generator //! struct which looks like this: //! First upvars are stored //! It is followed by the generator state field. //! Then finally the MIR locals which are live across a suspension point are stored. //! //! struct Generator { //! upvars..., //! state: u32, //! mir_locals..., //! } //! //! This pass computes the meaning of the state field and the MIR locals which are live //! across a suspension point. There are however two hardcoded generator states: //! 0 - Generator have not been resumed yet //! 1 - Generator has been poisoned //! //! It also rewrites `return x` and `yield y` as setting a new generator state and returning //! GeneratorState::Complete(x) and GeneratorState::Yielded(y) respectively. //! MIR locals which are live across a suspension point are moved to the generator struct //! with references to them being updated with references to the generator struct. //! //! The pass creates two functions which have a switch on the generator state giving //! the action to take. //! //! One of them is the implementation of Generator::resume. //! For generators which have already returned it panics. //! For generators with state 0 (unresumed) it starts the execution of the generator. //! For generators with state 1 (poisoned) it panics. //! Otherwise it continues the execution from the last suspension point. //! //! The other function is the drop glue for the generator. //! For generators which have already returned it does nothing. //! For generators with state 0 (unresumed) it drops the upvars of the generator. //! For generators with state 1 (poisoned) it does nothing. //! Otherwise it drops all the values in scope at the last suspension point. use rustc::hir; use rustc::hir::def_id::DefId; use rustc::middle::const_val::ConstVal; use rustc::mir::*; use rustc::mir::transform::{MirPass, MirSource}; use rustc::mir::visit::{LvalueContext, MutVisitor}; use rustc::ty::{self, TyCtxt, AdtDef, Ty, GeneratorInterior}; use rustc::ty::subst::{Kind, Substs}; use util::dump_mir; use util::liveness; use rustc_const_math::ConstInt; use rustc_data_structures::indexed_vec::Idx; use std::collections::HashMap; use std::borrow::Cow; use std::iter::once; use std::mem; use transform::simplify; use transform::no_landing_pads::no_landing_pads; pub struct StateTransform; struct RenameLocalVisitor { from: Local, to: Local, } impl<'tcx> MutVisitor<'tcx> for RenameLocalVisitor { fn visit_local(&mut self, local: &mut Local) { if *local == self.from { *local = self.to; } } } struct DerefArgVisitor; impl<'tcx> MutVisitor<'tcx> for DerefArgVisitor { fn visit_lvalue(&mut self, lvalue: &mut Lvalue<'tcx>, context: LvalueContext<'tcx>, location: Location) { if *lvalue == Lvalue::Local(self_arg()) { *lvalue = Lvalue::Projection(Box::new(Projection { base: lvalue.clone(), elem: ProjectionElem::Deref, })); } else { self.super_lvalue(lvalue, context, location); } } } fn self_arg() -> Local { Local::new(1) } struct TransformVisitor<'a, 'tcx: 'a> { tcx: TyCtxt<'a, 'tcx, 'tcx>, state_adt_ref: &'tcx AdtDef, state_substs: &'tcx Substs<'tcx>, // The index of the generator state in the generator struct state_field: usize, // Mapping from Local to (type of local, generator struct index) remap: HashMap, usize)>, // The number of generator states. 0 is unresumed, 1 is poisoned. So this is initialized to 2 bb_target_count: u32, // Map from a (which block to resume execution at, which block to use to drop the generator) // to a generator state bb_targets: HashMap<(BasicBlock, Option), u32>, // The original RETURN_POINTER local new_ret_local: Local, // The block to resume execution when for Return return_block: BasicBlock, } impl<'a, 'tcx> TransformVisitor<'a, 'tcx> { // Make a GeneratorState rvalue fn make_state(&self, idx: usize, val: Operand<'tcx>) -> Rvalue<'tcx> { let adt = AggregateKind::Adt(self.state_adt_ref, idx, self.state_substs, None); Rvalue::Aggregate(box adt, vec![val]) } // Create a Lvalue referencing a generator struct field fn make_field(&self, idx: usize, ty: Ty<'tcx>) -> Lvalue<'tcx> { let base = Lvalue::Local(self_arg()); let field = Projection { base: base, elem: ProjectionElem::Field(Field::new(idx), ty), }; Lvalue::Projection(Box::new(field)) } // Create a statement which changes the generator state fn set_state(&self, state_disc: u32, source_info: SourceInfo) -> Statement<'tcx> { let state = self.make_field(self.state_field, self.tcx.types.u32); let val = Operand::Constant(box Constant { span: source_info.span, ty: self.tcx.types.u32, literal: Literal::Value { value: ConstVal::Integral(ConstInt::U32(state_disc)), }, }); Statement { source_info, kind: StatementKind::Assign(state, Rvalue::Use(val)), } } } impl<'a, 'tcx> MutVisitor<'tcx> for TransformVisitor<'a, 'tcx> { fn visit_lvalue(&mut self, lvalue: &mut Lvalue<'tcx>, context: LvalueContext<'tcx>, location: Location) { if let Lvalue::Local(l) = *lvalue { // Replace an Local in the remap with a generator struct access if let Some(&(ty, idx)) = self.remap.get(&l) { *lvalue = self.make_field(idx, ty); } } else { self.super_lvalue(lvalue, context, location); } } fn visit_basic_block_data(&mut self, block: BasicBlock, data: &mut BasicBlockData<'tcx>) { // Remove StorageLive and StorageDead statements for remapped locals data.retain_statements(|s| { match s.kind { StatementKind::StorageLive(ref l) | StatementKind::StorageDead(ref l) => { if let Lvalue::Local(l) = *l { !self.remap.contains_key(&l) } else { true } } _ => true } }); let ret_val = match data.terminator().kind { TerminatorKind::Return => Some((1, self.return_block, Operand::Consume(Lvalue::Local(self.new_ret_local)), None)), TerminatorKind::Yield { ref value, resume, drop } => Some((0, resume, value.clone(), drop)), _ => None }; if let Some((state_idx, resume, v, drop)) = ret_val { let bb_idx = { let bb_targets = &mut self.bb_targets; let bb_target = &mut self.bb_target_count; *bb_targets.entry((resume, drop)).or_insert_with(|| { let target = *bb_target; *bb_target = target.checked_add(1).unwrap(); target }) }; let source_info = data.terminator().source_info; data.statements.push(self.set_state(bb_idx, source_info)); data.statements.push(Statement { source_info, kind: StatementKind::Assign(Lvalue::Local(RETURN_POINTER), self.make_state(state_idx, v)), }); data.terminator.as_mut().unwrap().kind = TerminatorKind::Return; } self.super_basic_block_data(block, data); } } fn make_generator_state_argument_indirect<'a, 'tcx>( tcx: TyCtxt<'a, 'tcx, 'tcx>, def_id: DefId, mir: &mut Mir<'tcx>) { let gen_ty = mir.local_decls.raw[1].ty; let region = ty::ReFree(ty::FreeRegion { scope: def_id, bound_region: ty::BoundRegion::BrEnv, }); let region = tcx.mk_region(region); let ref_gen_ty = tcx.mk_ref(region, ty::TypeAndMut { ty: gen_ty, mutbl: hir::MutMutable }); // Replace the by value generator argument mir.local_decls.raw[1].ty = ref_gen_ty; // Add a deref to accesses of the generator state DerefArgVisitor.visit_mir(mir); } fn replace_result_variable<'tcx>(ret_ty: Ty<'tcx>, mir: &mut Mir<'tcx>) -> Local { let source_info = SourceInfo { span: mir.span, scope: ARGUMENT_VISIBILITY_SCOPE, }; let new_ret = LocalDecl { mutability: Mutability::Mut, ty: ret_ty, name: None, source_info, internal: false, is_user_variable: false, }; let new_ret_local = Local::new(mir.local_decls.len()); mir.local_decls.push(new_ret); mir.local_decls.swap(0, new_ret_local.index()); RenameLocalVisitor { from: RETURN_POINTER, to: new_ret_local, }.visit_mir(mir); new_ret_local } fn locals_live_across_suspend_points<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>, mir: &Mir<'tcx>, source: MirSource) -> liveness::LocalSet { let mut set = liveness::LocalSet::new_empty(mir.local_decls.len()); let result = liveness::liveness_of_locals(mir); liveness::dump_mir(tcx, "generator_liveness", source, mir, &result); for (block, data) in mir.basic_blocks().iter_enumerated() { if let TerminatorKind::Yield { .. } = data.terminator().kind { set.union(&result.outs[block]); } } // The generator argument is ignored set.remove(&self_arg()); set } fn compute_layout<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>, source: MirSource, interior: GeneratorInterior<'tcx>, mir: &mut Mir<'tcx>) -> (HashMap, usize)>, GeneratorLayout<'tcx>) { // Use a liveness analysis to compute locals which are live across a suspension point let live_locals = locals_live_across_suspend_points(tcx, mir, source); // Erase regions from the types passed in from typeck so we can compare them with // MIR types let allowed = tcx.erase_regions(&interior.as_slice()); for (local, decl) in mir.local_decls.iter_enumerated() { // Ignore locals which are internal or not live if !live_locals.contains(&local) || decl.internal { continue; } // Sanity check that typeck knows about the type of locals which are // live across a suspension point if !allowed.contains(&decl.ty) { span_bug!(mir.span, "Broken MIR: generator contains type {} in MIR, \ but typeck only knows about {}", decl.ty, interior); } } let upvar_len = mir.upvar_decls.len(); let dummy_local = LocalDecl::new_internal(tcx.mk_nil(), mir.span); // Gather live locals and their indices replacing values in mir.local_decls with a dummy // to avoid changing local indices let live_decls = live_locals.iter().map(|local| { let var = mem::replace(&mut mir.local_decls[local], dummy_local.clone()); (local, var) }); // Create a map from local indices to generator struct indices. // These are offset by (upvar_len + 1) because of fields which comes before locals. // We also create a vector of the LocalDecls of these locals. let (remap, vars) = live_decls.enumerate().map(|(idx, (local, var))| { ((local, (var.ty, upvar_len + 1 + idx)), var) }).unzip(); let layout = GeneratorLayout { fields: vars }; (remap, layout) } fn insert_entry_point<'tcx>(mir: &mut Mir<'tcx>, block: BasicBlockData<'tcx>) { mir.basic_blocks_mut().raw.insert(0, block); let blocks = mir.basic_blocks_mut().iter_mut(); for target in blocks.flat_map(|b| b.terminator_mut().successors_mut()) { *target = BasicBlock::new(target.index() + 1); } } fn elaborate_generator_drops<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>, def_id: DefId, mir: &mut Mir<'tcx>) { use util::elaborate_drops::{elaborate_drop, Unwind}; use util::patch::MirPatch; use shim::DropShimElaborator; // Note that `elaborate_drops` only drops the upvars of a generator, and // this is ok because `open_drop` can only be reached within that own // generator's resume function. let param_env = tcx.param_env(def_id); let gen = self_arg(); for block in mir.basic_blocks().indices() { let (target, unwind, source_info) = match mir.basic_blocks()[block].terminator() { &Terminator { source_info, kind: TerminatorKind::Drop { location: Lvalue::Local(local), target, unwind } } if local == gen => (target, unwind, source_info), _ => continue, }; let unwind = if let Some(unwind) = unwind { Unwind::To(unwind) } else { Unwind::InCleanup }; let patch = { let mut elaborator = DropShimElaborator { mir: &mir, patch: MirPatch::new(mir), tcx, param_env }; elaborate_drop( &mut elaborator, source_info, &Lvalue::Local(gen), (), target, unwind, block ); elaborator.patch }; patch.apply(mir); } } fn create_generator_drop_shim<'a, 'tcx>( tcx: TyCtxt<'a, 'tcx, 'tcx>, transform: &TransformVisitor<'a, 'tcx>, def_id: DefId, source: MirSource, gen_ty: Ty<'tcx>, mir: &Mir<'tcx>, drop_clean: BasicBlock) -> Mir<'tcx> { let mut mir = mir.clone(); let source_info = SourceInfo { span: mir.span, scope: ARGUMENT_VISIBILITY_SCOPE, }; let return_block = BasicBlock::new(mir.basic_blocks().len()); mir.basic_blocks_mut().push(BasicBlockData { statements: Vec::new(), terminator: Some(Terminator { source_info, kind: TerminatorKind::Return, }), is_cleanup: false, }); let mut cases: Vec<_> = transform.bb_targets.iter().filter_map(|(&(_, u), &s)| { u.map(|d| (s, d)) }).collect(); cases.insert(0, (0, drop_clean)); // The poisoned state 1 falls through to the default case which is just to return let switch = TerminatorKind::SwitchInt { discr: Operand::Consume(transform.make_field(transform.state_field, tcx.types.u32)), switch_ty: tcx.types.u32, values: Cow::from(cases.iter().map(|&(i, _)| { ConstInt::U32(i) }).collect::>()), targets: cases.iter().map(|&(_, d)| d).chain(once(return_block)).collect(), }; insert_entry_point(&mut mir, BasicBlockData { statements: Vec::new(), terminator: Some(Terminator { source_info, kind: switch, }), is_cleanup: false, }); for block in mir.basic_blocks_mut() { let kind = &mut block.terminator_mut().kind; if let TerminatorKind::GeneratorDrop = *kind { *kind = TerminatorKind::Return; } } // Replace the return variable let source_info = SourceInfo { span: mir.span, scope: ARGUMENT_VISIBILITY_SCOPE, }; mir.return_ty = tcx.mk_nil(); mir.local_decls[RETURN_POINTER] = LocalDecl { mutability: Mutability::Mut, ty: tcx.mk_nil(), name: None, source_info, internal: false, is_user_variable: false, }; make_generator_state_argument_indirect(tcx, def_id, &mut mir); // Change the generator argument from &mut to *mut mir.local_decls[self_arg()] = LocalDecl { mutability: Mutability::Mut, ty: tcx.mk_ptr(ty::TypeAndMut { ty: gen_ty, mutbl: hir::Mutability::MutMutable, }), name: None, source_info, internal: false, is_user_variable: false, }; no_landing_pads(tcx, &mut mir); // Make sure we remove dead blocks to remove // unrelated code from the resume part of the function simplify::remove_dead_blocks(&mut mir); dump_mir(tcx, None, "generator_drop", &0, source, &mut mir); mir } fn insert_panic_on_resume_after_return<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>, mir: &mut Mir<'tcx>) { let assert_block = BasicBlock::new(mir.basic_blocks().len()); let term = TerminatorKind::Assert { cond: Operand::Constant(box Constant { span: mir.span, ty: tcx.types.bool, literal: Literal::Value { value: ConstVal::Bool(false), }, }), expected: true, msg: AssertMessage::GeneratorResumedAfterReturn, target: assert_block, cleanup: None, }; let source_info = SourceInfo { span: mir.span, scope: ARGUMENT_VISIBILITY_SCOPE, }; mir.basic_blocks_mut().push(BasicBlockData { statements: Vec::new(), terminator: Some(Terminator { source_info, kind: term, }), is_cleanup: false, }); } fn create_generator_resume_function<'a, 'tcx>( tcx: TyCtxt<'a, 'tcx, 'tcx>, mut transform: TransformVisitor<'a, 'tcx>, def_id: DefId, source: MirSource, mir: &mut Mir<'tcx>) { // Poison the generator when it unwinds for block in mir.basic_blocks_mut() { let source_info = block.terminator().source_info; if let &TerminatorKind::Resume = &block.terminator().kind { block.statements.push(transform.set_state(1, source_info)); } } let source_info = SourceInfo { span: mir.span, scope: ARGUMENT_VISIBILITY_SCOPE, }; let poisoned_block = BasicBlock::new(mir.basic_blocks().len()); let term = TerminatorKind::Assert { cond: Operand::Constant(box Constant { span: mir.span, ty: tcx.types.bool, literal: Literal::Value { value: ConstVal::Bool(false), }, }), expected: true, msg: AssertMessage::GeneratorResumedAfterPanic, target: transform.return_block, cleanup: None, }; mir.basic_blocks_mut().push(BasicBlockData { statements: Vec::new(), terminator: Some(Terminator { source_info, kind: term, }), is_cleanup: false, }); transform.bb_targets.insert((poisoned_block, None), 1); let switch = TerminatorKind::SwitchInt { discr: Operand::Consume(transform.make_field(transform.state_field, tcx.types.u32)), switch_ty: tcx.types.u32, values: Cow::from(transform.bb_targets.values().map(|&i| { ConstInt::U32(i) }).collect::>()), targets: transform.bb_targets.keys() .map(|&(k, _)| k) .chain(once(transform.return_block)) .collect(), }; insert_entry_point(mir, BasicBlockData { statements: Vec::new(), terminator: Some(Terminator { source_info, kind: switch, }), is_cleanup: false, }); make_generator_state_argument_indirect(tcx, def_id, mir); no_landing_pads(tcx, mir); // Make sure we remove dead blocks to remove // unrelated code from the drop part of the function simplify::remove_dead_blocks(mir); dump_mir(tcx, None, "generator_resume", &0, source, mir); } fn insert_clean_drop<'a, 'tcx>(mir: &mut Mir<'tcx>) -> BasicBlock { let source_info = SourceInfo { span: mir.span, scope: ARGUMENT_VISIBILITY_SCOPE, }; let return_block = BasicBlock::new(mir.basic_blocks().len()); mir.basic_blocks_mut().push(BasicBlockData { statements: Vec::new(), terminator: Some(Terminator { source_info, kind: TerminatorKind::Return, }), is_cleanup: false, }); // Create a block to destroy an unresumed generators. This can only destroy upvars. let drop_clean = BasicBlock::new(mir.basic_blocks().len()); let term = TerminatorKind::Drop { location: Lvalue::Local(self_arg()), target: return_block, unwind: None, }; mir.basic_blocks_mut().push(BasicBlockData { statements: Vec::new(), terminator: Some(Terminator { source_info, kind: term, }), is_cleanup: false, }); drop_clean } impl MirPass for StateTransform { fn run_pass<'a, 'tcx>(&self, tcx: TyCtxt<'a, 'tcx, 'tcx>, source: MirSource, mir: &mut Mir<'tcx>) { let yield_ty = if let Some(yield_ty) = mir.yield_ty { yield_ty } else { // This only applies to generators return }; assert!(mir.generator_drop.is_none()); let node_id = source.item_id(); let def_id = tcx.hir.local_def_id(source.item_id()); let hir_id = tcx.hir.node_to_hir_id(node_id); // Get the interior types which typeck computed let interior = *tcx.typeck_tables_of(def_id).generator_interiors().get(hir_id).unwrap(); // The first argument is the generator type passed by value let gen_ty = mir.local_decls.raw[1].ty; // Compute GeneratorState let state_did = tcx.lang_items.gen_state().unwrap(); let state_adt_ref = tcx.adt_def(state_did); let state_substs = tcx.mk_substs([Kind::from(yield_ty), Kind::from(mir.return_ty)].iter()); let ret_ty = tcx.mk_adt(state_adt_ref, state_substs); // We rename RETURN_POINTER which has type mir.return_ty to new_ret_local // RETURN_POINTER then is a fresh unused local with type ret_ty. let new_ret_local = replace_result_variable(ret_ty, mir); // Extract locals which are live across suspension point into `layout` // `remap` gives a mapping from local indices onto generator struct indices let (remap, layout) = compute_layout(tcx, source, interior, mir); let state_field = mir.upvar_decls.len(); let mut bb_targets = HashMap::new(); // If we jump to the entry point, we should go to the initial 0 generator state. // FIXME: Could this result in the need for destruction for state 0? bb_targets.insert((BasicBlock::new(0), None), 0); // Run the transformation which converts Lvalues from Local to generator struct // accesses for locals in `remap`. // It also rewrites `return x` and `yield y` as writing a new generator state and returning // GeneratorState::Complete(x) and GeneratorState::Yielded(y) respectively. let mut transform = TransformVisitor { tcx, state_adt_ref, state_substs, remap, bb_target_count: 2, bb_targets, new_ret_local, state_field, // For returns we will resume execution at the next added basic block. // This happens in `insert_panic_on_resume_after_return` return_block: BasicBlock::new(mir.basic_blocks().len()), }; transform.visit_mir(mir); // Update our MIR struct to reflect the changed we've made mir.return_ty = ret_ty; mir.yield_ty = None; mir.arg_count = 1; mir.spread_arg = None; mir.generator_layout = Some(layout); // Panic if we resumed after returning insert_panic_on_resume_after_return(tcx, mir); // Insert `drop(generator_struct)` which is used to drop upvars for generators in // the unresumed (0) state. // This is expanded to a drop ladder in `elaborate_generator_drops`. let drop_clean = insert_clean_drop(mir); dump_mir(tcx, None, "generator_pre-elab", &0, source, mir); // Expand `drop(generator_struct)` to a drop ladder which destroys upvars. // If any upvars are moved out of, drop elaboration will handle upvar destruction. // However we need to also elaborate the code generated by `insert_clean_drop`. elaborate_generator_drops(tcx, def_id, mir); dump_mir(tcx, None, "generator_post-transform", &0, source, mir); // Create a copy of our MIR and use it to create the drop shim for the generator let drop_shim = create_generator_drop_shim(tcx, &transform, def_id, source, gen_ty, &mir, drop_clean); mir.generator_drop = Some(box drop_shim); // Create the Generator::resume function create_generator_resume_function(tcx, transform, def_id, source, mir); } }