// Copyright 2012-2014 The Rust Project Developers. See the COPYRIGHT
// file at the top-level directory of this distribution and at
// http://rust-lang.org/COPYRIGHT.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.

#![allow(non_upper_case_globals)]

use llvm;
use llvm::{SequentiallyConsistent, Acquire, Release, AtomicXchg, ValueRef, TypeKind};
use middle::subst;
use middle::subst::FnSpace;
use trans::base::*;
use trans::build::*;
use trans::callee;
use trans::cleanup;
use trans::cleanup::CleanupMethods;
use trans::common::*;
use trans::datum::*;
use trans::expr;
use trans::glue;
use trans::type_of::*;
use trans::type_of;
use trans::machine;
use trans::machine::llsize_of;
use trans::type_::Type;
use middle::ty::{mod, Ty};
use syntax::abi::RustIntrinsic;
use syntax::ast;
use syntax::parse::token;
use util::ppaux::{Repr, ty_to_string};

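/// Maps a Rust intrinsic to the LLVM intrinsic it lowers to directly,
/// when the lowering is a plain call with the same arguments (for
/// example, `sqrtf32` becomes a call to `llvm.sqrt.f32`). Returns
/// `None` for intrinsics that need custom translation in
/// `trans_intrinsic_call` below.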
pub fn get_simple_intrinsic(ccx: &CrateContext, item: &ast::ForeignItem) -> Option<ValueRef> {
    let name = match token::get_ident(item.ident).get() {
        "sqrtf32" => "llvm.sqrt.f32",
        "sqrtf64" => "llvm.sqrt.f64",
        "powif32" => "llvm.powi.f32",
        "powif64" => "llvm.powi.f64",
        "sinf32" => "llvm.sin.f32",
        "sinf64" => "llvm.sin.f64",
        "cosf32" => "llvm.cos.f32",
        "cosf64" => "llvm.cos.f64",
        "powf32" => "llvm.pow.f32",
        "powf64" => "llvm.pow.f64",
        "expf32" => "llvm.exp.f32",
        "expf64" => "llvm.exp.f64",
        "exp2f32" => "llvm.exp2.f32",
        "exp2f64" => "llvm.exp2.f64",
        "logf32" => "llvm.log.f32",
        "logf64" => "llvm.log.f64",
        "log10f32" => "llvm.log10.f32",
        "log10f64" => "llvm.log10.f64",
        "log2f32" => "llvm.log2.f32",
        "log2f64" => "llvm.log2.f64",
        "fmaf32" => "llvm.fma.f32",
        "fmaf64" => "llvm.fma.f64",
        "fabsf32" => "llvm.fabs.f32",
        "fabsf64" => "llvm.fabs.f64",
        "copysignf32" => "llvm.copysign.f32",
        "copysignf64" => "llvm.copysign.f64",
        "floorf32" => "llvm.floor.f32",
        "floorf64" => "llvm.floor.f64",
        "ceilf32" => "llvm.ceil.f32",
        "ceilf64" => "llvm.ceil.f64",
        "truncf32" => "llvm.trunc.f32",
        "truncf64" => "llvm.trunc.f64",
        "rintf32" => "llvm.rint.f32",
        "rintf64" => "llvm.rint.f64",
        "nearbyintf32" => "llvm.nearbyint.f32",
        "nearbyintf64" => "llvm.nearbyint.f64",
        "roundf32" => "llvm.round.f32",
        "roundf64" => "llvm.round.f64",
        "ctpop8" => "llvm.ctpop.i8",
        "ctpop16" => "llvm.ctpop.i16",
        "ctpop32" => "llvm.ctpop.i32",
        "ctpop64" => "llvm.ctpop.i64",
        "bswap16" => "llvm.bswap.i16",
        "bswap32" => "llvm.bswap.i32",
        "bswap64" => "llvm.bswap.i64",
        "assume" => "llvm.assume",
        _ => return None
    };
    Some(ccx.get_intrinsic(&name))
}

/// Performs late verification that intrinsics are used correctly. At present,
/// the only intrinsic that needs such verification is `transmute`.
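/// For example, whether `transmute::<T, u64>()` is legal depends on
/// the size of whatever `T` is instantiated with, so the restrictions
/// recorded during type checking are re-examined here, where the
/// substituted types' sizes can actually be computed.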
pub fn check_intrinsics(ccx: &CrateContext) {
    let mut last_failing_id = None;
    for transmute_restriction in ccx.tcx().transmute_restrictions.borrow().iter() {
        // Sometimes, a single call to transmute will push multiple
        // type pairs to test in order to exhaustively cover the
        // possibilities for a type parameter. If one of those fails,
        // there is no point reporting errors on the others.
        if last_failing_id == Some(transmute_restriction.id) {
            continue;
        }

        debug!("transmute_restriction: {}", transmute_restriction.repr(ccx.tcx()));

        assert!(!ty::type_has_params(transmute_restriction.substituted_from));
        assert!(!ty::type_has_params(transmute_restriction.substituted_to));

        let llfromtype = type_of::sizing_type_of(ccx,
                                                 transmute_restriction.substituted_from);
        let lltotype = type_of::sizing_type_of(ccx,
                                               transmute_restriction.substituted_to);
        let from_type_size = machine::llbitsize_of_real(ccx, llfromtype);
        let to_type_size = machine::llbitsize_of_real(ccx, lltotype);
        if from_type_size != to_type_size {
            last_failing_id = Some(transmute_restriction.id);

            if transmute_restriction.original_from != transmute_restriction.substituted_from {
                ccx.sess().span_err(
                    transmute_restriction.span,
                    format!("transmute called on types with potentially different sizes: \
                             {} (could be {} bit{}) to {} (could be {} bit{})",
                            ty_to_string(ccx.tcx(), transmute_restriction.original_from),
                            from_type_size as uint,
                            if from_type_size == 1 {""} else {"s"},
                            ty_to_string(ccx.tcx(), transmute_restriction.original_to),
                            to_type_size as uint,
                            if to_type_size == 1 {""} else {"s"}).as_slice());
            } else {
                ccx.sess().span_err(
                    transmute_restriction.span,
                    format!("transmute called on types with different sizes: \
                             {} ({} bit{}) to {} ({} bit{})",
                            ty_to_string(ccx.tcx(), transmute_restriction.original_from),
                            from_type_size as uint,
                            if from_type_size == 1 {""} else {"s"},
                            ty_to_string(ccx.tcx(), transmute_restriction.original_to),
                            to_type_size as uint,
                            if to_type_size == 1 {""} else {"s"}).as_slice());
            }
        }
    }
    ccx.sess().abort_if_errors();
}

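/// Translates a call to a Rust intrinsic into LLVM IR. `transmute` is
/// special-cased first, since it can translate its argument expression
/// directly into the destination; every other intrinsic is dispatched
/// on its name in the big `match` below.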
pub fn trans_intrinsic_call<'a, 'blk, 'tcx>(mut bcx: Block<'blk, 'tcx>,
                                            node: ast::NodeId,
                                            callee_ty: Ty<'tcx>,
                                            cleanup_scope: cleanup::CustomScopeIndex,
                                            args: callee::CallArgs<'a, 'tcx>,
                                            dest: expr::Dest,
                                            substs: subst::Substs<'tcx>,
                                            call_info: NodeInfo)
                                            -> Result<'blk, 'tcx> {

    let fcx = bcx.fcx;
    let ccx = fcx.ccx;
    let tcx = bcx.tcx();

    let ret_ty = match callee_ty.sty {
        ty::ty_bare_fn(_, ref f) => f.sig.0.output,
        _ => panic!("expected bare_fn in trans_intrinsic_call")
    };
    let foreign_item = tcx.map.expect_foreign_item(node);
    let name = token::get_ident(foreign_item.ident);

    // For `transmute` we can just trans the input expr directly into dest
    if name.get() == "transmute" {
        let llret_ty = type_of::type_of(ccx, ret_ty.unwrap());
        match args {
            callee::ArgExprs(arg_exprs) => {
                assert_eq!(arg_exprs.len(), 1);

                let (in_type, out_type) = (*substs.types.get(FnSpace, 0),
                                           *substs.types.get(FnSpace, 1));
                let llintype = type_of::type_of(ccx, in_type);
                let llouttype = type_of::type_of(ccx, out_type);

                let in_type_size = machine::llbitsize_of_real(ccx, llintype);
                let out_type_size = machine::llbitsize_of_real(ccx, llouttype);

                // This should be caught by the intrinsicck pass
                assert_eq!(in_type_size, out_type_size);

                let nonpointer_nonaggregate = |&: llkind: TypeKind| -> bool {
                    use llvm::TypeKind::*;
                    match llkind {
                        Half | Float | Double | X86_FP80 | FP128 |
                        PPC_FP128 | Integer | Vector | X86_MMX => true,
                        _ => false
                    }
                };

                // An approximation to which types can be directly cast via
                // LLVM's bitcast. This doesn't cover pointer -> pointer casts,
                // but does, importantly, cover SIMD types.
                let in_kind = llintype.kind();
                let ret_kind = llret_ty.kind();
                let bitcast_compatible =
                    (nonpointer_nonaggregate(in_kind) && nonpointer_nonaggregate(ret_kind)) || {
                        in_kind == TypeKind::Pointer && ret_kind == TypeKind::Pointer
                    };

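                // Illustrative examples: `f32` -> `u32` and `u32x4` -> `u64x2`
                // are bitcast-compatible (equal-sized non-pointer, non-aggregate
                // kinds), as is any pointer to any other pointer, while a
                // transmute between two equally-sized structs is not, and
                // falls through to the pointer-cast path in the `else` branch.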
                let dest = if bitcast_compatible {
                    // if we're here, the type is scalar-like (a primitive, a
                    // SIMD type or a pointer), and so can be handled as a
                    // by-value ValueRef and can also be directly bitcast to the
                    // target type. Doing this special case makes conversions
                    // like `u32x4` -> `u64x2` much nicer for LLVM and so more
                    // efficient (these are done efficiently implicitly in C
                    // with the `__m128i` type and so this means Rust doesn't
                    // lose out there).
                    let expr = &*arg_exprs[0];
                    let datum = unpack_datum!(bcx, expr::trans(bcx, expr));
                    let datum = unpack_datum!(bcx, datum.to_rvalue_datum(bcx, "transmute_temp"));
                    let val = if datum.kind.is_by_ref() {
                        load_ty(bcx, datum.val, datum.ty)
                    } else {
                        datum.val
                    };

                    let cast_val = BitCast(bcx, val, llret_ty);

                    match dest {
                        expr::SaveIn(d) => {
                            // this often occurs in a sequence like `Store(val,
                            // d); val2 = Load(d)`, so disappears easily.
                            Store(bcx, cast_val, d);
                        }
                        expr::Ignore => {}
                    }
                    dest
                } else {
                    // The types are too complicated to do with a by-value
                    // bitcast, so pointer cast instead. We need to cast the
                    // dest so the types work out.
                    let dest = match dest {
                        expr::SaveIn(d) => expr::SaveIn(PointerCast(bcx, d, llintype.ptr_to())),
                        expr::Ignore => expr::Ignore
                    };
                    bcx = expr::trans_into(bcx, &*arg_exprs[0], dest);
                    dest
                };

                fcx.pop_custom_cleanup_scope(cleanup_scope);

                return match dest {
                    expr::SaveIn(d) => Result::new(bcx, d),
                    expr::Ignore => Result::new(bcx, C_undef(llret_ty.ptr_to()))
                };

            }

            _ => {
                ccx.sess().bug("expected expr as argument for transmute");
            }
        }
    }

    // Push the arguments.
    let mut llargs = Vec::new();
    bcx = callee::trans_args(bcx,
                             args,
                             callee_ty,
                             &mut llargs,
                             cleanup::CustomScope(cleanup_scope),
                             false,
                             RustIntrinsic);

    fcx.pop_custom_cleanup_scope(cleanup_scope);

    // These are the only intrinsic functions that diverge.
    if name.get() == "abort" {
        let llfn = ccx.get_intrinsic(&("llvm.trap"));
        Call(bcx, llfn, &[], None);
        Unreachable(bcx);
        return Result::new(bcx, C_undef(Type::nil(ccx).ptr_to()));
    } else if name.get() == "unreachable" {
        Unreachable(bcx);
        return Result::new(bcx, C_nil(ccx));
    }

    let ret_ty = match ret_ty {
        ty::FnConverging(ret_ty) => ret_ty,
        ty::FnDiverging => unreachable!()
    };

    let llret_ty = type_of::type_of(ccx, ret_ty);

    // Get location to store the result. If the user does
    // not care about the result, just make a stack slot
    let llresult = match dest {
        expr::SaveIn(d) => d,
        expr::Ignore => {
            if !type_is_zero_size(ccx, ret_ty) {
                alloc_ty(bcx, ret_ty, "intrinsic_result")
            } else {
                C_undef(llret_ty.ptr_to())
            }
        }
    };

    let simple = get_simple_intrinsic(ccx, &*foreign_item);
    let llval = match (simple, name.get()) {
        (Some(llfn), _) => {
            Call(bcx, llfn, llargs.as_slice(), None)
        }
        (_, "breakpoint") => {
            let llfn = ccx.get_intrinsic(&("llvm.debugtrap"));
            Call(bcx, llfn, &[], None)
        }
        (_, "size_of") => {
            let tp_ty = *substs.types.get(FnSpace, 0);
            let lltp_ty = type_of::type_of(ccx, tp_ty);
            C_uint(ccx, machine::llsize_of_real(ccx, lltp_ty))
        }
        (_, "min_align_of") => {
            let tp_ty = *substs.types.get(FnSpace, 0);
            C_uint(ccx, type_of::align_of(ccx, tp_ty))
        }
        (_, "pref_align_of") => {
            let tp_ty = *substs.types.get(FnSpace, 0);
            let lltp_ty = type_of::type_of(ccx, tp_ty);
            C_uint(ccx, machine::llalign_of_pref(ccx, lltp_ty))
        }
        (_, "move_val_init") => {
            // Create a datum reflecting the value being moved.
            // Use `appropriate_mode` so that the datum is by ref
            // if the value is non-immediate. Note that, with
            // intrinsics, there are no argument cleanups to
            // concern ourselves with, so we can use an rvalue datum.
            let tp_ty = *substs.types.get(FnSpace, 0);
            let mode = appropriate_rvalue_mode(ccx, tp_ty);
            let src = Datum {
                val: llargs[1],
                ty: tp_ty,
                kind: Rvalue::new(mode)
            };
            bcx = src.store_to(bcx, llargs[0]);
            C_nil(ccx)
        }
        (_, "get_tydesc") => {
            let tp_ty = *substs.types.get(FnSpace, 0);
            let static_ti = get_tydesc(ccx, tp_ty);

            // FIXME (#3730): ideally this shouldn't need a cast,
            // but there's a circularity between translating rust types to llvm
            // types and having a tydesc type available. So I can't directly access
            // the llvm type of the intrinsic::TyDesc struct.
            PointerCast(bcx, static_ti.tydesc, llret_ty)
        }
        (_, "type_id") => {
            let hash = ty::hash_crate_independent(
                ccx.tcx(),
                *substs.types.get(FnSpace, 0),
                &ccx.link_meta().crate_hash);
            // NB: This needs to be kept in lockstep with the TypeId struct in
            // the intrinsic module
            C_named_struct(llret_ty, &[C_u64(ccx, hash)])
        }
        (_, "init") => {
            let tp_ty = *substs.types.get(FnSpace, 0);
            let lltp_ty = type_of::type_of(ccx, tp_ty);
            if return_type_is_void(ccx, tp_ty) {
                C_nil(ccx)
            } else {
                C_null(lltp_ty)
            }
        }
        // Effectively no-ops
        (_, "uninit") | (_, "forget") => {
            C_nil(ccx)
        }
        (_, "needs_drop") => {
            let tp_ty = *substs.types.get(FnSpace, 0);
            C_bool(ccx, type_needs_drop(ccx.tcx(), tp_ty))
        }
        (_, "owns_managed") => {
            let tp_ty = *substs.types.get(FnSpace, 0);
            C_bool(ccx, ty::type_contents(ccx.tcx(), tp_ty).owns_managed())
        }
        (_, "offset") => {
            let ptr = llargs[0];
            let offset = llargs[1];
            InBoundsGEP(bcx, ptr, &[offset])
        }

        (_, "copy_nonoverlapping_memory") => {
            copy_intrinsic(bcx, false, false, *substs.types.get(FnSpace, 0),
                           llargs[0], llargs[1], llargs[2])
        }
        (_, "copy_memory") => {
            copy_intrinsic(bcx, true, false, *substs.types.get(FnSpace, 0),
                           llargs[0], llargs[1], llargs[2])
        }
        (_, "set_memory") => {
            memset_intrinsic(bcx, false, *substs.types.get(FnSpace, 0),
                             llargs[0], llargs[1], llargs[2])
        }

        (_, "volatile_copy_nonoverlapping_memory") => {
            copy_intrinsic(bcx, false, true, *substs.types.get(FnSpace, 0),
                           llargs[0], llargs[1], llargs[2])
        }
        (_, "volatile_copy_memory") => {
            copy_intrinsic(bcx, true, true, *substs.types.get(FnSpace, 0),
                           llargs[0], llargs[1], llargs[2])
        }
        (_, "volatile_set_memory") => {
            memset_intrinsic(bcx, true, *substs.types.get(FnSpace, 0),
                             llargs[0], llargs[1], llargs[2])
        }
        (_, "volatile_load") => {
            VolatileLoad(bcx, llargs[0])
        },
        (_, "volatile_store") => {
            VolatileStore(bcx, llargs[1], llargs[0]);
            C_nil(ccx)
        },

        (_, "ctlz8") => count_zeros_intrinsic(bcx, "llvm.ctlz.i8", llargs[0]),
        (_, "ctlz16") => count_zeros_intrinsic(bcx, "llvm.ctlz.i16", llargs[0]),
        (_, "ctlz32") => count_zeros_intrinsic(bcx, "llvm.ctlz.i32", llargs[0]),
        (_, "ctlz64") => count_zeros_intrinsic(bcx, "llvm.ctlz.i64", llargs[0]),
        (_, "cttz8") => count_zeros_intrinsic(bcx, "llvm.cttz.i8", llargs[0]),
        (_, "cttz16") => count_zeros_intrinsic(bcx, "llvm.cttz.i16", llargs[0]),
        (_, "cttz32") => count_zeros_intrinsic(bcx, "llvm.cttz.i32", llargs[0]),
        (_, "cttz64") => count_zeros_intrinsic(bcx, "llvm.cttz.i64", llargs[0]),

        (_, "i8_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.sadd.with.overflow.i8", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i16_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.sadd.with.overflow.i16", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i32_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.sadd.with.overflow.i32", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i64_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.sadd.with.overflow.i64", ret_ty,
                                    llargs[0], llargs[1]),

        (_, "u8_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.uadd.with.overflow.i8", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u16_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.uadd.with.overflow.i16", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u32_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.uadd.with.overflow.i32", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u64_add_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.uadd.with.overflow.i64", ret_ty,
                                    llargs[0], llargs[1]),

        (_, "i8_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.ssub.with.overflow.i8", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i16_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.ssub.with.overflow.i16", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i32_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.ssub.with.overflow.i32", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i64_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.ssub.with.overflow.i64", ret_ty,
                                    llargs[0], llargs[1]),

        (_, "u8_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.usub.with.overflow.i8", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u16_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.usub.with.overflow.i16", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u32_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.usub.with.overflow.i32", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u64_sub_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.usub.with.overflow.i64", ret_ty,
                                    llargs[0], llargs[1]),

        (_, "i8_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.smul.with.overflow.i8", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i16_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.smul.with.overflow.i16", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i32_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.smul.with.overflow.i32", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "i64_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.smul.with.overflow.i64", ret_ty,
                                    llargs[0], llargs[1]),

        (_, "u8_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.umul.with.overflow.i8", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u16_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.umul.with.overflow.i16", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u32_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.umul.with.overflow.i32", ret_ty,
                                    llargs[0], llargs[1]),
        (_, "u64_mul_with_overflow") =>
            with_overflow_intrinsic(bcx, "llvm.umul.with.overflow.i64", ret_ty,
                                    llargs[0], llargs[1]),

        (_, "return_address") => {
            if !fcx.caller_expects_out_pointer {
                tcx.sess.span_err(call_info.span,
                                  "invalid use of `return_address` intrinsic: function \
                                   does not use out pointer");
                C_null(Type::i8p(ccx))
            } else {
                PointerCast(bcx, llvm::get_param(fcx.llfn, 0), Type::i8p(ccx))
            }
        }

        // This requires that atomic intrinsics follow a specific naming pattern:
        // "atomic_<operation>[_<ordering>]"; omitting the ordering means SeqCst.
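        // e.g. `atomic_xadd` is a sequentially consistent atomic add,
        // `atomic_xadd_relaxed` a monotonic (relaxed) one, and
        // `atomic_cxchg_acqrel` an acquire-release compare-and-swap.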
        (_, name) if name.starts_with("atomic_") => {
            let split: Vec<&str> = name.split('_').collect();
            assert!(split.len() >= 2, "Atomic intrinsic not correct format");

            let order = if split.len() == 2 {
                llvm::SequentiallyConsistent
            } else {
                match split[2] {
                    "relaxed" => llvm::Monotonic,
                    "acq" => llvm::Acquire,
                    "rel" => llvm::Release,
                    "acqrel" => llvm::AcquireRelease,
                    _ => ccx.sess().fatal("unknown ordering in atomic intrinsic")
                }
            };

            match split[1] {
                "cxchg" => {
                    // See include/llvm/IR/Instructions.h for LLVM's
                    // implementation of this; I assume it's good enough
                    // for us to use for now.
                    let strongest_failure_ordering = match order {
                        llvm::NotAtomic | llvm::Unordered =>
                            ccx.sess().fatal("cmpxchg must be atomic"),

                        llvm::Monotonic | llvm::Release =>
                            llvm::Monotonic,

                        llvm::Acquire | llvm::AcquireRelease =>
                            llvm::Acquire,

                        llvm::SequentiallyConsistent =>
                            llvm::SequentiallyConsistent
                    };

                    let res = AtomicCmpXchg(bcx, llargs[0], llargs[1],
                                            llargs[2], order,
                                            strongest_failure_ordering);
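                    // From LLVM 3.5 onwards, `cmpxchg` returns a
                    // `{ T, i1 }` pair (old value plus success flag), so
                    // extract the old value; earlier versions return the
                    // old value directly.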
                    if unsafe { llvm::LLVMVersionMinor() >= 5 } {
                        ExtractValue(bcx, res, 0)
                    } else {
                        res
                    }
                }

                "load" => {
                    AtomicLoad(bcx, llargs[0], order)
                }
                "store" => {
                    AtomicStore(bcx, llargs[1], llargs[0], order);
                    C_nil(ccx)
                }

                "fence" => {
                    AtomicFence(bcx, order);
                    C_nil(ccx)
                }

                // These are all AtomicRMW ops
                op => {
                    let atom_op = match op {
                        "xchg" => llvm::AtomicXchg,
                        "xadd" => llvm::AtomicAdd,
                        "xsub" => llvm::AtomicSub,
                        "and" => llvm::AtomicAnd,
                        "nand" => llvm::AtomicNand,
                        "or" => llvm::AtomicOr,
                        "xor" => llvm::AtomicXor,
                        "max" => llvm::AtomicMax,
                        "min" => llvm::AtomicMin,
                        "umax" => llvm::AtomicUMax,
                        "umin" => llvm::AtomicUMin,
                        _ => ccx.sess().fatal("unknown atomic operation")
                    };

                    AtomicRMW(bcx, atom_op, llargs[0], llargs[1], order)
                }
            }

        }

        (_, _) => ccx.sess().span_bug(foreign_item.span, "unknown intrinsic")
    };

    if val_ty(llval) != Type::void(ccx) &&
       machine::llsize_of_alloc(ccx, val_ty(llval)) != 0 {
        store_ty(bcx, llval, llresult, ret_ty);
    }

    // If we made a temporary stack slot, let's clean it up
    match dest {
        expr::Ignore => {
            bcx = glue::drop_ty(bcx, llresult, ret_ty, Some(call_info));
        }
        expr::SaveIn(_) => {}
    }

    Result::new(bcx, llresult)
}

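/// Lowers the copy intrinsics to a call to `llvm.memcpy.*`, or to
/// `llvm.memmove.*` when the source and destination are allowed to
/// overlap, scaling the element count by the size of `tp_ty` to get
/// the byte count LLVM expects.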
fn copy_intrinsic<'blk, 'tcx>(bcx: Block<'blk, 'tcx>,
                              allow_overlap: bool, volatile: bool, tp_ty: Ty<'tcx>,
                              dst: ValueRef, src: ValueRef, count: ValueRef) -> ValueRef {
    let ccx = bcx.ccx();
    let lltp_ty = type_of::type_of(ccx, tp_ty);
    let align = C_i32(ccx, type_of::align_of(ccx, tp_ty) as i32);
    let size = machine::llsize_of(ccx, lltp_ty);
    let int_size = machine::llbitsize_of_real(ccx, ccx.int_type());
    let name = if allow_overlap {
        if int_size == 32 {
            "llvm.memmove.p0i8.p0i8.i32"
        } else {
            "llvm.memmove.p0i8.p0i8.i64"
        }
    } else {
        if int_size == 32 {
            "llvm.memcpy.p0i8.p0i8.i32"
        } else {
            "llvm.memcpy.p0i8.p0i8.i64"
        }
    };

    let dst_ptr = PointerCast(bcx, dst, Type::i8p(ccx));
    let src_ptr = PointerCast(bcx, src, Type::i8p(ccx));
    let llfn = ccx.get_intrinsic(&name);

    Call(bcx, llfn, &[dst_ptr, src_ptr, Mul(bcx, size, count), align,
                      C_bool(ccx, volatile)], None)
}

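/// Lowers `set_memory`/`volatile_set_memory` to a call to
/// `llvm.memset.*`, again scaling the element count by the size of
/// `tp_ty`.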
fn memset_intrinsic<'blk, 'tcx>(bcx: Block<'blk, 'tcx>, volatile: bool, tp_ty: Ty<'tcx>,
                                dst: ValueRef, val: ValueRef, count: ValueRef) -> ValueRef {
    let ccx = bcx.ccx();
    let lltp_ty = type_of::type_of(ccx, tp_ty);
    let align = C_i32(ccx, type_of::align_of(ccx, tp_ty) as i32);
    let size = machine::llsize_of(ccx, lltp_ty);
    let name = if machine::llbitsize_of_real(ccx, ccx.int_type()) == 32 {
        "llvm.memset.p0i8.i32"
    } else {
        "llvm.memset.p0i8.i64"
    };

    let dst_ptr = PointerCast(bcx, dst, Type::i8p(ccx));
    let llfn = ccx.get_intrinsic(&name);

    Call(bcx, llfn, &[dst_ptr, val, Mul(bcx, size, count), align,
                      C_bool(ccx, volatile)], None)
}

fn count_zeros_intrinsic(bcx: Block, name: &'static str, val: ValueRef) -> ValueRef {
    // The second argument to `llvm.ctlz`/`llvm.cttz` is the `is_zero_undef`
    // flag; passing `false` keeps the result defined (the full bit width)
    // when the input is zero.
    let y = C_bool(bcx.ccx(), false);
    let llfn = bcx.ccx().get_intrinsic(&name);
    Call(bcx, llfn, &[val, y], None)
}

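/// Lowers the checked arithmetic intrinsics. The underlying LLVM
/// intrinsics (e.g. `llvm.sadd.with.overflow.i32`) return a pair of
/// the wrapped result and an `i1` overflow flag; this rebuilds that
/// pair as the Rust-level `(T, bool)` return value.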
fn with_overflow_intrinsic<'blk, 'tcx>(bcx: Block<'blk, 'tcx>, name: &'static str,
                                       t: Ty<'tcx>, a: ValueRef, b: ValueRef) -> ValueRef {
    let llfn = bcx.ccx().get_intrinsic(&name);

    // Convert the `i1` overflow flag to a `bool` and repackage the
    // (result, overflow) pair; the caller stores it to the destination.
    let val = Call(bcx, llfn, &[a, b], None);
    let result = ExtractValue(bcx, val, 0);
    let overflow = ZExt(bcx, ExtractValue(bcx, val, 1), Type::bool(bcx.ccx()));
    let ret = C_undef(type_of::type_of(bcx.ccx(), t));
    let ret = InsertValue(bcx, ret, result, 0);
    let ret = InsertValue(bcx, ret, overflow, 1);

    ret
}