import std._str; import std._vec; import std._str.rustrt.sbuf; import std._vec.rustrt.vbuf; import std.map.hashmap; import front.ast; import driver.session; import back.x86; import back.abi; import util.common.istr; import util.common.new_str_hash; import lib.llvm.llvm; import lib.llvm.builder; import lib.llvm.llvm.ModuleRef; import lib.llvm.llvm.ValueRef; import lib.llvm.llvm.TypeRef; import lib.llvm.llvm.BuilderRef; import lib.llvm.llvm.BasicBlockRef; import lib.llvm.False; import lib.llvm.True; state obj namegen(mutable int i) { fn next(str prefix) -> str { i += 1; ret prefix + istr(i); } } type glue_fns = rec(ValueRef activate_glue, ValueRef yield_glue, ValueRef exit_task_glue, vec[ValueRef] upcall_glues); state type trans_ctxt = rec(session.session sess, ModuleRef llmod, hashmap[str,ValueRef] upcalls, hashmap[str,ValueRef] fns, @glue_fns glues, namegen names, str path); state type fn_ctxt = rec(ValueRef llfn, ValueRef lloutptr, ValueRef lltaskptr, @trans_ctxt tcx); type terminator = fn(@fn_ctxt cx, builder build); type block_ctxt = rec(BasicBlockRef llbb, builder build, terminator term, @fn_ctxt fcx); // LLVM type constructors. fn T_nil() -> TypeRef { ret llvm.LLVMVoidType(); } fn T_i1() -> TypeRef { ret llvm.LLVMInt1Type(); } fn T_i8() -> TypeRef { ret llvm.LLVMInt8Type(); } fn T_i16() -> TypeRef { ret llvm.LLVMInt16Type(); } fn T_i32() -> TypeRef { ret llvm.LLVMInt32Type(); } fn T_i64() -> TypeRef { ret llvm.LLVMInt64Type(); } fn T_int() -> TypeRef { // FIXME: switch on target type. ret T_i32(); } fn T_fn(vec[TypeRef] inputs, TypeRef output) -> TypeRef { ret llvm.LLVMFunctionType(output, _vec.buf[TypeRef](inputs), _vec.len[TypeRef](inputs), False); } fn T_ptr(TypeRef t) -> TypeRef { ret llvm.LLVMPointerType(t, 0u); } fn T_struct(vec[TypeRef] elts) -> TypeRef { ret llvm.LLVMStructType(_vec.buf[TypeRef](elts), _vec.len[TypeRef](elts), False); } fn T_opaque() -> TypeRef { ret llvm.LLVMOpaqueType(); } fn T_task() -> TypeRef { ret T_struct(vec(T_int(), // Refcount T_int(), // Delegate pointer T_int(), // Stack segment pointer T_int(), // Runtime SP T_int(), // Rust SP T_int(), // GC chain T_int(), // Domain pointer T_int() // Crate cache pointer )); } fn T_crate() -> TypeRef { ret T_struct(vec(T_int(), // ptrdiff_t image_base_off T_int(), // uintptr_t self_addr T_int(), // ptrdiff_t debug_abbrev_off T_int(), // size_t debug_abbrev_sz T_int(), // ptrdiff_t debug_info_off T_int(), // size_t debug_info_sz T_int(), // size_t activate_glue_off T_int(), // size_t yield_glue_off T_int(), // size_t unwind_glue_off T_int(), // size_t gc_glue_off T_int(), // size_t main_exit_task_glue_off T_int(), // int n_rust_syms T_int(), // int n_c_syms T_int() //int n_libs )); } fn T_double() -> TypeRef { ret llvm.LLVMDoubleType(); } fn T_taskptr() -> TypeRef { ret T_ptr(T_task()); } // LLVM constant constructors. fn C_null(TypeRef t) -> ValueRef { ret llvm.LLVMConstNull(t); } fn C_integral(int i, TypeRef t) -> ValueRef { // FIXME. We can't use LLVM.ULongLong with our existing minimal native // API, which only knows word-sized args. Lucky for us LLVM has a "take a // string encoding" version. Hilarious. Please fix to handle: // // ret llvm.LLVMConstInt(T_int(), t as LLVM.ULongLong, False); // ret llvm.LLVMConstIntOfString(t, _str.buf(istr(i)), 10); } fn C_bool(bool b) -> ValueRef { if (b) { ret C_integral(1, T_i1()); } else { ret C_integral(0, T_i1()); } } fn C_int(int i) -> ValueRef { ret C_integral(i, T_int()); } fn C_str(@trans_ctxt cx, str s) -> ValueRef { auto sc = llvm.LLVMConstString(_str.buf(s), _str.byte_len(s), False); auto g = llvm.LLVMAddGlobal(cx.llmod, llvm.LLVMTypeOf(sc), _str.buf(cx.names.next("str"))); llvm.LLVMSetInitializer(g, sc); ret g; } fn C_struct(vec[ValueRef] elts) -> ValueRef { ret llvm.LLVMConstStruct(_vec.buf[ValueRef](elts), _vec.len[ValueRef](elts), False); } fn decl_cdecl_fn(ModuleRef llmod, str name, vec[TypeRef] inputs, TypeRef output) -> ValueRef { let TypeRef llty = T_fn(inputs, output); log "declaring " + name + " with type " + lib.llvm.type_to_str(llty); let ValueRef llfn = llvm.LLVMAddFunction(llmod, _str.buf(name), llty); llvm.LLVMSetFunctionCallConv(llfn, lib.llvm.LLVMCCallConv); ret llfn; } fn decl_glue(ModuleRef llmod, str s) -> ValueRef { ret decl_cdecl_fn(llmod, s, vec(T_taskptr()), T_nil()); } fn decl_upcall(ModuleRef llmod, uint _n) -> ValueRef { // It doesn't actually matter what type we come up with here, at the // moment, as we cast the upcall function pointers to int before passing // them to the indirect upcall-invocation glue. But eventually we'd like // to call them directly, once we have a calling convention worked out. let int n = _n as int; let str s = abi.upcall_glue_name(n); let vec[TypeRef] args = vec(T_taskptr(), // taskptr T_int()) // callee + _vec.init_elt[TypeRef](T_int(), n as uint); ret decl_cdecl_fn(llmod, s, args, T_int()); } fn get_upcall(@trans_ctxt cx, str name, int n_args) -> ValueRef { if (cx.upcalls.contains_key(name)) { ret cx.upcalls.get(name); } auto inputs = vec(T_taskptr()); inputs += _vec.init_elt[TypeRef](T_int(), n_args as uint); auto output = T_nil(); auto f = decl_cdecl_fn(cx.llmod, name, inputs, output); cx.upcalls.insert(name, f); ret f; } fn trans_upcall(@block_ctxt cx, str name, vec[ValueRef] args) -> ValueRef { let int n = _vec.len[ValueRef](args) as int; let ValueRef llupcall = get_upcall(cx.fcx.tcx, name, n); llupcall = llvm.LLVMConstPointerCast(llupcall, T_int()); let ValueRef llglue = cx.fcx.tcx.glues.upcall_glues.(n); let vec[ValueRef] call_args = vec(cx.fcx.lltaskptr, llupcall); for (ValueRef a in args) { call_args += cx.build.ZExtOrBitCast(a, T_int()); } log "emitting indirect-upcall via " + abi.upcall_glue_name(n); for (ValueRef v in call_args) { log "arg: " + lib.llvm.type_to_str(llvm.LLVMTypeOf(v)); } log "emitting call to callee of type: " + lib.llvm.type_to_str(llvm.LLVMTypeOf(llglue)); ret cx.build.Call(llglue, call_args); } fn trans_lit(@block_ctxt cx, &ast.lit lit) -> ValueRef { alt (lit) { case (ast.lit_int(?i)) { ret C_int(i); } case (ast.lit_uint(?u)) { ret C_int(u as int); } case (ast.lit_char(?c)) { ret C_integral(c as int, T_i32()); } case (ast.lit_bool(?b)) { ret C_bool(b); } case (ast.lit_str(?s)) { auto len = (_str.byte_len(s) as int) + 1; ret trans_upcall(cx, "upcall_new_str", vec(p2i(C_str(cx.fcx.tcx, s)), C_int(len))); } } } fn trans_unary(@block_ctxt cx, ast.unop op, &ast.expr e) -> ValueRef { alt (op) { case (ast.bitnot) { ret cx.build.Not(trans_expr(cx, e)); } case (ast.not) { ret cx.build.Not(trans_expr(cx, e)); } case (ast.neg) { // FIXME: switch by signedness. ret cx.build.Neg(trans_expr(cx, e)); } } cx.fcx.tcx.sess.unimpl("expr variant in trans_unary"); fail; } fn trans_binary(@block_ctxt cx, ast.binop op, &ast.expr a, &ast.expr b) -> ValueRef { alt (op) { case (ast.add) { ret cx.build.Add(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.sub) { ret cx.build.Sub(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.mul) { // FIXME: switch by signedness. ret cx.build.Mul(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.div) { // FIXME: switch by signedness. ret cx.build.SDiv(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.rem) { // FIXME: switch by signedness. ret cx.build.SRem(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.bitor) { ret cx.build.Or(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.bitand) { ret cx.build.And(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.bitxor) { ret cx.build.Xor(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.lsl) { ret cx.build.Shl(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.lsr) { ret cx.build.LShr(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.asr) { ret cx.build.AShr(trans_expr(cx, a), trans_expr(cx, b)); } case (ast.eq) { ret cx.build.ICmp(lib.llvm.LLVMIntEQ, trans_expr(cx, a), trans_expr(cx, b)); } case (ast.ne) { ret cx.build.ICmp(lib.llvm.LLVMIntNE, trans_expr(cx, a), trans_expr(cx, b)); } case (ast.lt) { // FIXME: switch by signedness. ret cx.build.ICmp(lib.llvm.LLVMIntSLT, trans_expr(cx, a), trans_expr(cx, b)); } case (ast.le) { // FIXME: switch by signedness. ret cx.build.ICmp(lib.llvm.LLVMIntSLE, trans_expr(cx, a), trans_expr(cx, b)); } case (ast.ge) { // FIXME: switch by signedness. ret cx.build.ICmp(lib.llvm.LLVMIntSGE, trans_expr(cx, a), trans_expr(cx, b)); } case (ast.gt) { // FIXME: switch by signedness. ret cx.build.ICmp(lib.llvm.LLVMIntSGT, trans_expr(cx, a), trans_expr(cx, b)); } } cx.fcx.tcx.sess.unimpl("expr variant in trans_binary"); fail; } fn trans_expr(@block_ctxt cx, &ast.expr e) -> ValueRef { alt (e) { case (ast.expr_lit(?lit)) { ret trans_lit(cx, *lit); } case (ast.expr_unary(?op, ?x)) { ret trans_unary(cx, op, *x); } case (ast.expr_binary(?op, ?x, ?y)) { ret trans_binary(cx, op, *x, *y); } } cx.fcx.tcx.sess.unimpl("expr variant in trans_expr"); fail; } fn trans_log(@block_ctxt cx, &ast.expr e) { alt (e) { case (ast.expr_lit(?lit)) { alt (*lit) { case (ast.lit_str(_)) { auto v = trans_expr(cx, e); trans_upcall(cx, "upcall_log_str", vec(v)); } case (_) { auto v = trans_expr(cx, e); trans_upcall(cx, "upcall_log_int", vec(v)); } } } case (_) { auto v = trans_expr(cx, e); trans_upcall(cx, "upcall_log_int", vec(v)); } } } fn trans_stmt(@block_ctxt cx, &ast.stmt s) { alt (s) { case (ast.stmt_log(?a)) { trans_log(cx, *a); } case (_) { cx.fcx.tcx.sess.unimpl("stmt variant"); } } } fn default_terminate(@fn_ctxt cx, builder build) { build.RetVoid(); } fn new_builder(BasicBlockRef llbb) -> builder { let BuilderRef llbuild = llvm.LLVMCreateBuilder(); llvm.LLVMPositionBuilderAtEnd(llbuild, llbb); ret builder(llbuild); } fn new_block_ctxt(@fn_ctxt cx, terminator term) -> @block_ctxt { let BasicBlockRef llbb = llvm.LLVMAppendBasicBlock(cx.llfn, _str.buf("")); ret @rec(llbb=llbb, build=new_builder(llbb), term=term, fcx=cx); } fn trans_block(@fn_ctxt cx, &ast.block b, terminator term) { auto bcx = (new_block_ctxt(cx, term)); for (@ast.stmt s in b) { trans_stmt(bcx, *s); } bcx.term(cx, bcx.build); } fn new_fn_ctxt(@trans_ctxt cx, str name, TypeRef T_out, vec[TypeRef] T_explicit_args) -> @fn_ctxt { let vec[TypeRef] args = vec(T_ptr(T_out), // outptr. T_taskptr() // taskptr ); args += T_explicit_args; let ValueRef llfn = decl_cdecl_fn(cx.llmod, name, args, T_nil()); cx.fns.insert(cx.path, llfn); let ValueRef lloutptr = llvm.LLVMGetParam(llfn, 0u); let ValueRef lltaskptr = llvm.LLVMGetParam(llfn, 1u); ret @rec(llfn=llfn, lloutptr=lloutptr, lltaskptr=lltaskptr, tcx=cx); } fn trans_fn(@trans_ctxt cx, &ast._fn f) { let TypeRef out = T_int(); let vec[TypeRef] args = vec(); auto fcx = new_fn_ctxt(cx, cx.path, out, args); auto term = default_terminate; trans_block(fcx, f.body, term); } fn trans_item(@trans_ctxt cx, &str name, &ast.item item) { auto sub_cx = @rec(path=cx.path + "." + name with *cx); alt (item) { case (ast.item_fn(?f)) { trans_fn(sub_cx, *f); } case (ast.item_mod(?m)) { trans_mod(sub_cx, *m); } } } fn trans_mod(@trans_ctxt cx, &ast._mod m) { for each (tup(str, ast.item) pair in m.items()) { trans_item(cx, pair._0, pair._1); } } fn p2i(ValueRef v) -> ValueRef { ret llvm.LLVMConstPtrToInt(v, T_int()); } fn trans_exit_task_glue(@trans_ctxt cx) { let vec[TypeRef] T_args = vec(); let vec[ValueRef] V_args = vec(); auto term = default_terminate; auto llfn = cx.glues.exit_task_glue; let ValueRef lloutptr = C_null(T_int()); let ValueRef lltaskptr = llvm.LLVMGetParam(llfn, 0u); auto fcx = @rec(llfn=llfn, lloutptr=lloutptr, lltaskptr=lltaskptr, tcx=cx); auto bcx = new_block_ctxt(fcx, term); trans_upcall(bcx, "upcall_exit", V_args); bcx.term(fcx, bcx.build); } fn crate_constant(@trans_ctxt cx) -> ValueRef { let ValueRef crate_ptr = llvm.LLVMAddGlobal(cx.llmod, T_crate(), _str.buf("rust_crate")); let ValueRef crate_addr = p2i(crate_ptr); let ValueRef activate_glue_off = llvm.LLVMConstSub(p2i(cx.glues.activate_glue), crate_addr); let ValueRef yield_glue_off = llvm.LLVMConstSub(p2i(cx.glues.yield_glue), crate_addr); let ValueRef exit_task_glue_off = llvm.LLVMConstSub(p2i(cx.glues.exit_task_glue), crate_addr); let ValueRef crate_val = C_struct(vec(C_null(T_int()), // ptrdiff_t image_base_off p2i(crate_ptr), // uintptr_t self_addr C_null(T_int()), // ptrdiff_t debug_abbrev_off C_null(T_int()), // size_t debug_abbrev_sz C_null(T_int()), // ptrdiff_t debug_info_off C_null(T_int()), // size_t debug_info_sz activate_glue_off, // size_t activate_glue_off yield_glue_off, // size_t yield_glue_off C_null(T_int()), // size_t unwind_glue_off C_null(T_int()), // size_t gc_glue_off exit_task_glue_off, // size_t main_exit_task_glue_off C_null(T_int()), // int n_rust_syms C_null(T_int()), // int n_c_syms C_null(T_int()) // int n_libs )); llvm.LLVMSetInitializer(crate_ptr, crate_val); ret crate_ptr; } fn trans_main_fn(@trans_ctxt cx, ValueRef llcrate) { auto T_main_args = vec(T_int(), T_int()); auto T_rust_start_args = vec(T_int(), T_int(), T_int(), T_int()); auto llmain = decl_cdecl_fn(cx.llmod, "main", T_main_args, T_int()); auto llrust_start = decl_cdecl_fn(cx.llmod, "rust_start", T_rust_start_args, T_int()); auto llargc = llvm.LLVMGetParam(llmain, 0u); auto llargv = llvm.LLVMGetParam(llmain, 1u); auto llrust_main = cx.fns.get("_rust.main"); // // Emit the moral equivalent of: // // main(int argc, char **argv) { // rust_start(&_rust.main, &crate, argc, argv); // } // let BasicBlockRef llbb = llvm.LLVMAppendBasicBlock(llmain, _str.buf("")); auto b = new_builder(llbb); auto start_args = vec(p2i(llrust_main), p2i(llcrate), llargc, llargv); b.Ret(b.Call(llrust_start, start_args)); } fn trans_crate(session.session sess, ast.crate crate) { auto llmod = llvm.LLVMModuleCreateWithNameInContext(_str.buf("rust_out"), llvm.LLVMGetGlobalContext()); llvm.LLVMSetModuleInlineAsm(llmod, _str.buf(x86.get_module_asm())); auto glues = @rec(activate_glue = decl_glue(llmod, abi.activate_glue_name()), yield_glue = decl_glue(llmod, abi.yield_glue_name()), /* * Note: the signature passed to decl_cdecl_fn here * looks unusual because it is. It corresponds neither * to an upcall signature nor a normal rust-ABI * signature. In fact it is a fake signature, that * exists solely to acquire the task pointer as an * argument to the upcall. It so happens that the * runtime sets up the task pointer as the sole incoming * argument to the frame that we return into when * returning to the exit task glue. So this is the * signature required to retrieve it. */ exit_task_glue = decl_cdecl_fn(llmod, abi.exit_task_glue_name(), vec(T_taskptr()), T_nil()), upcall_glues = _vec.init_fn[ValueRef](bind decl_upcall(llmod, _), abi.n_upcall_glues as uint)); auto cx = @rec(sess = sess, llmod = llmod, upcalls = new_str_hash[ValueRef](), fns = new_str_hash[ValueRef](), glues = glues, names = namegen(0), path = "_rust"); trans_mod(cx, crate.module); trans_exit_task_glue(cx); trans_main_fn(cx, crate_constant(cx)); llvm.LLVMWriteBitcodeToFile(llmod, _str.buf("rust_out.bc")); llvm.LLVMDisposeModule(llmod); } // // Local Variables: // mode: rust // fill-column: 78; // indent-tabs-mode: nil // c-basic-offset: 4 // buffer-file-coding-system: utf-8-unix // compile-command: "make -k -C ../.. 2>&1 | sed -e 's/\\/x\\//x:\\//g'"; // End: //