import libc::{c_int, c_uint}; import driver::session; import session::session; import lib::llvm::llvm; import syntax::attr; import middle::ty; import metadata::{encoder, cstore}; import middle::trans::common::crate_ctxt; import metadata::common::link_meta; import std::map::hashmap; import std::sha1::sha1; import syntax::ast; import syntax::print::pprust; import lib::llvm::{ModuleRef, mk_pass_manager, mk_target_data, True, False, FileType}; import metadata::filesearch; import syntax::ast_map::{path, path_mod, path_name}; enum output_type { output_type_none, output_type_bitcode, output_type_assembly, output_type_llvm_assembly, output_type_object, output_type_exe, } fn llvm_err(sess: session, msg: str) -> ! unsafe { let cstr = llvm::LLVMRustGetLastError(); if cstr == ptr::null() { sess.fatal(msg); } else { sess.fatal(msg + ": " + str::unsafe::from_c_str(cstr)); } } mod write { fn is_object_or_assembly_or_exe(ot: output_type) -> bool { if ot == output_type_assembly || ot == output_type_object || ot == output_type_exe { ret true; } ret false; } // Decides what to call an intermediate file, given the name of the output // and the extension to use. fn mk_intermediate_name(output_path: str, extension: str) -> str unsafe { let stem = alt str::find_char(output_path, '.') { some(dot_pos) { str::slice(output_path, 0u, dot_pos) } none { output_path } }; ret stem + "." + extension; } fn run_passes(sess: session, llmod: ModuleRef, output: str) { let opts = sess.opts; if sess.time_llvm_passes() { llvm::LLVMRustEnableTimePasses(); } let mut pm = mk_pass_manager(); let td = mk_target_data( sess.targ_cfg.target_strs.data_layout); llvm::LLVMAddTargetData(td.lltd, pm.llpm); // FIXME (#2812): run the linter here also, once there are llvm-c // bindings for it. // Generate a pre-optimization intermediate file if -save-temps was // specified. if opts.save_temps { alt opts.output_type { output_type_bitcode { if opts.optimize != 0u { let filename = mk_intermediate_name(output, "no-opt.bc"); str::as_c_str(filename, |buf| { llvm::LLVMWriteBitcodeToFile(llmod, buf) }); } } _ { let filename = mk_intermediate_name(output, "bc"); str::as_c_str(filename, |buf| { llvm::LLVMWriteBitcodeToFile(llmod, buf) }); } } } if !sess.no_verify() { llvm::LLVMAddVerifierPass(pm.llpm); } // FIXME (#2396): This is mostly a copy of the bits of opt's -O2 that // are available in the C api. // Also: We might want to add optimization levels like -O1, -O2, // -Os, etc // Also: Should we expose and use the pass lists used by the opt // tool? if opts.optimize != 0u { let fpm = mk_pass_manager(); llvm::LLVMAddTargetData(td.lltd, fpm.llpm); let FPMB = llvm::LLVMPassManagerBuilderCreate(); llvm::LLVMPassManagerBuilderSetOptLevel(FPMB, 2u as c_uint); llvm::LLVMPassManagerBuilderPopulateFunctionPassManager(FPMB, fpm.llpm); llvm::LLVMPassManagerBuilderDispose(FPMB); llvm::LLVMRunPassManager(fpm.llpm, llmod); let mut threshold = 225u; if opts.optimize == 3u { threshold = 275u; } let MPMB = llvm::LLVMPassManagerBuilderCreate(); llvm::LLVMPassManagerBuilderSetOptLevel(MPMB, opts.optimize as c_uint); llvm::LLVMPassManagerBuilderSetSizeLevel(MPMB, False); llvm::LLVMPassManagerBuilderSetDisableUnitAtATime(MPMB, False); llvm::LLVMPassManagerBuilderSetDisableUnrollLoops(MPMB, False); llvm::LLVMPassManagerBuilderSetDisableSimplifyLibCalls(MPMB, False); if threshold != 0u { llvm::LLVMPassManagerBuilderUseInlinerWithThreshold (MPMB, threshold as c_uint); } llvm::LLVMPassManagerBuilderPopulateModulePassManager(MPMB, pm.llpm); llvm::LLVMPassManagerBuilderDispose(MPMB); } if !sess.no_verify() { llvm::LLVMAddVerifierPass(pm.llpm); } if is_object_or_assembly_or_exe(opts.output_type) { let LLVMOptNone = 0 as c_int; // -O0 let LLVMOptLess = 1 as c_int; // -O1 let LLVMOptDefault = 2 as c_int; // -O2, -Os let LLVMOptAggressive = 3 as c_int; // -O3 let mut CodeGenOptLevel; alt check opts.optimize { 0u { CodeGenOptLevel = LLVMOptNone; } 1u { CodeGenOptLevel = LLVMOptLess; } 2u { CodeGenOptLevel = LLVMOptDefault; } 3u { CodeGenOptLevel = LLVMOptAggressive; } } let mut FileType; if opts.output_type == output_type_object || opts.output_type == output_type_exe { FileType = lib::llvm::ObjectFile; } else { FileType = lib::llvm::AssemblyFile; } // Write optimized bitcode if --save-temps was on. if opts.save_temps { // Always output the bitcode file with --save-temps let filename = mk_intermediate_name(output, "opt.bc"); llvm::LLVMRunPassManager(pm.llpm, llmod); str::as_c_str(filename, |buf| { llvm::LLVMWriteBitcodeToFile(llmod, buf) }); pm = mk_pass_manager(); // Save the assembly file if -S is used if opts.output_type == output_type_assembly { let _: () = str::as_c_str( sess.targ_cfg.target_strs.target_triple, |buf_t| { str::as_c_str(output, |buf_o| { llvm::LLVMRustWriteOutputFile( pm.llpm, llmod, buf_t, buf_o, lib::llvm::AssemblyFile as c_uint, CodeGenOptLevel, true) }) }); } // Save the object file for -c or --save-temps alone // This .o is needed when an exe is built if opts.output_type == output_type_object || opts.output_type == output_type_exe { let _: () = str::as_c_str( sess.targ_cfg.target_strs.target_triple, |buf_t| { str::as_c_str(output, |buf_o| { llvm::LLVMRustWriteOutputFile( pm.llpm, llmod, buf_t, buf_o, lib::llvm::ObjectFile as c_uint, CodeGenOptLevel, true) }) }); } } else { // If we aren't saving temps then just output the file // type corresponding to the '-c' or '-S' flag used let _: () = str::as_c_str( sess.targ_cfg.target_strs.target_triple, |buf_t| { str::as_c_str(output, |buf_o| { llvm::LLVMRustWriteOutputFile( pm.llpm, llmod, buf_t, buf_o, FileType as c_uint, CodeGenOptLevel, true) }) }); } // Clean up and return llvm::LLVMDisposeModule(llmod); if sess.time_llvm_passes() { llvm::LLVMRustPrintPassTimings(); } ret; } if opts.output_type == output_type_llvm_assembly { // Given options "-S --emit-llvm": output LLVM assembly str::as_c_str(output, |buf_o| { llvm::LLVMRustAddPrintModulePass(pm.llpm, llmod, buf_o)}); } else { // If only a bitcode file is asked for by using the '--emit-llvm' // flag, then output it here llvm::LLVMRunPassManager(pm.llpm, llmod); str::as_c_str(output, |buf| llvm::LLVMWriteBitcodeToFile(llmod, buf) ); } llvm::LLVMDisposeModule(llmod); if sess.time_llvm_passes() { llvm::LLVMRustPrintPassTimings(); } } } /* * Name mangling and its relationship to metadata. This is complex. Read * carefully. * * The semantic model of Rust linkage is, broadly, that "there's no global * namespace" between crates. Our aim is to preserve the illusion of this * model despite the fact that it's not *quite* possible to implement on * modern linkers. We initially didn't use system linkers at all, but have * been convinced of their utility. * * There are a few issues to handle: * * - Linkers operate on a flat namespace, so we have to flatten names. * We do this using the C++ namespace-mangling technique. Foo::bar * symbols and such. * * - Symbols with the same name but different types need to get different * linkage-names. We do this by hashing a string-encoding of the type into * a fixed-size (currently 16-byte hex) cryptographic hash function (CHF: * we use SHA1) to "prevent collisions". This is not airtight but 16 hex * digits on uniform probability means you're going to need 2**32 same-name * symbols in the same process before you're even hitting birthday-paradox * collision probability. * * - Symbols in different crates but with same names "within" the crate need * to get different linkage-names. * * So here is what we do: * * - Separate the meta tags into two sets: exported and local. Only work with * the exported ones when considering linkage. * * - Consider two exported tags as special (and mandatory): name and vers. * Every crate gets them; if it doesn't name them explicitly we infer them * as basename(crate) and "0.1", respectively. Call these CNAME, CVERS. * * - Define CMETA as all the non-name, non-vers exported meta tags in the * crate (in sorted order). * * - Define CMH as hash(CMETA + hashes of dependent crates). * * - Compile our crate to lib CNAME-CMH-CVERS.so * * - Define STH(sym) as hash(CNAME, CMH, type_str(sym)) * * - Suffix a mangled sym with ::STH@CVERS, so that it is unique in the * name, non-name metadata, and type sense, and versioned in the way * system linkers understand. * */ fn build_link_meta(sess: session, c: ast::crate, output: str, sha: sha1) -> link_meta { type provided_metas = {name: option<@str>, vers: option<@str>, cmh_items: ~[@ast::meta_item]}; fn provided_link_metas(sess: session, c: ast::crate) -> provided_metas { let mut name: option<@str> = none; let mut vers: option<@str> = none; let mut cmh_items: ~[@ast::meta_item] = ~[]; let linkage_metas = attr::find_linkage_metas(c.node.attrs); attr::require_unique_names(sess.diagnostic(), linkage_metas); for linkage_metas.each |meta| { if *attr::get_meta_item_name(meta) == "name" { alt attr::get_meta_item_value_str(meta) { some(v) { name = some(v); } none { vec::push(cmh_items, meta); } } } else if *attr::get_meta_item_name(meta) == "vers" { alt attr::get_meta_item_value_str(meta) { some(v) { vers = some(v); } none { vec::push(cmh_items, meta); } } } else { vec::push(cmh_items, meta); } } ret {name: name, vers: vers, cmh_items: cmh_items}; } // This calculates CMH as defined above fn crate_meta_extras_hash(sha: sha1, _crate: ast::crate, metas: provided_metas, dep_hashes: ~[@str]) -> str { fn len_and_str(s: str) -> str { ret #fmt["%u_%s", str::len(s), s]; } fn len_and_str_lit(l: ast::lit) -> str { ret len_and_str(pprust::lit_to_str(@l)); } let cmh_items = attr::sort_meta_items(metas.cmh_items); sha.reset(); for cmh_items.each |m_| { let m = m_; alt m.node { ast::meta_name_value(key, value) { sha.input_str(len_and_str(*key)); sha.input_str(len_and_str_lit(value)); } ast::meta_word(name) { sha.input_str(len_and_str(*name)); } ast::meta_list(_, _) { // FIXME (#607): Implement this fail "unimplemented meta_item variant"; } } } for dep_hashes.each |dh| { sha.input_str(len_and_str(*dh)); } ret truncated_sha1_result(sha); } fn warn_missing(sess: session, name: str, default: str) { if !sess.building_library { ret; } sess.warn(#fmt["missing crate link meta '%s', using '%s' as default", name, default]); } fn crate_meta_name(sess: session, _crate: ast::crate, output: str, metas: provided_metas) -> @str { ret alt metas.name { some(v) { v } none { let name = { let mut os = str::split_char(path::basename(output), '.'); if (vec::len(os) < 2u) { sess.fatal(#fmt("output file name %s doesn't\ appear to have an extension", output)); } vec::pop(os); str::connect(os, ".") }; warn_missing(sess, "name", name); @name } }; } fn crate_meta_vers(sess: session, _crate: ast::crate, metas: provided_metas) -> @str { ret alt metas.vers { some(v) { v } none { let vers = "0.0"; warn_missing(sess, "vers", vers); @vers } }; } let provided_metas = provided_link_metas(sess, c); let name = crate_meta_name(sess, c, output, provided_metas); let vers = crate_meta_vers(sess, c, provided_metas); let dep_hashes = cstore::get_dep_hashes(sess.cstore); let extras_hash = crate_meta_extras_hash(sha, c, provided_metas, dep_hashes); ret {name: name, vers: vers, extras_hash: extras_hash}; } fn truncated_sha1_result(sha: sha1) -> str unsafe { ret str::slice(sha.result_str(), 0u, 16u); } // This calculates STH for a symbol, as defined above fn symbol_hash(tcx: ty::ctxt, sha: sha1, t: ty::t, link_meta: link_meta) -> str { // NB: do *not* use abbrevs here as we want the symbol names // to be independent of one another in the crate. sha.reset(); sha.input_str(*link_meta.name); sha.input_str("-"); sha.input_str(link_meta.extras_hash); sha.input_str("-"); sha.input_str(encoder::encoded_ty(tcx, t)); let hash = truncated_sha1_result(sha); // Prefix with _ so that it never blends into adjacent digits ret "_" + hash; } fn get_symbol_hash(ccx: @crate_ctxt, t: ty::t) -> str { alt ccx.type_sha1s.find(t) { some(h) { ret h; } none { let hash = symbol_hash(ccx.tcx, ccx.sha, t, ccx.link_meta); ccx.type_sha1s.insert(t, hash); ret hash; } } } // Name sanitation. LLVM will happily accept identifiers with weird names, but // gas doesn't! fn sanitize(s: str) -> str { let mut result = ""; do str::chars_iter(s) |c| { alt c { '@' { result += "_sbox_"; } '~' { result += "_ubox_"; } '*' { result += "_ptr_"; } '&' { result += "_ref_"; } ',' { result += "_"; } '{' | '(' { result += "_of_"; } 'a' to 'z' | 'A' to 'Z' | '0' to '9' | '_' { str::push_char(result,c); } _ { if c > 'z' && char::is_XID_continue(c) { str::push_char(result,c); } } } } // Underscore-qualify anything that didn't start as an ident. if result.len() > 0u && result[0] != '_' as u8 && ! char::is_XID_start(result[0] as char) { ret "_" + result; } ret result; } fn mangle(ss: path) -> str { // Follow C++ namespace-mangling style let mut n = "_ZN"; // Begin name-sequence. for ss.each |s| { alt s { path_name(s) | path_mod(s) { let sani = sanitize(*s); n += #fmt["%u%s", str::len(sani), sani]; } } } n += "E"; // End name-sequence. n } fn exported_name(path: path, hash: @str, vers: @str) -> str { ret mangle( vec::append_one(vec::append_one(path, path_name(hash)), path_name(vers))); } fn mangle_exported_name(ccx: @crate_ctxt, path: path, t: ty::t) -> str { let hash = get_symbol_hash(ccx, t); ret exported_name(path, @hash, ccx.link_meta.vers); } fn mangle_internal_name_by_type_only(ccx: @crate_ctxt, t: ty::t, name: @str) -> str { let s = @util::ppaux::ty_to_short_str(ccx.tcx, t); let hash = get_symbol_hash(ccx, t); ret mangle(~[path_name(name), path_name(s), path_name(@hash)]); } fn mangle_internal_name_by_path_and_seq(ccx: @crate_ctxt, path: path, flav: @str) -> str { ret mangle(vec::append_one(path, path_name(@ccx.names(*flav)))); } fn mangle_internal_name_by_path(_ccx: @crate_ctxt, path: path) -> str { ret mangle(path); } fn mangle_internal_name_by_seq(ccx: @crate_ctxt, flav: @str) -> str { ret ccx.names(*flav); } // If the user wants an exe generated we need to invoke // cc to link the object file with some libs fn link_binary(sess: session, obj_filename: str, out_filename: str, lm: link_meta) { // Converts a library file name into a cc -l argument fn unlib(config: @session::config, filename: str) -> str unsafe { let rmlib = fn@(filename: str) -> str { let found = str::find_str(filename, "lib"); if config.os == session::os_macos || (config.os == session::os_linux || config.os == session::os_freebsd) && option::is_some(found) && option::get(found) == 0u { ret str::slice(filename, 3u, str::len(filename)); } else { ret filename; } }; fn rmext(filename: str) -> str { let mut parts = str::split_char(filename, '.'); vec::pop(parts); ret str::connect(parts, "."); } ret alt config.os { session::os_macos { rmext(rmlib(filename)) } session::os_linux { rmext(rmlib(filename)) } session::os_freebsd { rmext(rmlib(filename)) } _ { rmext(filename) } }; } let output = if sess.building_library { let long_libname = os::dll_filename(#fmt("%s-%s-%s", *lm.name, lm.extras_hash, *lm.vers)); #debug("link_meta.name: %s", *lm.name); #debug("long_libname: %s", long_libname); #debug("out_filename: %s", out_filename); #debug("dirname(out_filename): %s", path::dirname(out_filename)); path::connect(path::dirname(out_filename), long_libname) } else { out_filename }; log(debug, "output: " + output); // The default library location, we need this to find the runtime. // The location of crates will be determined as needed. let stage: str = "-L" + sess.filesearch.get_target_lib_path(); // In the future, FreeBSD will use clang as default compiler. // It would be flexible to use cc (system's default C compiler) // instead of hard-coded gcc. // For win32, there is no cc command, // so we add a condition to make it use gcc. let cc_prog: str = if sess.targ_cfg.os == session::os_win32 { "gcc" } else { "cc" }; // The invocations of cc share some flags across platforms let mut cc_args = vec::append(~[stage], sess.targ_cfg.target_strs.cc_args); vec::push(cc_args, "-o"); vec::push(cc_args, output); vec::push(cc_args, obj_filename); let mut lib_cmd; let os = sess.targ_cfg.os; if os == session::os_macos { lib_cmd = "-dynamiclib"; } else { lib_cmd = "-shared"; } // # Crate linking let cstore = sess.cstore; for cstore::get_used_crate_files(cstore).each |cratepath| { if str::ends_with(cratepath, ".rlib") { vec::push(cc_args, cratepath); again; } let cratepath = cratepath; let dir = path::dirname(cratepath); if dir != "" { vec::push(cc_args, "-L" + dir); } let libarg = unlib(sess.targ_cfg, path::basename(cratepath)); vec::push(cc_args, "-l" + libarg); } let ula = cstore::get_used_link_args(cstore); for ula.each |arg| { vec::push(cc_args, arg); } // # Extern library linking // User-supplied library search paths (-L on the cammand line) These are // the same paths used to find Rust crates, so some of them may have been // added already by the previous crate linking code. This only allows them // to be found at compile time so it is still entirely up to outside // forces to make sure that library can be found at runtime. let addl_paths = sess.opts.addl_lib_search_paths; for addl_paths.each |path| { vec::push(cc_args, "-L" + path); } // The names of the extern libraries let used_libs = cstore::get_used_libraries(cstore); for used_libs.each |l| { vec::push(cc_args, "-l" + l); } if sess.building_library { vec::push(cc_args, lib_cmd); // On mac we need to tell the linker to let this library // be rpathed if sess.targ_cfg.os == session::os_macos { vec::push(cc_args, "-Wl,-install_name,@rpath/" + path::basename(output)); } } if !sess.debugging_opt(session::no_rt) { // Always want the runtime linked in vec::push(cc_args, "-lrustrt"); } // On linux librt and libdl are an indirect dependencies via rustrt, // and binutils 2.22+ won't add them automatically if sess.targ_cfg.os == session::os_linux { vec::push_all(cc_args, ~["-lrt", "-ldl"]); // LLVM implements the `frem` instruction as a call to `fmod`, // which lives in libm. Similar to above, on some linuxes we // have to be explicit about linking to it. See #2510 vec::push(cc_args, "-lm"); } if sess.targ_cfg.os == session::os_freebsd { vec::push_all(cc_args, ~["-pthread", "-lrt", "-L/usr/local/lib", "-lexecinfo", "-L/usr/local/lib/gcc46", "-L/usr/local/lib/gcc44", "-lstdc++", "-Wl,-z,origin", "-Wl,-rpath,/usr/local/lib/gcc46", "-Wl,-rpath,/usr/local/lib/gcc44"]); } // OS X 10.6 introduced 'compact unwind info', which is produced by the // linker from the dwarf unwind info. Unfortunately, it does not seem to // understand how to unwind our __morestack frame, so we have to turn it // off. This has impacted some other projects like GHC. if sess.targ_cfg.os == session::os_macos { vec::push(cc_args, "-Wl,-no_compact_unwind"); } // Stack growth requires statically linking a __morestack function vec::push(cc_args, "-lmorestack"); // FIXME (#2397): At some point we want to rpath our guesses as to where // extern libraries might live, based on the addl_lib_search_paths vec::push_all(cc_args, rpath::get_rpath_flags(sess, output)); #debug("%s link args: %s", cc_prog, str::connect(cc_args, " ")); // We run 'cc' here let prog = run::program_output(cc_prog, cc_args); if 0 != prog.status { sess.err(#fmt["linking with %s failed with code %d", cc_prog, prog.status]); sess.note(#fmt["%s arguments: %s", cc_prog, str::connect(cc_args, " ")]); sess.note(prog.err + prog.out); sess.abort_if_errors(); } // Clean up on Darwin if sess.targ_cfg.os == session::os_macos { run::run_program("dsymutil", ~[output]); } // Remove the temporary object file if we aren't saving temps if !sess.opts.save_temps { if ! os::remove_file(obj_filename) { sess.warn(#fmt["failed to delete object file '%s'", obj_filename]); } } } // // Local Variables: // mode: rust // fill-column: 78; // indent-tabs-mode: nil // c-basic-offset: 4 // buffer-file-coding-system: utf-8-unix // End: //