1 // Copyright 2012-2015 The Rust Project Developers. See the COPYRIGHT
2 // file at the top-level directory of this distribution and at
3 // http://rust-lang.org/COPYRIGHT.
5 // Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
6 // http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
7 // <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
8 // option. This file may not be copied, modified, or distributed
9 // except according to those terms.
11 //! Codegen the completed AST to the LLVM IR.
13 //! Some functions here, such as codegen_block and codegen_expr, return a value --
14 //! the result of the codegen to LLVM -- while others, such as codegen_fn
15 //! and mono_item, are called only for the side effect of adding a
16 //! particular definition to the LLVM IR output we're producing.
18 //! Hopefully useful general knowledge about codegen:
20 //! * There's no way to find out the Ty type of a Value. Doing so
21 //! would be "trying to get the eggs out of an omelette" (credit:
22 //! pcwalton). You can, instead, find out its llvm::Type by calling val_ty,
23 //! but one llvm::Type corresponds to many `Ty`s; for instance, tup(int, int,
24 //! int) and rec(x=int, y=int, z=int) will have the same llvm::Type.
26 use super::ModuleLlvm;
27 use super::ModuleCodegen;
28 use super::ModuleKind;
29 use super::CachedModuleCodegen;
32 use back::write::{self, OngoingCodegen};
33 use llvm::{self, TypeKind, get_param};
35 use rustc::dep_graph::cgu_reuse_tracker::CguReuse;
36 use rustc::hir::def_id::{CrateNum, DefId, LOCAL_CRATE};
37 use rustc::middle::lang_items::StartFnLangItem;
38 use rustc::middle::weak_lang_items;
39 use rustc::mir::mono::{Linkage, Visibility, Stats, CodegenUnitNameBuilder};
40 use rustc::middle::cstore::{EncodedMetadata};
41 use rustc::ty::{self, Ty, TyCtxt};
42 use rustc::ty::layout::{self, Align, TyLayout, LayoutOf, VariantIdx};
43 use rustc::ty::query::Providers;
44 use rustc::middle::cstore::{self, LinkagePreference};
45 use rustc::middle::exported_symbols;
46 use rustc::util::common::{time, print_time_passes_entry};
47 use rustc::util::profiling::ProfileCategory;
48 use rustc::session::config::{self, DebugInfo, EntryFnType, Lto};
49 use rustc::session::Session;
50 use rustc_incremental;
52 use mir::place::PlaceRef;
54 use builder::{Builder, MemFlags};
56 use common::{C_bool, C_bytes_in_context, C_usize};
57 use rustc_mir::monomorphize::item::DefPathBasedNames;
58 use common::{C_struct_in_context, C_array, val_ty};
60 use context::CodegenCx;
65 use monomorphize::Instance;
66 use monomorphize::partitioning::{CodegenUnit, CodegenUnitExt};
67 use rustc_codegen_utils::symbol_names_test;
69 use mono_item::{MonoItem, MonoItemExt};
71 use type_of::LayoutLlvmExt;
72 use rustc::util::nodemap::FxHashMap;
74 use rustc_data_structures::small_c_str::SmallCStr;
75 use rustc_data_structures::sync::Lrc;
76 use rustc_data_structures::indexed_vec::Idx;
78 use traits::BuilderMethods;
82 use std::ffi::CString;
83 use std::ops::{Deref, DerefMut};
85 use std::time::{Instant, Duration};
87 use syntax_pos::symbol::InternedString;
89 use rustc::hir::{self, CodegenFnAttrs};
91 use value::{Value, ValueTrait};
93 use mir::operand::OperandValue;
95 use rustc_codegen_utils::check_for_rustc_errors_attr;
/// Guard tied to a codegen context. Its `Drop` impl pushes an LLVM instruction
/// count for a named function into the context's stats when codegen stats are
/// enabled.
97 pub struct StatRecorder<'a, 'll: 'a, 'tcx: 'll> {
// Codegen context whose `stats` are read in `new` and updated on drop.
98 cx: &'a CodegenCx<'ll, 'tcx>,
103 impl StatRecorder<'a, 'll, 'tcx> {
/// Creates a recorder for `cx` labelled with `name`.
104 pub fn new(cx: &'a CodegenCx<'ll, 'tcx>, name: String) -> Self {
// Snapshot the context's running LLVM instruction counter as the baseline.
105 let istart = cx.stats.borrow().n_llvm_insns;
// On drop, report how many LLVM instructions were counted since `istart`.
114 impl Drop for StatRecorder<'a, 'll, 'tcx> {
// Stats are only updated when the session requested codegen statistics.
116 if self.cx.sess().codegen_stats() {
117 let mut stats = self.cx.stats.borrow_mut();
118 let iend = stats.n_llvm_insns;
// Record (name, instructions emitted since the baseline); `name` is taken,
// so it is consumed by this push.
119 stats.fn_stats.push((self.name.take().unwrap(), iend - self.istart));
121 // Reset LLVM insn count to avoid compound costs.
122 stats.n_llvm_insns = self.istart;
/// Maps a HIR comparison operator to the corresponding LLVM integer predicate.
///
/// `Eq` and `Ne` do not depend on signedness; the ordering operators select the
/// signed (`IntS*`) or unsigned (`IntU*`) predicate based on `signed`.
127 pub fn bin_op_to_icmp_predicate(op: hir::BinOpKind,
129 -> llvm::IntPredicate {
130-less note: lines of this function that are not shown here are left as-is.
131 hir::BinOpKind::Eq => llvm::IntEQ,
132 hir::BinOpKind::Ne => llvm::IntNE,
133 hir::BinOpKind::Lt => if signed { llvm::IntSLT } else { llvm::IntULT },
134 hir::BinOpKind::Le => if signed { llvm::IntSLE } else { llvm::IntULE },
135 hir::BinOpKind::Gt => if signed { llvm::IntSGT } else { llvm::IntUGT },
136 hir::BinOpKind::Ge => if signed { llvm::IntSGE } else { llvm::IntUGE },
// NOTE(review): the message names `comparison_op_to_icmp_predicate`, which does
// not match this function's name -- presumably left over from a rename.
138 bug!("comparison_op_to_icmp_predicate: expected comparison operator, \
/// Maps a HIR comparison operator to the corresponding LLVM floating-point
/// predicate.
///
/// Every operator maps to a `RealO*` predicate except `Ne`, which maps to
/// `RealUNE`.
145 pub fn bin_op_to_fcmp_predicate(op: hir::BinOpKind) -> llvm::RealPredicate {
147 hir::BinOpKind::Eq => llvm::RealOEQ,
148 hir::BinOpKind::Ne => llvm::RealUNE,
149 hir::BinOpKind::Lt => llvm::RealOLT,
150 hir::BinOpKind::Le => llvm::RealOLE,
151 hir::BinOpKind::Gt => llvm::RealOGT,
152 hir::BinOpKind::Ge => llvm::RealOGE,
// NOTE(review): the message names `comparison_op_to_fcmp_predicate`, which does
// not match this function's name -- presumably left over from a rename.
154 bug!("comparison_op_to_fcmp_predicate: expected comparison operator, \
/// Emits a comparison of `lhs` and `rhs` for a SIMD type and sign-extends the
/// comparison result to `ret_ty`.
161 pub fn compare_simd_types(
162 bx: &Builder<'a, 'll, 'tcx>,
// The kind of `t` decides between a float compare and a signed/unsigned
// integer compare; anything else is a compiler bug.
169 let signed = match t.sty {
// Float path: build the fcmp and return early with the sign-extended result.
171 let cmp = bin_op_to_fcmp_predicate(op);
172 return bx.sext(bx.fcmp(cmp, lhs, rhs), ret_ty);
174 ty::Uint(_) => false,
176 _ => bug!("compare_simd_types: invalid SIMD type"),
179 let cmp = bin_op_to_icmp_predicate(op, signed);
180 // LLVM outputs an `< size x i1 >`, so we need to perform a sign extension
181 // to get the correctly sized type. This will compile to a single instruction
182 // once the IR is converted to assembly if the SIMD instruction is supported
183 // by the target architecture.
184 bx.sext(bx.icmp(cmp, lhs, rhs), ret_ty)
187 /// Retrieve the information we are losing (making dynamic) in an unsizing
190 /// The `old_info` argument is a bit funny. It is intended for use
191 /// in an upcast, where the new vtable for an object will be derived
192 /// from the old one.
194 cx: &CodegenCx<'ll, 'tcx>,
197 old_info: Option<&'ll Value>,
// Compare the tails that `struct_lockstep_tails` returns for the two types.
199 let (source, target) = cx.tcx.struct_lockstep_tails(source, target);
200 match (&source.sty, &target.sty) {
// Array -> slice: the extra info is the array length as a `usize` constant.
201 (&ty::Array(_, len), &ty::Slice(_)) => {
202 C_usize(cx, len.unwrap_usize(cx.tcx))
// Trait object -> trait object: reuse the caller-supplied `old_info`.
204 (&ty::Dynamic(..), &ty::Dynamic(..)) => {
205 // For now, upcasts are limited to changes in marker
206 // traits, and hence never actually require an actual
207 // change to the vtable.
208 old_info.expect("unsized_info: missing old info for trait upcast")
// Anything else -> trait object: fetch the vtable for `source` and cast it to
// the LLVM type of the fat pointer's extra field.
210 (_, &ty::Dynamic(ref data, ..)) => {
211 let vtable_ptr = cx.layout_of(cx.tcx.mk_mut_ptr(target))
212 .field(cx, abi::FAT_PTR_EXTRA);
213 consts::ptrcast(meth::get_vtable(cx, source, data.principal()),
214 vtable_ptr.llvm_type(cx))
216 _ => bug!("unsized_info: invalid unsizing {:?} -> {:?}",
222 /// Coerce `src` to `dst_ty`. `src_ty` must be a thin pointer.
///
/// Returns a pair of values: the cast data pointer and the extra info produced
/// by `unsized_info`.
223 pub fn unsize_thin_ptr(
224 bx: &Builder<'a, 'll, 'tcx>,
228 ) -> (&'ll Value, &'ll Value) {
229 debug!("unsize_thin_ptr: {:?} => {:?}", src_ty, dst_ty);
230 match (&src_ty.sty, &dst_ty.sty) {
234 &ty::RawPtr(ty::TypeAndMut { ty: b, .. })) |
235 (&ty::RawPtr(ty::TypeAndMut { ty: a, .. }),
236 &ty::RawPtr(ty::TypeAndMut { ty: b, .. })) => {
// The source pointee must be sized; cast the pointer to the destination
// pointee's LLVM pointer type and compute the extra info for `a -> b`.
237 assert!(bx.cx.type_is_sized(a));
238 let ptr_ty = bx.cx.layout_of(b).llvm_type(bx.cx).ptr_to();
239 (bx.pointercast(src, ptr_ty), unsized_info(bx.cx, a, b, None))
// Box -> Box: same treatment, applied to the boxed types.
241 (&ty::Adt(def_a, _), &ty::Adt(def_b, _)) if def_a.is_box() && def_b.is_box() => {
242 let (a, b) = (src_ty.boxed_ty(), dst_ty.boxed_ty());
243 assert!(bx.cx.type_is_sized(a));
244 let ptr_ty = bx.cx.layout_of(b).llvm_type(bx.cx).ptr_to();
245 (bx.pointercast(src, ptr_ty), unsized_info(bx.cx, a, b, None))
// Same ADT on both sides: recurse into a field whose type differs between
// source and destination. The assertions require that field to sit at
// offset 0, to span the whole source layout, and to be the only such field.
247 (&ty::Adt(def_a, _), &ty::Adt(def_b, _)) => {
248 assert_eq!(def_a, def_b);
250 let src_layout = bx.cx.layout_of(src_ty);
251 let dst_layout = bx.cx.layout_of(dst_ty);
252 let mut result = None;
253 for i in 0..src_layout.fields.count() {
254 let src_f = src_layout.field(bx.cx, i);
255 assert_eq!(src_layout.fields.offset(i).bytes(), 0);
256 assert_eq!(dst_layout.fields.offset(i).bytes(), 0);
260 assert_eq!(src_layout.size, src_f.size);
262 let dst_f = dst_layout.field(bx.cx, i);
263 assert_ne!(src_f.ty, dst_f.ty);
264 assert_eq!(result, None);
265 result = Some(unsize_thin_ptr(bx, src, src_f.ty, dst_f.ty));
267 let (lldata, llextra) = result.unwrap();
268 // HACK(eddyb) have to bitcast pointers until LLVM removes pointee types.
269 (bx.bitcast(lldata, dst_layout.scalar_pair_element_llvm_type(bx.cx, 0, true)),
270 bx.bitcast(llextra, dst_layout.scalar_pair_element_llvm_type(bx.cx, 1, true)))
272 _ => bug!("unsize_thin_ptr: called on bad types"),
276 /// Coerce `src`, which is a reference to a value of type `src_ty`,
277 /// to a value of type `dst_ty` and store the result in `dst`
278 pub fn coerce_unsized_into(
279 bx: &Builder<'a, 'll, 'tcx>,
280 src: PlaceRef<'tcx, &'ll Value>,
281 dst: PlaceRef<'tcx, &'ll Value>
283 let src_ty = src.layout.ty;
284 let dst_ty = dst.layout.ty;
// Shared helper for the pointer-like cases: load `src`, produce a
// (base, info) pair and store it into `dst`.
285 let coerce_ptr = || {
286 let (base, info) = match src.load(bx).val {
287 OperandValue::Pair(base, info) => {
288 // fat-ptr to fat-ptr unsize preserves the vtable
289 // i.e. &'a fmt::Debug+Send => &'a fmt::Debug
290 // So we need to pointercast the base to ensure
291 // the types match up.
292 let thin_ptr = dst.layout.field(bx.cx, abi::FAT_PTR_ADDR);
293 (bx.pointercast(base, thin_ptr.llvm_type(bx.cx)), info)
// Thin pointer: compute the fat pointer components from scratch.
295 OperandValue::Immediate(base) => {
296 unsize_thin_ptr(bx, base, src_ty, dst_ty)
298 OperandValue::Ref(..) => bug!()
300 OperandValue::Pair(base, info).store(bx, dst);
302 match (&src_ty.sty, &dst_ty.sty) {
303 (&ty::Ref(..), &ty::Ref(..)) |
304 (&ty::Ref(..), &ty::RawPtr(..)) |
305 (&ty::RawPtr(..), &ty::RawPtr(..)) => {
308 (&ty::Adt(def_a, _), &ty::Adt(def_b, _)) if def_a.is_box() && def_b.is_box() => {
// Same ADT on both sides: walk the fields of variant 0, copying fields whose
// type is unchanged and recursing into fields whose type differs.
312 (&ty::Adt(def_a, _), &ty::Adt(def_b, _)) => {
313 assert_eq!(def_a, def_b);
315 for i in 0..def_a.variants[VariantIdx::new(0)].fields.len() {
316 let src_f = src.project_field(bx, i);
317 let dst_f = dst.project_field(bx, i);
319 if dst_f.layout.is_zst() {
323 if src_f.layout.ty == dst_f.layout.ty {
324 memcpy_ty(bx, dst_f.llval, dst_f.align, src_f.llval, src_f.align,
325 src_f.layout, MemFlags::empty());
327 coerce_unsized_into(bx, src_f, dst_f);
331 _ => bug!("coerce_unsized_into: invalid coercion {:?} -> {:?}",
/// Adjusts the right-hand side of a shift via `cast_shift_rhs`, supplying the
/// builder's `trunc` and `zext` as the narrowing and widening operations.
337 pub fn cast_shift_expr_rhs(
338 cx: &Builder<'_, 'll, '_>, op: hir::BinOpKind, lhs: &'ll Value, rhs: &'ll Value
340 cast_shift_rhs(op, lhs, rhs, |a, b| cx.trunc(a, b), |a, b| cx.zext(a, b))
// Generic worker behind `cast_shift_expr_rhs`: compares the integer widths of
// `lhs` and `rhs` (element widths for vectors). `F` and `G` are caller-supplied
// cast callbacks, each usable at most once (`FnOnce`).
343 fn cast_shift_rhs<'ll, F, G>(op: hir::BinOpKind,
349 where F: FnOnce(&'ll Value, &'ll Type) -> &'ll Value,
350 G: FnOnce(&'ll Value, &'ll Type) -> &'ll Value
352 // Shifts may have any size int on the rhs
354 let mut rhs_llty = val_ty(rhs);
355 let mut lhs_llty = val_ty(lhs);
// For vector operands, compare the element types rather than the vector types.
356 if rhs_llty.kind() == TypeKind::Vector {
357 rhs_llty = rhs_llty.element_type()
359 if lhs_llty.kind() == TypeKind::Vector {
360 lhs_llty = lhs_llty.element_type()
362 let rhs_sz = rhs_llty.int_width();
363 let lhs_sz = lhs_llty.int_width();
366 } else if lhs_sz > rhs_sz {
367 // FIXME (#1877): If in the future shifting by negative
368 // values is no longer undefined then this is wrong.
378 /// Returns whether this session's target will use SEH-based unwinding.
380 /// This is only true for MSVC targets, and even then the 64-bit MSVC target
381 /// currently uses SEH-ish unwinding with DWARF info tables to the side (same as
382 /// 64-bit MinGW) instead of "full SEH".
383 pub fn wants_msvc_seh(sess: &Session) -> bool {
// The decision is read straight from the target options' `is_like_msvc` flag.
384 sess.target.target.options.is_like_msvc
/// Emits a call to the `llvm.assume` intrinsic with `val` as its only argument.
387 pub fn call_assume(bx: &Builder<'_, 'll, '_>, val: &'ll Value) {
// Look the intrinsic up through the builder's codegen context.
388 let assume_intrinsic = bx.cx.get_intrinsic("llvm.assume");
389 bx.call(assume_intrinsic, &[val], None);
/// Converts an immediate value for storage: a value of LLVM type `i1` is
/// zero-extended to `i8`.
392 pub fn from_immediate<'a, 'll: 'a, 'tcx: 'll,
394 Builder: BuilderMethods<'a, 'll, 'tcx, Value>>(
397 ) -> &'ll Value where Value : ValueTrait {
// Only `i1` values take the widening path below.
398 if val_ty(val) == Type::i1(bx.cx()) {
399 bx.zext(val, Type::i8(bx.cx()))
// Layout-driven conversion of `val`: when the layout's ABI is a single scalar,
// the work is delegated to `to_immediate_scalar`.
406 bx: &Builder<'_, 'll, '_>,
408 layout: layout::TyLayout,
410 if let layout::Abi::Scalar(ref scalar) = layout.abi {
411 return to_immediate_scalar(bx, val, scalar);
/// Converts `val` to its immediate form for the given `scalar`: boolean scalars
/// are truncated to `i1`.
416 pub fn to_immediate_scalar(
417 bx: &Builder<'_, 'll, '_>,
419 scalar: &layout::Scalar,
// Bools take the truncating path; this is the counterpart of the `i1` -> `i8`
// zero-extension done in `from_immediate`.
421 if scalar.is_bool() {
422 return bx.trunc(val, Type::i1(bx.cx));
/// Copies `n_bytes` from `src` to `dst` honouring `flags`.
///
/// With `MemFlags::NONTEMPORAL` the copy is expressed as a load followed by a
/// flagged store; otherwise it goes through the builder's `memcpy`.
427 pub fn call_memcpy<'a, 'll: 'a, 'tcx: 'll,
429 Builder: BuilderMethods<'a, 'll, 'tcx, Value>>(
437 ) where Value : ValueTrait {
438 if flags.contains(MemFlags::NONTEMPORAL) {
439 // HACK(nox): This is inefficient but there is no nontemporal memcpy.
440 let val = bx.load(src, src_align);
441 let ptr = bx.pointercast(dst, val_ty(val).ptr_to());
442 bx.store_with_flags(val, ptr, dst_align, flags);
// Regular path: cast both pointers to `i8*`, cast the size to the context's
// `isize_ty`, and forward the volatile flag to `memcpy`.
446 let src_ptr = bx.pointercast(src, Type::i8p(cx));
447 let dst_ptr = bx.pointercast(dst, Type::i8p(cx));
448 let size = bx.intcast(n_bytes, cx.isize_ty, false);
449 let volatile = flags.contains(MemFlags::VOLATILE);
450 bx.memcpy(dst_ptr, dst_align.abi(), src_ptr, src_align.abi(), size, volatile);
/// Copies one value described by `layout` from `src` to `dst` by calling
/// `call_memcpy` with the layout's size in bytes.
453 pub fn memcpy_ty<'a, 'll: 'a, 'tcx: 'll,
455 Builder: BuilderMethods<'a, 'll, 'tcx, Value>>(
461 layout: TyLayout<'tcx>,
463 ) where Value : ValueTrait {
// Byte size of the value, taken from its layout.
464 let size = layout.size.bytes();
469 call_memcpy(bx, dst, dst_align, src, src_align, C_usize(bx.cx(), size), flags);
// Emits a call to the `llvm.memset.p0i8.i{N}` intrinsic, where `N` is the
// target's pointer width.
473 bx: &Builder<'_, 'll, '_>,
475 fill_byte: &'ll Value,
// The intrinsic name is derived from the session's target pointer width.
480 let ptr_width = &bx.cx.sess().target.target.target_pointer_width;
481 let intrinsic_key = format!("llvm.memset.p0i8.i{}", ptr_width);
482 let llintrinsicfn = bx.cx.get_intrinsic(&intrinsic_key);
// The volatile flag is passed to the intrinsic as a boolean constant.
483 let volatile = C_bool(bx.cx, volatile);
484 bx.call(llintrinsicfn, &[ptr, fill_byte, size, align, volatile], None)
/// Generates code for an already-declared `instance` by running MIR codegen on
/// its declaration.
487 pub fn codegen_instance<'a, 'tcx>(cx: &CodegenCx<'a, 'tcx>, instance: Instance<'tcx>) {
// When codegen stats are enabled, keep a `StatRecorder` named after the
// instance's def path alive in `_s`.
488 let _s = if cx.sess().codegen_stats() {
489 let mut instance_name = String::new();
490 DefPathBasedNames::new(cx.tcx, true, true)
491 .push_def_path(instance.def_id(), &mut instance_name);
492 Some(StatRecorder::new(cx, instance_name))
497 // this is an info! to allow collecting monomorphization statistics
498 // and to allow finding the last function before LLVM aborts from
500 info!("codegen_instance({})", instance);
502 let sig = instance.fn_sig(cx.tcx);
503 let sig = cx.tcx.normalize_erasing_late_bound_regions(ty::ParamEnv::reveal_all(), &sig);
// The instance must have been declared earlier; a missing entry is a bug.
505 let lldecl = cx.instances.borrow().get(&instance).cloned().unwrap_or_else(||
506 bug!("Instance `{:?}` not already declared", instance));
// NOTE(review): this bumps `n_closures` for every instance that reaches this
// point in the visible code -- confirm that is the intended counter.
508 cx.stats.borrow_mut().n_closures += 1;
510 let mir = cx.tcx.instance_mir(instance.def);
511 mir::codegen_mir(cx, lldecl, &mir, instance, sig);
514 pub fn set_link_section(llval: &Value, attrs: &CodegenFnAttrs) {
515 let sect = match attrs.link_section {
520 let buf = SmallCStr::new(§.as_str());
521 llvm::LLVMSetSection(llval, buf.as_ptr());
525 /// Create the `main` function which will initialize the rust runtime and call
526 /// user's main function.
527 fn maybe_create_entry_wrapper(cx: &CodegenCx) {
// Find the session's entry function, if any, and its span.
528 let (main_def_id, span) = match *cx.sess().entry_fn.borrow() {
529 Some((id, span, _)) => {
530 (cx.tcx.hir.local_def_id(id), span)
535 let instance = Instance::mono(cx.tcx, main_def_id);
537 if !cx.codegen_unit.contains_item(&MonoItem::Fn(instance)) {
538 // We want to create the wrapper in the same codegen unit as Rust's main
543 let main_llfn = callee::get_fn(cx, instance);
// The entry kind decides whether the wrapper goes through the `start` lang
// item (`Main`) or calls the user-defined start function directly (`Start`).
545 let et = cx.sess().entry_fn.get().map(|e| e.2);
547 Some(EntryFnType::Main) => create_entry_fn(cx, span, main_llfn, main_def_id, true),
548 Some(EntryFnType::Start) => create_entry_fn(cx, span, main_llfn, main_def_id, false),
549 None => {} // Do nothing.
// Helper that declares the C-level `main` symbol and fills in its body.
553 cx: &CodegenCx<'ll, '_>,
555 rust_main: &'ll Value,
556 rust_main_def_id: DefId,
557 use_start_lang_item: bool,
// LLVM signature of the wrapper: (c_int, i8**) -> c_int.
560 Type::func::<Value>(&[Type::c_int(cx), Type::i8p(cx).ptr_to()], Type::c_int(cx));
562 let main_ret_ty = cx.tcx.fn_sig(rust_main_def_id).output();
563 // Given that `main()` has no arguments,
564 // then its return type cannot have
565 // late-bound regions, since late-bound
566 // regions must appear in the argument
568 let main_ret_ty = cx.tcx.erase_regions(
569 &main_ret_ty.no_bound_vars().unwrap(),
// A value named `main` that is already defined is reported as an error and
// compilation is aborted.
572 if declare::get_defined_value(cx, "main").is_some() {
573 // FIXME: We should be smart and show a better diagnostic here.
574 cx.sess().struct_span_err(sp, "entry symbol `main` defined multiple times")
575 .help("did you use #[no_mangle] on `fn main`? Use #[start] instead")
577 cx.sess().abort_if_errors();
580 let llfn = declare::declare_cfn(cx, "main", llfty);
582 // `main` should respect same config for frame pointer elimination as rest of code
583 attributes::set_frame_pointer_elimination(cx, llfn);
584 attributes::apply_target_cpu_attr(cx, llfn);
586 let bx = Builder::new_block(cx, llfn, "top");
588 debuginfo::gdb::insert_reference_to_gdb_debug_scripts_section_global(&bx);
590 // Params from native main() used as args for rust start function
591 let param_argc = get_param(llfn, 0);
592 let param_argv = get_param(llfn, 1);
// `argc` is cast to the context's `isize_ty`; `argv` is passed through as-is.
593 let arg_argc = bx.intcast(param_argc, cx.isize_ty, true);
594 let arg_argv = param_argv;
596 let (start_fn, args) = if use_start_lang_item {
597 let start_def_id = cx.tcx.require_lang_item(StartFnLangItem);
598 let start_fn = callee::resolve_and_get_fn(
601 cx.tcx.intern_substs(&[main_ret_ty.into()]),
603 (start_fn, vec![bx.pointercast(rust_main, Type::i8p(cx).ptr_to()),
606 debug!("using user-defined start fn");
607 (rust_main, vec![arg_argc, arg_argv])
// Call the chosen start function and return its result cast to `c_int`.
610 let result = bx.call(start_fn, &args, None);
611 bx.ret(bx.intcast(result, Type::c_int(cx), true));
// Encodes the crate metadata and, when a compressed copy is required, embeds it
// as a global in `llvm_module`.
615 fn write_metadata<'a, 'gcx>(tcx: TyCtxt<'a, 'gcx, 'gcx>,
616 llvm_module: &ModuleLlvm)
619 use flate2::Compression;
620 use flate2::write::DeflateEncoder;
622 let (metadata_llcx, metadata_llmod) = (&*llvm_module.llcx, llvm_module.llmod());
624 #[derive(PartialEq, Eq, PartialOrd, Ord)]
// Each crate type maps to the kind of metadata it needs; the maximum across
// all requested crate types wins (no crate types means `None`).
631 let kind = tcx.sess.crate_types.borrow().iter().map(|ty| {
633 config::CrateType::Executable |
634 config::CrateType::Staticlib |
635 config::CrateType::Cdylib => MetadataKind::None,
637 config::CrateType::Rlib => MetadataKind::Uncompressed,
639 config::CrateType::Dylib |
640 config::CrateType::ProcMacro => MetadataKind::Compressed,
642 }).max().unwrap_or(MetadataKind::None);
// No metadata needed: return an empty `EncodedMetadata` without encoding.
644 if kind == MetadataKind::None {
645 return EncodedMetadata::new();
648 let metadata = tcx.encode_metadata();
649 if kind == MetadataKind::Uncompressed {
653 assert!(kind == MetadataKind::Compressed);
// The compressed blob starts with the metadata encoding version, followed by
// the deflate-compressed raw metadata.
654 let mut compressed = tcx.metadata_encoding_version();
655 DeflateEncoder::new(&mut compressed, Compression::fast())
656 .write_all(&metadata.raw_data).unwrap();
// Wrap the bytes in a constant struct and add it as a global named after the
// crate's metadata symbol.
658 let llmeta = C_bytes_in_context(metadata_llcx, &compressed);
659 let llconst = C_struct_in_context(metadata_llcx, &[llmeta], false);
660 let name = exported_symbols::metadata_symbol_name(tcx);
661 let buf = CString::new(name).unwrap();
662 let llglobal = unsafe {
663 llvm::LLVMAddGlobal(metadata_llmod, val_ty(llconst), buf.as_ptr())
666 llvm::LLVMSetInitializer(llglobal, llconst);
667 let section_name = metadata::metadata_section_name(&tcx.sess.target.target);
668 let name = SmallCStr::new(section_name);
669 llvm::LLVMSetSection(llglobal, name.as_ptr());
671 // Also generate a .section directive to force no
672 // flags, at least for ELF outputs, so that the
673 // metadata doesn't get loaded into memory.
674 let directive = format!(".section {}", section_name);
675 let directive = CString::new(directive).unwrap();
676 llvm::LLVMSetModuleInlineAsm(metadata_llmod, directive.as_ptr())
/// Iterator over LLVM values that advances by calling an `unsafe extern "C"`
/// step function on the current value.
681 pub struct ValueIter<'ll> {
// Value that the next call to `next` will start from; `None` when exhausted.
682 cur: Option<&'ll Value>,
// Function returning the successor of a value, or `None` at the end.
683 step: unsafe extern "C" fn(&'ll Value) -> Option<&'ll Value>,
// Walks the chain of values by repeatedly applying `step`.
686 impl Iterator for ValueIter<'ll> {
687 type Item = &'ll Value;
689 fn next(&mut self) -> Option<&'ll Value> {
// When there is a current value, advance the cursor to its successor.
691 if let Some(old) = old {
692 self.cur = unsafe { (self.step)(old) };
/// Returns an iterator over the globals of `llmod`, starting at
/// `LLVMGetFirstGlobal` and stepping with `LLVMGetNextGlobal`.
698 pub fn iter_globals(llmod: &'ll llvm::Module) -> ValueIter<'ll> {
701 cur: llvm::LLVMGetFirstGlobal(llmod),
702 step: llvm::LLVMGetNextGlobal,
// Decides whether previously cached output for `cgu` can be reused, based on
// the state of the dependency graph.
707 fn determine_cgu_reuse<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>,
708 cgu: &CodegenUnit<'tcx>)
// Reuse decisions need a fully enabled dep graph.
710 if !tcx.dep_graph.is_fully_enabled() {
714 let work_product_id = &cgu.work_product_id();
715 if tcx.dep_graph.previous_work_product(work_product_id).is_none() {
716 // We don't have anything cached for this CGU. This can happen
717 // if the CGU did not exist in the previous session.
721 // Try to mark the CGU as green. If we can do so, it means that nothing
722 // affecting the LLVM module has changed and we can re-use a cached version.
723 // If we compile with any kind of LTO, this means we can re-use the bitcode
724 // of the Pre-LTO stage (possibly also the Post-LTO version but we'll only
725 // know that later). If we are not doing LTO, there is only one optimized
726 // version of each module, so we re-use that.
727 let dep_node = cgu.codegen_dep_node(tcx);
// The dep-node must not exist yet at this point; otherwise something already
// ran codegen for this CGU in the current session.
728 assert!(!tcx.dep_graph.dep_node_exists(&dep_node),
729 "CompileCodegenUnit dep-node for CGU `{}` already exists before marking.",
732 if tcx.dep_graph.try_mark_green(tcx, &dep_node).is_some() {
733 // We can re-use either the pre- or the post-thinlto state
734 if tcx.sess.lto() != Lto::No {
/// Drives codegen for the local crate: writes metadata, optionally emits an
/// allocator shim, then compiles or reuses every codegen unit while feeding
/// the results to the asynchronous LLVM backend.
744 pub fn codegen_crate<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>,
745 rx: mpsc::Receiver<Box<dyn Any + Send>>)
748 check_for_rustc_errors_attr(tcx);
750 let cgu_name_builder = &mut CodegenUnitNameBuilder::new(tcx);
752 // Codegen the metadata.
753 tcx.sess.profiler(|p| p.start_activity(ProfileCategory::Codegen));
755 let metadata_cgu_name = cgu_name_builder.build_cgu_name(LOCAL_CRATE,
757 Some("metadata")).as_str()
759 let metadata_llvm_module = ModuleLlvm::new(tcx.sess, &metadata_cgu_name);
760 let metadata = time(tcx.sess, "write metadata", || {
761 write_metadata(tcx, &metadata_llvm_module)
763 tcx.sess.profiler(|p| p.end_activity(ProfileCategory::Codegen));
765 let metadata_module = ModuleCodegen {
766 name: metadata_cgu_name,
767 module_llvm: metadata_llvm_module,
768 kind: ModuleKind::Metadata,
// The time graph is only created when `-Z codegen-time-graph` is set.
771 let time_graph = if tcx.sess.opts.debugging_opts.codegen_time_graph {
772 Some(time_graph::TimeGraph::new())
777 // Skip crate items and just output metadata in -Z no-codegen mode.
778 if tcx.sess.opts.debugging_opts.no_codegen ||
779 !tcx.sess.opts.output_types.should_codegen() {
780 let ongoing_codegen = write::start_async_codegen(
787 ongoing_codegen.submit_pre_codegened_module_to_llvm(tcx, metadata_module);
788 ongoing_codegen.codegen_finished(tcx);
790 assert_and_save_dep_graph(tcx);
792 ongoing_codegen.check_for_errors(tcx.sess);
794 return ongoing_codegen;
797 // Run the monomorphization collector and partition the collected items into
799 let codegen_units = tcx.collect_and_partition_mono_items(LOCAL_CRATE).1;
800 let codegen_units = (*codegen_units).clone();
802 // Force all codegen_unit queries so they are already either red or green
803 // when compile_codegen_unit accesses them. We are not able to re-execute
804 // the codegen_unit query from just the DepNode, so an unknown color would
805 // lead to having to re-execute compile_codegen_unit, possibly
807 if tcx.dep_graph.is_fully_enabled() {
808 for cgu in &codegen_units {
809 tcx.codegen_unit(cgu.name().clone());
813 let ongoing_codegen = write::start_async_codegen(
818 codegen_units.len());
// From here on the handle is wrapped so that dropping it without calling
// `into_inner` sends `codegen_aborted`.
819 let ongoing_codegen = AbortCodegenOnDrop(Some(ongoing_codegen));
821 // Codegen an allocator shim, if necessary.
823 // If the crate doesn't have an `allocator_kind` set then there's definitely
824 // no shim to generate. Otherwise we also check our dependency graph for all
825 // our output crate types. If anything there looks like it's a `Dynamic`
826 // linkage, then it's already got an allocator shim and we'll be using that
827 // one instead. If nothing exists then it's our job to generate the
829 let any_dynamic_crate = tcx.sess.dependency_formats.borrow()
832 use rustc::middle::dependency_format::Linkage;
833 list.iter().any(|&linkage| linkage == Linkage::Dynamic)
835 let allocator_module = if any_dynamic_crate {
837 } else if let Some(kind) = *tcx.sess.allocator_kind.get() {
838 let llmod_id = cgu_name_builder.build_cgu_name(LOCAL_CRATE,
840 Some("allocator")).as_str()
842 let modules = ModuleLlvm::new(tcx.sess, &llmod_id);
843 time(tcx.sess, "write allocator module", || {
845 allocator::codegen(tcx, &modules, kind)
851 module_llvm: modules,
852 kind: ModuleKind::Allocator,
858 if let Some(allocator_module) = allocator_module {
859 ongoing_codegen.submit_pre_codegened_module_to_llvm(tcx, allocator_module);
862 ongoing_codegen.submit_pre_codegened_module_to_llvm(tcx, metadata_module);
864 // We sort the codegen units by size. This way we can schedule work for LLVM
865 // a bit more efficiently.
866 let codegen_units = {
867 let mut codegen_units = codegen_units;
// `cmp::Reverse` puts the units with the largest size estimate first.
868 codegen_units.sort_by_cached_key(|cgu| cmp::Reverse(cgu.size_estimate()));
872 let mut total_codegen_time = Duration::new(0, 0);
873 let mut all_stats = Stats::default();
875 for cgu in codegen_units.into_iter() {
// Wait for the backend's signal and bail out early on reported errors before
// starting on the next unit.
876 ongoing_codegen.wait_for_signal_to_codegen_item();
877 ongoing_codegen.check_for_errors(tcx.sess);
879 let cgu_reuse = determine_cgu_reuse(tcx, &cgu);
880 tcx.sess.cgu_reuse_tracker.set_actual_reuse(&cgu.name().as_str(), cgu_reuse);
884 let _timing_guard = time_graph.as_ref().map(|time_graph| {
885 time_graph.start(write::CODEGEN_WORKER_TIMELINE,
886 write::CODEGEN_WORK_PACKAGE_KIND,
887 &format!("codegen {}", cgu.name()))
// Compile the unit, merging its stats and elapsed time into the running totals.
889 let start_time = Instant::now();
890 let stats = compile_codegen_unit(tcx, *cgu.name());
891 all_stats.extend(stats);
892 total_codegen_time += start_time.elapsed();
// Reusable units are submitted as cached modules built from their work product.
895 CguReuse::PreLto => {
896 write::submit_pre_lto_module_to_llvm(tcx, CachedModuleCodegen {
897 name: cgu.name().to_string(),
898 source: cgu.work_product(tcx),
902 CguReuse::PostLto => {
903 write::submit_post_lto_module_to_llvm(tcx, CachedModuleCodegen {
904 name: cgu.name().to_string(),
905 source: cgu.work_product(tcx),
912 ongoing_codegen.codegen_finished(tcx);
914 // Since the main thread is sometimes blocked during codegen, we keep track
915 // of -Ztime-passes output manually.
916 print_time_passes_entry(tcx.sess.time_passes(),
917 "codegen to LLVM IR",
920 rustc_incremental::assert_module_sources::assert_module_sources(tcx);
922 symbol_names_test::report_symbol_names(tcx);
// Optional statistics dump, gated on the session's codegen-stats setting.
924 if tcx.sess.codegen_stats() {
925 println!("--- codegen stats ---");
926 println!("n_glues_created: {}", all_stats.n_glues_created);
927 println!("n_null_glues: {}", all_stats.n_null_glues);
928 println!("n_real_glues: {}", all_stats.n_real_glues);
930 println!("n_fns: {}", all_stats.n_fns);
931 println!("n_inlines: {}", all_stats.n_inlines);
932 println!("n_closures: {}", all_stats.n_closures);
933 println!("fn stats:");
// Per-function stats are printed in ascending order of instruction count.
934 all_stats.fn_stats.sort_by_key(|&(_, insns)| insns);
935 for &(ref name, insns) in all_stats.fn_stats.iter() {
936 println!("{} insns, {}", insns, *name);
940 if tcx.sess.count_llvm_insns() {
941 for (k, v) in all_stats.llvm_insns.iter() {
942 println!("{:7} {}", *v, *k);
946 ongoing_codegen.check_for_errors(tcx.sess);
948 assert_and_save_dep_graph(tcx);
// Normal exit: unwrap the handle so the abort-on-drop guard does not fire.
949 ongoing_codegen.into_inner()
952 /// A curious wrapper structure whose only purpose is to call `codegen_aborted`
953 /// when it's dropped abnormally.
955 /// In the process of working on rust-lang/rust#55238 a mysterious segfault was
956 /// stumbled upon. The segfault was never reproduced locally, but it was
957 /// suspected to be related to the fact that codegen worker threads were
958 /// sticking around by the time the main thread was exiting, causing issues.
960 /// This structure is an attempt to fix that issue where the `codegen_aborted`
961 /// message will block until all workers have finished. This should ensure that
962 /// even if the main codegen thread panics we'll wait for pending work to
963 /// complete before returning from the main thread, hopefully avoiding
966 /// If you see this comment in the code, then it means that this workaround
967 /// worked! We may yet one day track down the mysterious cause of that
// The `Option` lets `into_inner` and `Drop` take the handle out; `None` means
// it has already been taken.
969 struct AbortCodegenOnDrop(Option<OngoingCodegen>);
971 impl AbortCodegenOnDrop {
/// Takes the wrapped `OngoingCodegen` out, leaving `None` behind so the `Drop`
/// impl finds nothing to abort. Panics if the handle was already taken.
972 fn into_inner(mut self) -> OngoingCodegen {
973 self.0.take().unwrap()
// Lets the wrapper be used wherever a `&OngoingCodegen` is expected.
977 impl Deref for AbortCodegenOnDrop {
978 type Target = OngoingCodegen;
// Panics if the inner handle has already been taken.
980 fn deref(&self) -> &OngoingCodegen {
981 self.0.as_ref().unwrap()
// Mutable counterpart of the `Deref` impl.
985 impl DerefMut for AbortCodegenOnDrop {
// Panics if the inner handle has already been taken.
986 fn deref_mut(&mut self) -> &mut OngoingCodegen {
987 self.0.as_mut().unwrap()
// If the handle is still present at drop time, tell it that codegen was aborted.
991 impl Drop for AbortCodegenOnDrop {
// `take` yields `Some` only when `into_inner` was never called.
993 if let Some(codegen) = self.0.take() {
994 codegen.codegen_aborted();
// Runs the incremental-compilation dep-graph assertions and then saves the
// dep graph.
999 fn assert_and_save_dep_graph<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>) {
1002 || rustc_incremental::assert_dep_graph(tcx));
// The save step is labelled "serialize dep graph".
1005 "serialize dep graph",
1006 || rustc_incremental::save_dep_graph(tcx));
/// Builds a `CrateInfo` by querying `tcx` for the local crate and for every
/// crate returned by `tcx.crates()`.
1010 pub fn new(tcx: TyCtxt) -> CrateInfo {
// Start from defaults plus the local crate's libraries, link args and used
// crates; the per-crate maps are filled in by the loop below.
1011 let mut info = CrateInfo {
1012 panic_runtime: None,
1013 compiler_builtins: None,
1014 profiler_runtime: None,
1015 sanitizer_runtime: None,
1016 is_no_builtins: Default::default(),
1017 native_libraries: Default::default(),
1018 used_libraries: tcx.native_libraries(LOCAL_CRATE),
1019 link_args: tcx.link_args(LOCAL_CRATE),
1020 crate_name: Default::default(),
1021 used_crates_dynamic: cstore::used_crates(tcx, LinkagePreference::RequireDynamic),
1022 used_crates_static: cstore::used_crates(tcx, LinkagePreference::RequireStatic),
1023 used_crate_source: Default::default(),
1024 wasm_imports: Default::default(),
1025 lang_item_to_crate: Default::default(),
1026 missing_lang_items: Default::default(),
1028 let lang_items = tcx.lang_items();
// Wasm imports are only loaded for the `wasm32-unknown-unknown` target when at
// least one requested crate type is not an rlib.
1030 let load_wasm_items = tcx.sess.crate_types.borrow()
1032 .any(|c| *c != config::CrateType::Rlib) &&
1033 tcx.sess.opts.target_triple.triple() == "wasm32-unknown-unknown";
1035 if load_wasm_items {
1036 info.load_wasm_imports(tcx, LOCAL_CRATE);
1039 let crates = tcx.crates();
// Reserve space up front: each of these maps gets one entry per crate.
1041 let n_crates = crates.len();
1042 info.native_libraries.reserve(n_crates);
1043 info.crate_name.reserve(n_crates);
1044 info.used_crate_source.reserve(n_crates);
1045 info.missing_lang_items.reserve(n_crates);
1047 for &cnum in crates.iter() {
1048 info.native_libraries.insert(cnum, tcx.native_libraries(cnum));
1049 info.crate_name.insert(cnum, tcx.crate_name(cnum).to_string());
1050 info.used_crate_source.insert(cnum, tcx.used_crate_source(cnum));
// Remember which crate fills each special role; if several crates qualify,
// the last one visited wins.
1051 if tcx.is_panic_runtime(cnum) {
1052 info.panic_runtime = Some(cnum);
1054 if tcx.is_compiler_builtins(cnum) {
1055 info.compiler_builtins = Some(cnum);
1057 if tcx.is_profiler_runtime(cnum) {
1058 info.profiler_runtime = Some(cnum);
1060 if tcx.is_sanitizer_runtime(cnum) {
1061 info.sanitizer_runtime = Some(cnum);
1063 if tcx.is_no_builtins(cnum) {
1064 info.is_no_builtins.insert(cnum);
1066 if load_wasm_items {
1067 info.load_wasm_imports(tcx, cnum);
// For each lang item this crate reports as missing, record the crate that
// provides it when `lang_items.require` finds one.
1069 let missing = tcx.missing_lang_items(cnum);
1070 for &item in missing.iter() {
1071 if let Ok(id) = lang_items.require(item) {
1072 info.lang_item_to_crate.insert(item, id.krate);
1076 // No need to look for lang items that are whitelisted and don't
1077 // actually need to exist.
1078 let missing = missing.iter()
1080 .filter(|&l| !weak_lang_items::whitelisted(tcx, l))
1082 info.missing_lang_items.insert(cnum, missing);
// Adds one `wasm_imports` entry per item in crate `cnum`'s wasm import module
// map: the item's symbol name mapped to a clone of its module.
1088 fn load_wasm_imports(&mut self, tcx: TyCtxt, cnum: CrateNum) {
1089 self.wasm_imports.extend(tcx.wasm_import_module_map(cnum).iter().map(|(&id, module)| {
// The key is the symbol name of the item's monomorphic instance.
1090 let instance = Instance::mono(tcx, id);
1091 let import_name = tcx.symbol_name(instance);
1093 (import_name.to_string(), module.clone())
// Compiles the codegen unit named `cgu_name` as a dep-graph task and submits
// the resulting module to LLVM together with a cost estimate.
1098 fn compile_codegen_unit<'a, 'tcx>(tcx: TyCtxt<'a, 'tcx, 'tcx>,
1099 cgu_name: InternedString)
1101 let start_time = Instant::now();
1103 let dep_node = tcx.codegen_unit(cgu_name).codegen_dep_node(tcx);
1104 let ((stats, module), _) = tcx.dep_graph.with_task(dep_node,
1108 let time_to_codegen = start_time.elapsed();
1110 // We assume that the cost to run LLVM on a CGU is proportional to
1111 // the time we needed for codegenning it.
// The cost is the elapsed time expressed in nanoseconds.
1112 let cost = time_to_codegen.as_secs() * 1_000_000_000 +
1113 time_to_codegen.subsec_nanos() as u64;
1115 write::submit_codegened_module_to_llvm(tcx,
// Nested worker: builds the LLVM module for one codegen unit and returns it
// together with the stats collected while doing so.
1120 fn module_codegen<'a, 'tcx>(
1121 tcx: TyCtxt<'a, 'tcx, 'tcx>,
1122 cgu_name: InternedString)
1123 -> (Stats, ModuleCodegen)
1125 let cgu = tcx.codegen_unit(cgu_name);
1127 // Instantiate monomorphizations without filling out definitions yet...
1128 let llvm_module = ModuleLlvm::new(tcx.sess, &cgu_name.as_str());
1130 let cx = CodegenCx::new(tcx, cgu, &llvm_module);
1131 let mono_items = cx.codegen_unit
1132 .items_in_deterministic_order(cx.tcx);
1133 for &(mono_item, (linkage, visibility)) in &mono_items {
1134 mono_item.predefine(&cx, linkage, visibility);
1137 // ... and now that we have everything pre-defined, fill out those definitions.
1138 for &(mono_item, _) in &mono_items {
1139 mono_item.define(&cx);
1142 // If this codegen unit contains the main function, also create the
1144 maybe_create_entry_wrapper(&cx);
1146 // Run replace-all-uses-with for statics that need it
1147 for &(old_g, new_g) in cx.statics_to_rauw.borrow().iter() {
// Cast the new global to the old global's type, redirect all uses, then
// delete the old global.
1149 let bitcast = llvm::LLVMConstPointerCast(new_g, val_ty(old_g));
1150 llvm::LLVMReplaceAllUsesWith(old_g, bitcast);
1151 llvm::LLVMDeleteGlobal(old_g);
1155 // Create the llvm.used variable
1156 // This variable has type [N x i8*] and is stored in the llvm.metadata section
1157 if !cx.used_statics.borrow().is_empty() {
1158 let name = const_cstr!("llvm.used");
1159 let section = const_cstr!("llvm.metadata");
1160 let array = C_array(Type::i8(&cx).ptr_to(), &*cx.used_statics.borrow());
1163 let g = llvm::LLVMAddGlobal(cx.llmod,
1166 llvm::LLVMSetInitializer(g, array);
1167 llvm::LLVMRustSetLinkage(g, llvm::Linkage::AppendingLinkage);
1168 llvm::LLVMSetSection(g, section.as_ptr());
1172 // Finalize debuginfo
1173 if cx.sess().opts.debuginfo != DebugInfo::None {
1174 debuginfo::finalize(&cx);
// Hand the accumulated stats out of the context.
1177 cx.stats.into_inner()
1180 (stats, ModuleCodegen {
1181 name: cgu_name.to_string(),
1182 module_llvm: llvm_module,
1183 kind: ModuleKind::Regular,
/// Installs the `dllimport_foreign_items` and `is_dllimport_foreign_item`
/// providers on `providers`.
1188 pub fn provide_both(providers: &mut Providers) {
// Gathers foreign items reachable from the crate's native libraries and
// returns them wrapped in an `Lrc`.
1189 providers.dllimport_foreign_items = |tcx, krate| {
// Index the crate's foreign modules by their `def_id` for the lookup below.
1190 let module_map = tcx.foreign_modules(krate);
1191 let module_map = module_map.iter()
1192 .map(|lib| (lib.def_id, lib))
1193 .collect::<FxHashMap<_, _>>();
1195 let dllimports = tcx.native_libraries(krate)
// NOTE(review): the body of this branch is not visible here; presumably
// libraries whose kind is not `NativeUnknown` are rejected, confirm.
1198 if lib.kind != cstore::NativeLibraryKind::NativeUnknown {
// With no `cfg` the closure returns `true`; otherwise `attr::cfg_matches`
// is evaluated for that `cfg` against the session's parse state.
1201 let cfg = match lib.cfg {
1202 Some(ref cfg) => cfg,
1203 None => return true,
1205 attr::cfg_matches(cfg, &tcx.sess.parse_sess, None)
// Libraries without a `foreign_module` are dropped. The indexing assumes
// every remaining id is present in `module_map`. The foreign items of the
// resulting modules are flattened into one sequence of cloned items.
1207 .filter_map(|lib| lib.foreign_module)
1208 .map(|id| &module_map[&id])
1209 .flat_map(|module| module.foreign_items.iter().cloned())
1211 Lrc::new(dllimports)
// An item is reported as dllimport'ed when the collection computed for its
// own crate contains its `DefId`.
1214 providers.is_dllimport_foreign_item = |tcx, def_id| {
1215 tcx.dllimport_foreign_items(def_id.krate).contains(&def_id)
/// Converts a `Linkage` into the correspondingly named `llvm::Linkage`
/// variant (for example `Linkage::External` becomes
/// `llvm::Linkage::ExternalLinkage`).
1219 pub fn linkage_to_llvm(linkage: Linkage) -> llvm::Linkage {
1221 Linkage::External => llvm::Linkage::ExternalLinkage,
1222 Linkage::AvailableExternally => llvm::Linkage::AvailableExternallyLinkage,
1223 Linkage::LinkOnceAny => llvm::Linkage::LinkOnceAnyLinkage,
1224 Linkage::LinkOnceODR => llvm::Linkage::LinkOnceODRLinkage,
1225 Linkage::WeakAny => llvm::Linkage::WeakAnyLinkage,
1226 Linkage::WeakODR => llvm::Linkage::WeakODRLinkage,
1227 Linkage::Appending => llvm::Linkage::AppendingLinkage,
1228 Linkage::Internal => llvm::Linkage::InternalLinkage,
1229 Linkage::Private => llvm::Linkage::PrivateLinkage,
1230 Linkage::ExternalWeak => llvm::Linkage::ExternalWeakLinkage,
1231 Linkage::Common => llvm::Linkage::CommonLinkage,
// NOTE(review): the parameter is named `linkage` although its type is
// `Visibility`; `visibility` would be a clearer name.
/// Converts a `Visibility` into the `llvm::Visibility` variant of the same
/// name.
1235 pub fn visibility_to_llvm(linkage: Visibility) -> llvm::Visibility {
1237 Visibility::Default => llvm::Visibility::Default,
1238 Visibility::Hidden => llvm::Visibility::Hidden,
1239 Visibility::Protected => llvm::Visibility::Protected,
1243 // FIXME(mw): Anything that is produced via DepGraph::with_task() must implement
1244 // the HashStable trait. Normally DepGraph::with_task() calls are
1245 // hidden behind queries, but CGU creation is a special case in two
1246 // ways: (1) it's not a query and (2) CGUs are output nodes, so their
1247 // Fingerprints are not actually needed. It remains to be clarified
1248 // how exactly this case will be handled in the red/green system but
1249 // for now we content ourselves with providing a no-op HashStable
1250 // implementation for CGUs.
1251 mod temp_stable_hash_impls {
1252 use rustc_data_structures::stable_hasher::{StableHasherResult, StableHasher,
1256 impl<HCX> HashStable<HCX> for ModuleCodegen {
1257 fn hash_stable<W: StableHasherResult>(&self,
1259 _: &mut StableHasher<W>) {