rust/compiler/rustc_codegen_llvm/src/consts.rs

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

589 lines
26 KiB
Rust
Raw Normal View History

2022-07-12 13:52:35 -07:00
use std::ops::Range;
use rustc_abi::{
Align, AlignFromBytesError, HasDataLayout, Primitive, Scalar, Size, WrappingRange,
};
use rustc_codegen_ssa::common;
2020-03-29 17:19:48 +02:00
use rustc_codegen_ssa::traits::*;
use rustc_hir::LangItem;
use rustc_hir::def::DefKind;
2020-03-29 17:19:48 +02:00
use rustc_hir::def_id::DefId;
2020-03-29 16:41:09 +02:00
use rustc_middle::middle::codegen_fn_attrs::{CodegenFnAttrFlags, CodegenFnAttrs};
2020-03-29 17:19:48 +02:00
use rustc_middle::mir::interpret::{
Allocation, ConstAllocation, ErrorHandled, InitChunk, Pointer, Scalar as InterpScalar,
read_target_uint,
2020-03-29 17:19:48 +02:00
};
use rustc_middle::mir::mono::{Linkage, MonoItem};
use rustc_middle::ty::layout::{HasTypingEnv, LayoutOf};
use rustc_middle::ty::{self, Instance};
2020-03-29 16:41:09 +02:00
use rustc_middle::{bug, span_bug};
use tracing::{debug, instrument, trace};
use crate::common::{AsCCharPtr, CodegenCx};
use crate::errors::{
InvalidMinimumAlignmentNotPowerOfTwo, InvalidMinimumAlignmentTooLarge, SymbolAlreadyDefined,
};
use crate::llvm::{self, True};
2019-02-18 03:58:58 +09:00
use crate::type_::Type;
use crate::type_of::LayoutLlvmExt;
use crate::value::Value;
2019-12-24 17:38:22 -05:00
use crate::{base, debuginfo};
pub(crate) fn const_alloc_to_llvm<'ll>(
cx: &CodegenCx<'ll, '_>,
alloc: ConstAllocation<'_>,
is_static: bool,
) -> &'ll Value {
let alloc = alloc.inner();
// We expect that callers of const_alloc_to_llvm will instead directly codegen a pointer or
// integer for any &ZST where the ZST is a constant (i.e. not a static). We should never be
// producing empty LLVM allocations as they're just adding noise to binaries and forcing less
// optimal codegen.
//
// Statics have a guaranteed meaningful address so it's less clear that we want to do
// something like this; it's also harder.
if !is_static {
assert!(alloc.len() != 0);
}
let mut llvals = Vec::with_capacity(alloc.provenance().ptrs().len() + 1);
let dl = cx.data_layout();
let pointer_size = dl.pointer_size.bytes() as usize;
// Note: this function may call `inspect_with_uninit_and_ptr_outside_interpreter`, so `range`
// must be within the bounds of `alloc` and not contain or overlap a pointer provenance.
fn append_chunks_of_init_and_uninit_bytes<'ll, 'a, 'b>(
llvals: &mut Vec<&'ll Value>,
cx: &'a CodegenCx<'ll, 'b>,
alloc: &'a Allocation,
range: Range<usize>,
) {
2022-11-06 13:44:50 +01:00
let chunks = alloc.init_mask().range_as_init_chunks(range.clone().into());
let chunk_to_llval = move |chunk| match chunk {
InitChunk::Init(range) => {
let range = (range.start.bytes() as usize)..(range.end.bytes() as usize);
let bytes = alloc.inspect_with_uninit_and_ptr_outside_interpreter(range);
cx.const_bytes(bytes)
}
InitChunk::Uninit(range) => {
let len = range.end.bytes() - range.start.bytes();
cx.const_undef(cx.type_array(cx.type_i8(), len))
}
};
// Generating partially-uninit consts is limited to small numbers of chunks,
// to avoid the cost of generating large complex const expressions.
// For example, `[(u32, u8); 1024 * 1024]` contains uninit padding in each element, and
// would result in `{ [5 x i8] zeroinitializer, [3 x i8] undef, ...repeat 1M times... }`.
2023-02-01 12:52:06 -08:00
let max = cx.sess().opts.unstable_opts.uninit_const_chunk_threshold;
let allow_uninit_chunks = chunks.clone().take(max.saturating_add(1)).count() <= max;
2021-04-27 00:15:41 -04:00
if allow_uninit_chunks {
2021-04-27 00:15:41 -04:00
llvals.extend(chunks.map(chunk_to_llval));
} else {
// If this allocation contains any uninit bytes, codegen as if it was initialized
// (using some arbitrary value for uninit bytes).
let bytes = alloc.inspect_with_uninit_and_ptr_outside_interpreter(range);
llvals.push(cx.const_bytes(bytes));
}
}
let mut next_offset = 0;
for &(offset, prov) in alloc.provenance().ptrs().iter() {
let offset = offset.bytes();
assert_eq!(offset as usize as u64, offset);
let offset = offset as usize;
if offset > next_offset {
// This `inspect` is okay since we have checked that there is no provenance, it
// is within the bounds of the allocation, and it doesn't affect interpreter execution
// (we inspect the result after interpreter execution).
append_chunks_of_init_and_uninit_bytes(&mut llvals, cx, alloc, next_offset..offset);
}
let ptr_offset = read_target_uint(
dl.endian,
// This `inspect` is okay since it is within the bounds of the allocation, it doesn't
// affect interpreter execution (we inspect the result after interpreter execution),
// and we properly interpret the provenance as a relocation pointer offset.
alloc.inspect_with_uninit_and_ptr_outside_interpreter(offset..(offset + pointer_size)),
2019-12-24 17:38:22 -05:00
)
.expect("const_alloc_to_llvm: could not read relocation pointer")
as u64;
let address_space = cx.tcx.global_alloc(prov.alloc_id()).address_space(cx);
llvals.push(cx.scalar_to_backend(
InterpScalar::from_pointer(Pointer::new(prov, Size::from_bytes(ptr_offset)), &cx.tcx),
Scalar::Initialized {
value: Primitive::Pointer(address_space),
valid_range: WrappingRange::full(dl.pointer_size),
},
cx.type_ptr_ext(address_space),
));
next_offset = offset + pointer_size;
}
if alloc.len() >= next_offset {
let range = next_offset..alloc.len();
// This `inspect` is okay since we have check that it is after all provenance, it is
// within the bounds of the allocation, and it doesn't affect interpreter execution (we
// inspect the result after interpreter execution).
append_chunks_of_init_and_uninit_bytes(&mut llvals, cx, alloc, range);
}
2025-03-25 12:57:42 +00:00
// Avoid wrapping in a struct if there is only a single value. This ensures
// that LLVM is able to perform the string merging optimization if the constant
// is a valid C string. LLVM only considers bare arrays for this optimization,
// not arrays wrapped in a struct. LLVM handles this at:
// https://github.com/rust-lang/llvm-project/blob/acaea3d2bb8f351b740db7ebce7d7a40b9e21488/llvm/lib/Target/TargetLoweringObjectFile.cpp#L249-L280
if let &[data] = &*llvals { data } else { cx.const_struct(&llvals, true) }
}
fn codegen_static_initializer<'ll, 'tcx>(
cx: &CodegenCx<'ll, 'tcx>,
def_id: DefId,
) -> Result<(&'ll Value, ConstAllocation<'tcx>), ErrorHandled> {
let alloc = cx.tcx.eval_static_initializer(def_id)?;
Ok((const_alloc_to_llvm(cx, alloc, /*static*/ true), alloc))
}
fn set_global_alignment<'ll>(cx: &CodegenCx<'ll, '_>, gv: &'ll Value, mut align: Align) {
// The target may require greater alignment for globals than the type does.
// Note: GCC and Clang also allow `__attribute__((aligned))` on variables,
// which can force it to be smaller. Rust doesn't support this yet.
if let Some(min) = cx.sess().target.min_global_align {
match Align::from_bits(min) {
Ok(min) => align = align.max(min),
Err(err) => match err {
AlignFromBytesError::NotPowerOfTwo(align) => {
cx.sess().dcx().emit_err(InvalidMinimumAlignmentNotPowerOfTwo { align });
}
AlignFromBytesError::TooLarge(align) => {
cx.sess().dcx().emit_err(InvalidMinimumAlignmentTooLarge { align });
}
},
}
}
unsafe {
llvm::LLVMSetAlignment(gv, align.bytes() as u32);
}
}
fn check_and_apply_linkage<'ll, 'tcx>(
cx: &CodegenCx<'ll, 'tcx>,
attrs: &CodegenFnAttrs,
llty: &'ll Type,
sym: &str,
2022-07-12 13:52:35 -07:00
def_id: DefId,
) -> &'ll Value {
if let Some(linkage) = attrs.import_linkage {
debug!("get_static: sym={} linkage={:?}", sym, linkage);
// Declare a symbol `foo`. If `foo` is an extern_weak symbol, we declare
// an extern_weak function, otherwise a global with the desired linkage.
let g1 = if matches!(attrs.import_linkage, Some(Linkage::ExternalWeak)) {
// An `extern_weak` function is represented as an `Option<unsafe extern ...>`,
// we extract the function signature and declare it as an extern_weak function
// instead of an extern_weak i8.
let instance = Instance::mono(cx.tcx, def_id);
if let ty::Adt(struct_def, args) = instance.ty(cx.tcx, cx.typing_env()).kind()
&& cx.tcx.is_lang_item(struct_def.did(), LangItem::Option)
&& let ty::FnPtr(sig, header) = args.type_at(0).kind()
{
let fn_sig = sig.with(*header);
let fn_abi = cx.fn_abi_of_fn_ptr(fn_sig, ty::List::empty());
cx.declare_fn(sym, &fn_abi, None)
} else {
cx.declare_global(sym, cx.type_i8())
}
} else {
cx.declare_global(sym, cx.type_i8())
};
llvm::set_linkage(g1, base::linkage_to_llvm(linkage));
// Declare an internal global `extern_with_linkage_foo` which
// is initialized with the address of `foo`. If `foo` is
// discarded during linking (for example, if `foo` has weak
// linkage and there are no definitions), then
// `extern_with_linkage_foo` will instead be initialized to
// zero.
let mut real_name = "_rust_extern_with_linkage_".to_string();
real_name.push_str(sym);
let g2 = cx.define_global(&real_name, llty).unwrap_or_else(|| {
cx.sess().dcx().emit_fatal(SymbolAlreadyDefined {
span: cx.tcx.def_span(def_id),
symbol_name: sym,
})
});
llvm::set_linkage(g2, llvm::Linkage::InternalLinkage);
llvm::set_initializer(g2, g1);
g2
2022-07-12 13:52:35 -07:00
} else if cx.tcx.sess.target.arch == "x86"
2024-09-19 15:00:30 -07:00
&& common::is_mingw_gnu_toolchain(&cx.tcx.sess.target)
&& let Some(dllimport) = crate::common::get_dllimport(cx.tcx, def_id, sym)
2022-07-12 13:52:35 -07:00
{
2024-09-19 15:00:30 -07:00
cx.declare_global(&common::i686_decorated_name(dllimport, true, true, false), llty)
} else {
// Generate an external declaration.
// FIXME(nagisa): investigate whether it can be changed into define_global
2021-09-30 19:38:50 +02:00
cx.declare_global(sym, llty)
}
}
impl<'ll> CodegenCx<'ll, '_> {
pub(crate) fn const_bitcast(&self, val: &'ll Value, ty: &'ll Type) -> &'ll Value {
2019-12-24 17:38:22 -05:00
unsafe { llvm::LLVMConstBitCast(val, ty) }
2018-09-10 16:28:47 +02:00
}
2018-11-24 17:11:59 +01:00
2025-01-02 13:10:11 +01:00
pub(crate) fn const_pointercast(&self, val: &'ll Value, ty: &'ll Type) -> &'ll Value {
unsafe { llvm::LLVMConstPointerCast(val, ty) }
}
2025-01-24 00:37:05 +01:00
/// Create a global variable.
///
/// The returned global variable is a pointer in the default address space for globals.
/// Fails if a symbol with the given name already exists.
pub(crate) fn static_addr_of_mut(
2018-09-10 16:28:47 +02:00
&self,
cv: &'ll Value,
align: Align,
2018-09-10 16:28:47 +02:00
kind: Option<&str>,
) -> &'ll Value {
let gv = match kind {
Some(kind) if !self.tcx.sess.fewer_names() => {
let name = self.generate_local_symbol_name(kind);
let gv = self.define_global(&name, self.val_ty(cv)).unwrap_or_else(|| {
bug!("symbol `{}` is already defined", name);
});
llvm::set_linkage(gv, llvm::Linkage::PrivateLinkage);
gv
}
_ => self.define_private_global(self.val_ty(cv)),
};
llvm::set_initializer(gv, cv);
set_global_alignment(self, gv, align);
llvm::SetUnnamedAddress(gv, llvm::UnnamedAddr::Global);
gv
2018-09-10 16:28:47 +02:00
}
2025-01-24 00:37:05 +01:00
/// Create a global constant.
///
/// The returned global variable is a pointer in the default address space for globals.
2025-01-02 13:10:11 +01:00
pub(crate) fn static_addr_of_impl(
&self,
cv: &'ll Value,
align: Align,
kind: Option<&str>,
) -> &'ll Value {
if let Some(&gv) = self.const_globals.borrow().get(&cv) {
unsafe {
// Upgrade the alignment in cases where the same constant is used with different
// alignment requirements
let llalign = align.bytes() as u32;
if llalign > llvm::LLVMGetAlignment(gv) {
llvm::LLVMSetAlignment(gv, llalign);
}
}
return gv;
}
let gv = self.static_addr_of_mut(cv, align, kind);
unsafe {
llvm::LLVMSetGlobalConstant(gv, True);
}
self.const_globals.borrow_mut().insert(cv, gv);
gv
}
#[instrument(level = "debug", skip(self))]
pub(crate) fn get_static(&self, def_id: DefId) -> &'ll Value {
2018-09-10 16:28:47 +02:00
let instance = Instance::mono(self.tcx, def_id);
trace!(?instance);
let DefKind::Static { nested, .. } = self.tcx.def_kind(def_id) else { bug!() };
// Nested statics do not have a type, so pick a dummy type and let `codegen_static` figure
// out the llvm type from the actual evaluated initializer.
let llty = if nested {
self.type_i8()
} else {
let ty = instance.ty(self.tcx, self.typing_env());
trace!(?ty);
self.layout_of(ty).llvm_type(self)
};
self.get_static_inner(def_id, llty)
}
#[instrument(level = "debug", skip(self, llty))]
2024-09-18 10:21:02 +10:00
fn get_static_inner(&self, def_id: DefId, llty: &'ll Type) -> &'ll Value {
let instance = Instance::mono(self.tcx, def_id);
if let Some(&g) = self.instances.borrow().get(&instance) {
trace!("used cached value");
2018-09-10 16:28:47 +02:00
return g;
}
2019-12-24 17:38:22 -05:00
let defined_in_current_codegen_unit =
self.codegen_unit.items().contains_key(&MonoItem::Static(def_id));
assert!(
!defined_in_current_codegen_unit,
"consts::get_static() should always hit the cache for \
statics defined in the same CGU, but did not for `{def_id:?}`"
2019-12-24 17:38:22 -05:00
);
2018-09-10 16:28:47 +02:00
let sym = self.tcx.symbol_name(instance).name;
2021-02-02 15:38:51 +01:00
let fn_attrs = self.tcx.codegen_fn_attrs(def_id);
2018-09-10 16:28:47 +02:00
debug!(?sym, ?fn_attrs);
2018-09-10 16:28:47 +02:00
2021-02-04 11:17:01 +01:00
let g = if def_id.is_local() && !self.tcx.is_foreign_item(def_id) {
2021-02-02 15:38:51 +01:00
if let Some(g) = self.get_declared_value(sym) {
if self.val_ty(g) != self.type_ptr() {
2021-02-02 15:38:51 +01:00
span_bug!(self.tcx.def_span(def_id), "Conflicting types for static");
2018-09-10 16:28:47 +02:00
}
2021-02-02 15:38:51 +01:00
}
2018-09-10 16:28:47 +02:00
2021-02-02 15:38:51 +01:00
let g = self.declare_global(sym, llty);
2018-09-10 16:28:47 +02:00
2021-02-02 15:38:51 +01:00
if !self.tcx.is_reachable_non_generic(def_id) {
llvm::set_visibility(g, llvm::Visibility::Hidden);
2018-09-10 16:28:47 +02:00
}
g
} else {
check_and_apply_linkage(self, fn_attrs, llty, sym, def_id)
2021-02-02 15:38:51 +01:00
};
2018-09-10 16:28:47 +02:00
2021-02-02 15:38:51 +01:00
// Thread-local statics in some other crate need to *always* be linked
// against in a thread-local fashion, so we need to be sure to apply the
// thread-local attribute locally if it was present remotely. If we
// don't do this then linker errors can be generated where the linker
// complains that one object files has a thread local version of the
// symbol and another one doesn't.
if fn_attrs.flags.contains(CodegenFnAttrFlags::THREAD_LOCAL) {
llvm::set_thread_local_mode(g, self.tls_model);
}
2018-09-10 16:28:47 +02:00
let dso_local = self.assume_dso_local(g, true);
2021-02-04 11:17:01 +01:00
if !def_id.is_local() {
let needs_dll_storage_attr = self.use_dll_storage_attrs
&& !self.tcx.is_foreign_item(def_id)
// Local definitions can never be imported, so we must not apply
// the DLLImport annotation.
&& !dso_local
2024-03-20 18:54:01 +01:00
// Linker plugin ThinLTO doesn't create the self-dllimport Rust uses for rlibs
// as the code generation happens out of process. Instead we assume static linkage
// and disallow dynamic linking when linker plugin based LTO is enabled.
// Regular in-process ThinLTO doesn't need this workaround.
&& !self.tcx.sess.opts.cg.linker_plugin_lto.enabled();
2018-09-10 16:28:47 +02:00
// If this assertion triggers, there's something wrong with commandline
// argument validation.
assert!(
2019-12-24 17:38:22 -05:00
!(self.tcx.sess.opts.cg.linker_plugin_lto.enabled()
&& self.tcx.sess.target.is_like_windows
2019-12-24 17:38:22 -05:00
&& self.tcx.sess.opts.cg.prefer_dynamic)
);
2018-09-10 16:28:47 +02:00
if needs_dll_storage_attr {
// This item is external but not foreign, i.e., it originates from an external Rust
2018-09-10 16:28:47 +02:00
// crate. Since we don't know whether this crate will be linked dynamically or
// statically in the final application, we always mark such symbols as 'dllimport'.
// If final linkage happens to be static, we rely on compiler-emitted __imp_ stubs
// to make things work.
//
// However, in some scenarios we defer emission of statics to downstream
// crates, so there are cases where a static with an upstream DefId
// is actually present in the current crate. We can find out via the
// is_codegened_item query.
2018-11-07 12:08:41 +02:00
if !self.tcx.is_codegened_item(def_id) {
llvm::set_dllimport_storage_class(g);
2018-09-10 16:28:47 +02:00
}
}
2021-02-02 15:38:51 +01:00
}
2018-09-10 16:28:47 +02:00
if self.use_dll_storage_attrs
&& let Some(library) = self.tcx.native_library(def_id)
&& library.kind.is_dllimport()
{
2018-09-10 16:28:47 +02:00
// For foreign (native) libs we know the exact storage type to use.
llvm::set_dllimport_storage_class(g);
2013-06-21 18:46:34 -07:00
}
self.instances.borrow_mut().insert(instance, g);
2018-09-10 16:28:47 +02:00
g
}
fn codegen_static_item(&self, def_id: DefId) {
2018-09-10 16:28:47 +02:00
unsafe {
assert!(
llvm::LLVMGetInitializer(
self.instances.borrow().get(&Instance::mono(self.tcx, def_id)).unwrap()
)
.is_none()
);
2018-11-07 12:08:41 +02:00
let attrs = self.tcx.codegen_fn_attrs(def_id);
2018-09-10 16:28:47 +02:00
2022-02-19 00:48:49 +01:00
let Ok((v, alloc)) = codegen_static_initializer(self, def_id) else {
2018-09-10 16:28:47 +02:00
// Error has already been reported
2022-02-19 00:48:49 +01:00
return;
2018-09-10 16:28:47 +02:00
};
let alloc = alloc.inner();
2018-09-10 16:28:47 +02:00
let val_llty = self.val_ty(v);
let g = self.get_static_inner(def_id, val_llty);
2024-08-08 19:29:47 +08:00
let llty = llvm::LLVMGlobalGetValueType(g);
2018-09-10 16:28:47 +02:00
let g = if val_llty == llty {
g
} else {
// codegen_static_initializer creates the global value just from the
// `Allocation` data by generating one big struct value that is just
// all the bytes and pointers after each other. This will almost never
// match the type that the static was declared with. Unfortunately
// we can't just LLVMConstBitCast our way out of it because that has very
// specific rules on what can be cast. So instead of adding a new way to
// generate static initializers that match the static's type, we picked
// the easier option and retroactively change the type of the static item itself.
let name = llvm::get_value_name(g).to_vec();
llvm::set_value_name(g, b"");
2018-09-10 16:28:47 +02:00
let linkage = llvm::get_linkage(g);
let visibility = llvm::get_visibility(g);
2018-09-10 16:28:47 +02:00
let new_g = llvm::LLVMRustGetOrInsertGlobal(
2019-12-24 17:38:22 -05:00
self.llmod,
name.as_c_char_ptr(),
2019-12-24 17:38:22 -05:00
name.len(),
val_llty,
);
2018-09-10 16:28:47 +02:00
llvm::set_linkage(new_g, linkage);
llvm::set_visibility(new_g, visibility);
2018-09-10 16:28:47 +02:00
// The old global has had its name removed but is returned by
// get_static since it is in the instance cache. Provide an
// alternative lookup that points to the new global so that
// global_asm! can compute the correct mangled symbol name
// for the global.
self.renamed_statics.borrow_mut().insert(def_id, new_g);
2018-09-10 16:28:47 +02:00
// To avoid breaking any invariants, we leave around the old
// global for the moment; we'll replace all references to it
// with the new global later. (See base::codegen_backend.)
2018-11-07 12:08:41 +02:00
self.statics_to_rauw.borrow_mut().push((g, new_g));
2018-09-10 16:28:47 +02:00
new_g
};
set_global_alignment(self, g, alloc.align);
llvm::set_initializer(g, v);
2018-09-10 16:28:47 +02:00
self.assume_dso_local(g, true);
2021-05-14 03:47:41 +02:00
2024-03-11 18:39:23 +00:00
// Forward the allocation's mutability (picked by the const interner) to LLVM.
if alloc.mutability.is_not() {
2020-10-26 21:02:48 -04:00
llvm::LLVMSetGlobalConstant(g, llvm::True);
}
debuginfo::build_global_var_di_node(self, def_id, g);
2018-09-10 16:28:47 +02:00
if attrs.flags.contains(CodegenFnAttrFlags::THREAD_LOCAL) {
llvm::set_thread_local_mode(g, self.tls_model);
}
2018-09-10 16:28:47 +02:00
// Wasm statics with custom link sections get special treatment as they
// go into custom sections of the wasm executable. The exception to this
// is the `.init_array` section which are treated specially by the wasm linker.
if self.tcx.sess.target.is_like_wasm
&& attrs
.link_section
.map(|link_section| !link_section.as_str().starts_with(".init_array"))
.unwrap_or(true)
{
2018-09-10 16:28:47 +02:00
if let Some(section) = attrs.link_section {
2023-04-05 15:08:17 +03:00
let section = llvm::LLVMMDStringInContext2(
2018-11-07 12:08:41 +02:00
self.llcx,
section.as_str().as_c_char_ptr(),
2023-04-05 15:08:17 +03:00
section.as_str().len(),
2018-09-10 16:28:47 +02:00
);
assert!(alloc.provenance().ptrs().is_empty());
// The `inspect` method is okay here because we checked for provenance, and
// because we are doing this access to inspect the final interpreter state (not
// as part of the interpreter execution).
2019-12-24 17:38:22 -05:00
let bytes =
alloc.inspect_with_uninit_and_ptr_outside_interpreter(0..alloc.len());
2023-04-05 15:08:17 +03:00
let alloc =
llvm::LLVMMDStringInContext2(self.llcx, bytes.as_c_char_ptr(), bytes.len());
2018-09-10 16:28:47 +02:00
let data = [section, alloc];
2023-04-05 15:08:17 +03:00
let meta = llvm::LLVMMDNodeInContext2(self.llcx, data.as_ptr(), data.len());
let val = self.get_metadata_value(meta);
2018-09-10 16:28:47 +02:00
llvm::LLVMAddNamedMetadataOperand(
2018-11-07 12:08:41 +02:00
self.llmod,
c"wasm.custom_sections".as_ptr(),
2023-04-05 15:08:17 +03:00
val,
2018-09-10 16:28:47 +02:00
);
}
} else {
2021-09-30 19:38:50 +02:00
base::set_link_section(g, attrs);
}
base::set_variable_sanitizer_attrs(g, attrs);
2018-09-10 16:28:47 +02:00
if attrs.flags.contains(CodegenFnAttrFlags::USED) {
// `USED` and `USED_LINKER` can't be used together.
assert!(!attrs.flags.contains(CodegenFnAttrFlags::USED_LINKER));
// The semantics of #[used] in Rust only require the symbol to make it into the
// object file. It is explicitly allowed for the linker to strip the symbol if it
// is dead, which means we are allowed to use `llvm.compiler.used` instead of
// `llvm.used` here.
//
// Additionally, https://reviews.llvm.org/D97448 in LLVM 13 started emitting unique
// sections with SHF_GNU_RETAIN flag for llvm.used symbols, which may trigger bugs
// in the handling of `.init_array` (the static constructor list) in versions of
// the gold linker (prior to the one released with binutils 2.36).
//
// That said, we only ever emit these when compiling for ELF targets, unless
// `#[used(compiler)]` is explicitly requested. This is to avoid similar breakage
// on other targets, in particular MachO targets have *their* static constructor
// lists broken if `llvm.compiler.used` is emitted rather than `llvm.used`. However,
// that check happens when assigning the `CodegenFnAttrFlags` in
// `rustc_hir_analysis`, so we don't need to take care of it here.
self.add_compiler_used_global(g);
2018-09-10 16:28:47 +02:00
}
if attrs.flags.contains(CodegenFnAttrFlags::USED_LINKER) {
// `USED` and `USED_LINKER` can't be used together.
assert!(!attrs.flags.contains(CodegenFnAttrFlags::USED));
self.add_used_global(g);
}
add an #[used] attribute similar to GCC's __attribute((used))__. This attribute prevents LLVM from optimizing away a non-exported symbol, within a compilation unit (object file), when there are no references to it. This is better explained with an example: ``` #[used] static LIVE: i32 = 0; static REFERENCED: i32 = 0; static DEAD: i32 = 0; fn internal() {} pub fn exported() -> &'static i32 { &REFERENCED } ``` Without optimizations, LLVM pretty much preserves all the static variables and functions within the compilation unit. ``` $ rustc --crate-type=lib --emit=obj symbols.rs && nm -C symbols.o 0000000000000000 t drop::h1be0f8f27a2ba94a 0000000000000000 r symbols::REFERENCED::hb3bdfd46050bc84c 0000000000000000 r symbols::DEAD::hc2ea8f9bd06f380b 0000000000000000 r symbols::LIVE::h0970cf9889edb56e 0000000000000000 T symbols::exported::h6f096c2b1fc292b2 0000000000000000 t symbols::internal::h0ac1aadbc1e3a494 ``` With optimizations, LLVM will drop dead code. Here `internal` is dropped because it's not a exported function/symbol (i.e. not `pub`lic). `DEAD` is dropped for the same reason. `REFERENCED` is preserved, even though it's not exported, because it's referenced by the `exported` function. Finally, `LIVE` survives because of the `#[used]` attribute even though it's not exported or referenced. ``` $ rustc --crate-type=lib -C opt-level=3 --emit=obj symbols.rs && nm -C symbols.o 0000000000000000 r symbols::REFERENCED::hb3bdfd46050bc84c 0000000000000000 r symbols::LIVE::h0970cf9889edb56e 0000000000000000 T symbols::exported::h6f096c2b1fc292b2 ``` Note that the linker knows nothing about `#[used]` and will drop `LIVE` because no other object references to it. ``` $ echo 'fn main() {}' >> symbols.rs $ rustc symbols.rs && nm -C symbols | grep LIVE ``` At this time, `#[used]` only works on `static` variables.
2017-02-20 14:42:47 -05:00
}
}
}
impl<'ll> StaticCodegenMethods for CodegenCx<'ll, '_> {
2025-01-24 00:37:05 +01:00
/// Get a pointer to a global variable.
///
/// The pointer will always be in the default address space. If global variables default to a
/// different address space, an addrspacecast is inserted.
fn static_addr_of(&self, cv: &'ll Value, align: Align, kind: Option<&str>) -> &'ll Value {
2025-01-02 13:10:11 +01:00
let gv = self.static_addr_of_impl(cv, align, kind);
2025-01-24 00:37:05 +01:00
// static_addr_of_impl returns the bare global variable, which might not be in the default
// address space. Cast to the default address space if necessary.
2025-01-02 13:10:11 +01:00
self.const_pointercast(gv, self.type_ptr())
}
fn codegen_static(&self, def_id: DefId) {
self.codegen_static_item(def_id)
}
/// Add a global value to a list to be stored in the `llvm.used` variable, an array of ptr.
fn add_used_global(&self, global: &'ll Value) {
self.used_statics.borrow_mut().push(global);
}
/// Add a global value to a list to be stored in the `llvm.compiler.used` variable,
/// an array of ptr.
fn add_compiler_used_global(&self, global: &'ll Value) {
self.compiler_used_statics.borrow_mut().push(global);
}
}