rustc_codegen_llvm/
consts.rs

1use std::ops::Range;
2
3use rustc_abi::{Align, HasDataLayout, Primitive, Scalar, Size, WrappingRange};
4use rustc_codegen_ssa::common;
5use rustc_codegen_ssa::traits::*;
6use rustc_hir::LangItem;
7use rustc_hir::attrs::Linkage;
8use rustc_hir::def::DefKind;
9use rustc_hir::def_id::{DefId, LOCAL_CRATE};
10use rustc_middle::middle::codegen_fn_attrs::{CodegenFnAttrFlags, CodegenFnAttrs};
11use rustc_middle::mir::interpret::{
12    Allocation, ConstAllocation, ErrorHandled, InitChunk, Pointer, Scalar as InterpScalar,
13    read_target_uint,
14};
15use rustc_middle::mir::mono::MonoItem;
16use rustc_middle::ty::layout::{HasTypingEnv, LayoutOf};
17use rustc_middle::ty::{self, Instance};
18use rustc_middle::{bug, span_bug};
19use rustc_span::Symbol;
20use rustc_target::spec::Arch;
21use tracing::{debug, instrument, trace};
22
23use crate::common::CodegenCx;
24use crate::errors::SymbolAlreadyDefined;
25use crate::llvm::{self, Type, Value};
26use crate::type_of::LayoutLlvmExt;
27use crate::{base, debuginfo};
28
29pub(crate) fn const_alloc_to_llvm<'ll>(
30    cx: &CodegenCx<'ll, '_>,
31    alloc: &Allocation,
32    is_static: bool,
33) -> &'ll Value {
34    // We expect that callers of const_alloc_to_llvm will instead directly codegen a pointer or
35    // integer for any &ZST where the ZST is a constant (i.e. not a static). We should never be
36    // producing empty LLVM allocations as they're just adding noise to binaries and forcing less
37    // optimal codegen.
38    //
39    // Statics have a guaranteed meaningful address so it's less clear that we want to do
40    // something like this; it's also harder.
41    if !is_static {
42        assert!(alloc.len() != 0);
43    }
44    let mut llvals = Vec::with_capacity(alloc.provenance().ptrs().len() + 1);
45    let dl = cx.data_layout();
46    let pointer_size = dl.pointer_size();
47    let pointer_size_bytes = pointer_size.bytes() as usize;
48
49    // Note: this function may call `inspect_with_uninit_and_ptr_outside_interpreter`, so `range`
50    // must be within the bounds of `alloc` and not contain or overlap a pointer provenance.
51    fn append_chunks_of_init_and_uninit_bytes<'ll, 'a, 'b>(
52        llvals: &mut Vec<&'ll Value>,
53        cx: &'a CodegenCx<'ll, 'b>,
54        alloc: &'a Allocation,
55        range: Range<usize>,
56    ) {
57        let chunks = alloc.init_mask().range_as_init_chunks(range.clone().into());
58
59        let chunk_to_llval = move |chunk| match chunk {
60            InitChunk::Init(range) => {
61                let range = (range.start.bytes() as usize)..(range.end.bytes() as usize);
62                let bytes = alloc.inspect_with_uninit_and_ptr_outside_interpreter(range);
63                cx.const_bytes(bytes)
64            }
65            InitChunk::Uninit(range) => {
66                let len = range.end.bytes() - range.start.bytes();
67                cx.const_undef(cx.type_array(cx.type_i8(), len))
68            }
69        };
70
71        // Generating partially-uninit consts is limited to small numbers of chunks,
72        // to avoid the cost of generating large complex const expressions.
73        // For example, `[(u32, u8); 1024 * 1024]` contains uninit padding in each element, and
74        // would result in `{ [5 x i8] zeroinitializer, [3 x i8] undef, ...repeat 1M times... }`.
75        let max = cx.sess().opts.unstable_opts.uninit_const_chunk_threshold;
76        let allow_uninit_chunks = chunks.clone().take(max.saturating_add(1)).count() <= max;
77
78        if allow_uninit_chunks {
79            llvals.extend(chunks.map(chunk_to_llval));
80        } else {
81            // If this allocation contains any uninit bytes, codegen as if it was initialized
82            // (using some arbitrary value for uninit bytes).
83            let bytes = alloc.inspect_with_uninit_and_ptr_outside_interpreter(range);
84            llvals.push(cx.const_bytes(bytes));
85        }
86    }
87
88    let mut next_offset = 0;
89    for &(offset, prov) in alloc.provenance().ptrs().iter() {
90        let offset = offset.bytes();
91        assert_eq!(offset as usize as u64, offset);
92        let offset = offset as usize;
93        if offset > next_offset {
94            // This `inspect` is okay since we have checked that there is no provenance, it
95            // is within the bounds of the allocation, and it doesn't affect interpreter execution
96            // (we inspect the result after interpreter execution).
97            append_chunks_of_init_and_uninit_bytes(&mut llvals, cx, alloc, next_offset..offset);
98        }
99        let ptr_offset = read_target_uint(
100            dl.endian,
101            // This `inspect` is okay since it is within the bounds of the allocation, it doesn't
102            // affect interpreter execution (we inspect the result after interpreter execution),
103            // and we properly interpret the provenance as a relocation pointer offset.
104            alloc.inspect_with_uninit_and_ptr_outside_interpreter(
105                offset..(offset + pointer_size_bytes),
106            ),
107        )
108        .expect("const_alloc_to_llvm: could not read relocation pointer")
109            as u64;
110
111        let address_space = cx.tcx.global_alloc(prov.alloc_id()).address_space(cx);
112
113        llvals.push(cx.scalar_to_backend(
114            InterpScalar::from_pointer(Pointer::new(prov, Size::from_bytes(ptr_offset)), &cx.tcx),
115            Scalar::Initialized {
116                value: Primitive::Pointer(address_space),
117                valid_range: WrappingRange::full(pointer_size),
118            },
119            cx.type_ptr_ext(address_space),
120        ));
121        next_offset = offset + pointer_size_bytes;
122    }
123    if alloc.len() >= next_offset {
124        let range = next_offset..alloc.len();
125        // This `inspect` is okay since we have check that it is after all provenance, it is
126        // within the bounds of the allocation, and it doesn't affect interpreter execution (we
127        // inspect the result after interpreter execution).
128        append_chunks_of_init_and_uninit_bytes(&mut llvals, cx, alloc, range);
129    }
130
131    // Avoid wrapping in a struct if there is only a single value. This ensures
132    // that LLVM is able to perform the string merging optimization if the constant
133    // is a valid C string. LLVM only considers bare arrays for this optimization,
134    // not arrays wrapped in a struct. LLVM handles this at:
135    // https://github.com/rust-lang/llvm-project/blob/acaea3d2bb8f351b740db7ebce7d7a40b9e21488/llvm/lib/Target/TargetLoweringObjectFile.cpp#L249-L280
136    if let &[data] = &*llvals { data } else { cx.const_struct(&llvals, true) }
137}
138
139fn codegen_static_initializer<'ll, 'tcx>(
140    cx: &CodegenCx<'ll, 'tcx>,
141    def_id: DefId,
142) -> Result<(&'ll Value, ConstAllocation<'tcx>), ErrorHandled> {
143    let alloc = cx.tcx.eval_static_initializer(def_id)?;
144    Ok((const_alloc_to_llvm(cx, alloc.inner(), /*static*/ true), alloc))
145}
146
147fn set_global_alignment<'ll>(cx: &CodegenCx<'ll, '_>, gv: &'ll Value, mut align: Align) {
148    // The target may require greater alignment for globals than the type does.
149    // Note: GCC and Clang also allow `__attribute__((aligned))` on variables,
150    // which can force it to be smaller. Rust doesn't support this yet.
151    if let Some(min_global) = cx.sess().target.min_global_align {
152        align = Ord::max(align, min_global);
153    }
154    llvm::set_alignment(gv, align);
155}
156
157fn check_and_apply_linkage<'ll, 'tcx>(
158    cx: &CodegenCx<'ll, 'tcx>,
159    attrs: &CodegenFnAttrs,
160    llty: &'ll Type,
161    sym: &str,
162    def_id: DefId,
163) -> &'ll Value {
164    if let Some(linkage) = attrs.import_linkage {
165        debug!("get_static: sym={} linkage={:?}", sym, linkage);
166
167        // Declare a symbol `foo`. If `foo` is an extern_weak symbol, we declare
168        // an extern_weak function, otherwise a global with the desired linkage.
169        let g1 = if matches!(attrs.import_linkage, Some(Linkage::ExternalWeak)) {
170            // An `extern_weak` function is represented as an `Option<unsafe extern ...>`,
171            // we extract the function signature and declare it as an extern_weak function
172            // instead of an extern_weak i8.
173            let instance = Instance::mono(cx.tcx, def_id);
174            if let ty::Adt(struct_def, args) = instance.ty(cx.tcx, cx.typing_env()).kind()
175                && cx.tcx.is_lang_item(struct_def.did(), LangItem::Option)
176                && let ty::FnPtr(sig, header) = args.type_at(0).kind()
177            {
178                let fn_sig = sig.with(*header);
179
180                let fn_abi = cx.fn_abi_of_fn_ptr(fn_sig, ty::List::empty());
181                cx.declare_fn(sym, &fn_abi, None)
182            } else {
183                cx.declare_global(sym, cx.type_i8())
184            }
185        } else {
186            cx.declare_global(sym, cx.type_i8())
187        };
188        llvm::set_linkage(g1, base::linkage_to_llvm(linkage));
189
190        // Normally this is done in `get_static_inner`, but when as we generate an internal global,
191        // it will apply the dso_local to the internal global instead, so do it here, too.
192        cx.assume_dso_local(g1, true);
193
194        // Declare an internal global `extern_with_linkage_foo` which
195        // is initialized with the address of `foo`. If `foo` is
196        // discarded during linking (for example, if `foo` has weak
197        // linkage and there are no definitions), then
198        // `extern_with_linkage_foo` will instead be initialized to
199        // zero.
200        let real_name =
201            format!("_rust_extern_with_linkage_{:016x}_{sym}", cx.tcx.stable_crate_id(LOCAL_CRATE));
202        let g2 = cx.define_global(&real_name, llty).unwrap_or_else(|| {
203            cx.sess().dcx().emit_fatal(SymbolAlreadyDefined {
204                span: cx.tcx.def_span(def_id),
205                symbol_name: sym,
206            })
207        });
208        llvm::set_linkage(g2, llvm::Linkage::InternalLinkage);
209        llvm::set_initializer(g2, g1);
210        g2
211    } else if cx.tcx.sess.target.arch == Arch::X86
212        && common::is_mingw_gnu_toolchain(&cx.tcx.sess.target)
213        && let Some(dllimport) = crate::common::get_dllimport(cx.tcx, def_id, sym)
214    {
215        cx.declare_global(&common::i686_decorated_name(dllimport, true, true, false), llty)
216    } else {
217        // Generate an external declaration.
218        // FIXME(nagisa): investigate whether it can be changed into define_global
219        cx.declare_global(sym, llty)
220    }
221}
222
223impl<'ll> CodegenCx<'ll, '_> {
224    pub(crate) fn const_bitcast(&self, val: &'ll Value, ty: &'ll Type) -> &'ll Value {
225        unsafe { llvm::LLVMConstBitCast(val, ty) }
226    }
227
228    pub(crate) fn const_pointercast(&self, val: &'ll Value, ty: &'ll Type) -> &'ll Value {
229        unsafe { llvm::LLVMConstPointerCast(val, ty) }
230    }
231
232    /// Create a global variable.
233    ///
234    /// The returned global variable is a pointer in the default address space for globals.
235    /// Fails if a symbol with the given name already exists.
236    pub(crate) fn static_addr_of_mut(
237        &self,
238        cv: &'ll Value,
239        align: Align,
240        kind: Option<&str>,
241    ) -> &'ll Value {
242        let gv = match kind {
243            Some(kind) if !self.tcx.sess.fewer_names() => {
244                let name = self.generate_local_symbol_name(kind);
245                let gv = self.define_global(&name, self.val_ty(cv)).unwrap_or_else(|| {
246                    bug!("symbol `{}` is already defined", name);
247                });
248                gv
249            }
250            _ => self.define_global("", self.val_ty(cv)).unwrap_or_else(|| {
251                bug!("anonymous global symbol is already defined");
252            }),
253        };
254        llvm::set_linkage(gv, llvm::Linkage::PrivateLinkage);
255        llvm::set_initializer(gv, cv);
256        set_global_alignment(self, gv, align);
257        llvm::set_unnamed_address(gv, llvm::UnnamedAddr::Global);
258        gv
259    }
260
261    /// Create a global constant.
262    ///
263    /// The returned global variable is a pointer in the default address space for globals.
264    pub(crate) fn static_addr_of_impl(
265        &self,
266        cv: &'ll Value,
267        align: Align,
268        kind: Option<&str>,
269    ) -> &'ll Value {
270        if let Some(&gv) = self.const_globals.borrow().get(&cv) {
271            unsafe {
272                // Upgrade the alignment in cases where the same constant is used with different
273                // alignment requirements
274                let llalign = align.bytes() as u32;
275                if llalign > llvm::LLVMGetAlignment(gv) {
276                    llvm::LLVMSetAlignment(gv, llalign);
277                }
278            }
279            return gv;
280        }
281        let gv = self.static_addr_of_mut(cv, align, kind);
282        llvm::set_global_constant(gv, true);
283
284        self.const_globals.borrow_mut().insert(cv, gv);
285        gv
286    }
287
288    #[instrument(level = "debug", skip(self))]
289    pub(crate) fn get_static(&self, def_id: DefId) -> &'ll Value {
290        let instance = Instance::mono(self.tcx, def_id);
291        trace!(?instance);
292
293        let DefKind::Static { nested, .. } = self.tcx.def_kind(def_id) else { bug!() };
294        // Nested statics do not have a type, so pick a dummy type and let `codegen_static` figure
295        // out the llvm type from the actual evaluated initializer.
296        let llty = if nested {
297            self.type_i8()
298        } else {
299            let ty = instance.ty(self.tcx, self.typing_env());
300            trace!(?ty);
301            self.layout_of(ty).llvm_type(self)
302        };
303        self.get_static_inner(def_id, llty)
304    }
305
306    #[instrument(level = "debug", skip(self, llty))]
307    fn get_static_inner(&self, def_id: DefId, llty: &'ll Type) -> &'ll Value {
308        let instance = Instance::mono(self.tcx, def_id);
309        if let Some(&g) = self.instances.borrow().get(&instance) {
310            trace!("used cached value");
311            return g;
312        }
313
314        let defined_in_current_codegen_unit =
315            self.codegen_unit.items().contains_key(&MonoItem::Static(def_id));
316        assert!(
317            !defined_in_current_codegen_unit,
318            "consts::get_static() should always hit the cache for \
319                 statics defined in the same CGU, but did not for `{def_id:?}`"
320        );
321
322        let sym = self.tcx.symbol_name(instance).name;
323        let fn_attrs = self.tcx.codegen_fn_attrs(def_id);
324
325        debug!(?sym, ?fn_attrs);
326
327        let g = if def_id.is_local() && !self.tcx.is_foreign_item(def_id) {
328            if let Some(g) = self.get_declared_value(sym) {
329                if self.val_ty(g) != self.type_ptr() {
330                    span_bug!(self.tcx.def_span(def_id), "Conflicting types for static");
331                }
332            }
333
334            let g = self.declare_global(sym, llty);
335
336            if !self.tcx.is_reachable_non_generic(def_id) {
337                llvm::set_visibility(g, llvm::Visibility::Hidden);
338            }
339
340            g
341        } else if let Some(classname) = fn_attrs.objc_class {
342            self.get_objc_classref(classname)
343        } else if let Some(methname) = fn_attrs.objc_selector {
344            self.get_objc_selref(methname)
345        } else {
346            check_and_apply_linkage(self, fn_attrs, llty, sym, def_id)
347        };
348
349        // Thread-local statics in some other crate need to *always* be linked
350        // against in a thread-local fashion, so we need to be sure to apply the
351        // thread-local attribute locally if it was present remotely. If we
352        // don't do this then linker errors can be generated where the linker
353        // complains that one object files has a thread local version of the
354        // symbol and another one doesn't.
355        if fn_attrs.flags.contains(CodegenFnAttrFlags::THREAD_LOCAL) {
356            llvm::set_thread_local_mode(g, self.tls_model);
357        }
358
359        let dso_local = self.assume_dso_local(g, true);
360
361        if !def_id.is_local() {
362            let needs_dll_storage_attr = self.use_dll_storage_attrs
363                && !self.tcx.is_foreign_item(def_id)
364                // Local definitions can never be imported, so we must not apply
365                // the DLLImport annotation.
366                && !dso_local
367                // Linker plugin ThinLTO doesn't create the self-dllimport Rust uses for rlibs
368                // as the code generation happens out of process. Instead we assume static linkage
369                // and disallow dynamic linking when linker plugin based LTO is enabled.
370                // Regular in-process ThinLTO doesn't need this workaround.
371                && !self.tcx.sess.opts.cg.linker_plugin_lto.enabled();
372
373            // If this assertion triggers, there's something wrong with commandline
374            // argument validation.
375            assert!(
376                !(self.tcx.sess.opts.cg.linker_plugin_lto.enabled()
377                    && self.tcx.sess.target.is_like_windows
378                    && self.tcx.sess.opts.cg.prefer_dynamic)
379            );
380
381            if needs_dll_storage_attr {
382                // This item is external but not foreign, i.e., it originates from an external Rust
383                // crate. Since we don't know whether this crate will be linked dynamically or
384                // statically in the final application, we always mark such symbols as 'dllimport'.
385                // If final linkage happens to be static, we rely on compiler-emitted __imp_ stubs
386                // to make things work.
387                //
388                // However, in some scenarios we defer emission of statics to downstream
389                // crates, so there are cases where a static with an upstream DefId
390                // is actually present in the current crate. We can find out via the
391                // is_codegened_item query.
392                if !self.tcx.is_codegened_item(def_id) {
393                    llvm::set_dllimport_storage_class(g);
394                }
395            }
396        }
397
398        if self.use_dll_storage_attrs
399            && let Some(library) = self.tcx.native_library(def_id)
400            && library.kind.is_dllimport()
401        {
402            // For foreign (native) libs we know the exact storage type to use.
403            llvm::set_dllimport_storage_class(g);
404        }
405
406        self.instances.borrow_mut().insert(instance, g);
407        g
408    }
409
410    fn codegen_static_item(&mut self, def_id: DefId) {
411        assert!(
412            llvm::LLVMGetInitializer(
413                self.instances.borrow().get(&Instance::mono(self.tcx, def_id)).unwrap()
414            )
415            .is_none()
416        );
417        let attrs = self.tcx.codegen_fn_attrs(def_id);
418
419        let Ok((v, alloc)) = codegen_static_initializer(self, def_id) else {
420            // Error has already been reported
421            return;
422        };
423        let alloc = alloc.inner();
424
425        let val_llty = self.val_ty(v);
426
427        let g = self.get_static_inner(def_id, val_llty);
428        let llty = self.get_type_of_global(g);
429
430        let g = if val_llty == llty {
431            g
432        } else {
433            // codegen_static_initializer creates the global value just from the
434            // `Allocation` data by generating one big struct value that is just
435            // all the bytes and pointers after each other. This will almost never
436            // match the type that the static was declared with. Unfortunately
437            // we can't just LLVMConstBitCast our way out of it because that has very
438            // specific rules on what can be cast. So instead of adding a new way to
439            // generate static initializers that match the static's type, we picked
440            // the easier option and retroactively change the type of the static item itself.
441            let name = String::from_utf8(llvm::get_value_name(g))
442                .expect("we declare our statics with a utf8-valid name");
443            llvm::set_value_name(g, b"");
444
445            let linkage = llvm::get_linkage(g);
446            let visibility = llvm::get_visibility(g);
447
448            let new_g = self.declare_global(&name, val_llty);
449
450            llvm::set_linkage(new_g, linkage);
451            llvm::set_visibility(new_g, visibility);
452
453            // The old global has had its name removed but is returned by
454            // get_static since it is in the instance cache. Provide an
455            // alternative lookup that points to the new global so that
456            // global_asm! can compute the correct mangled symbol name
457            // for the global.
458            self.renamed_statics.borrow_mut().insert(def_id, new_g);
459
460            // To avoid breaking any invariants, we leave around the old
461            // global for the moment; we'll replace all references to it
462            // with the new global later. (See base::codegen_backend.)
463            self.statics_to_rauw.borrow_mut().push((g, new_g));
464            new_g
465        };
466
467        // NOTE: Alignment from attributes has already been applied to the allocation.
468        set_global_alignment(self, g, alloc.align);
469        llvm::set_initializer(g, v);
470
471        self.assume_dso_local(g, true);
472
473        // Forward the allocation's mutability (picked by the const interner) to LLVM.
474        if alloc.mutability.is_not() {
475            llvm::set_global_constant(g, true);
476        }
477
478        debuginfo::build_global_var_di_node(self, def_id, g);
479
480        if attrs.flags.contains(CodegenFnAttrFlags::THREAD_LOCAL) {
481            llvm::set_thread_local_mode(g, self.tls_model);
482        }
483
484        // Wasm statics with custom link sections get special treatment as they
485        // go into custom sections of the wasm executable. The exception to this
486        // is the `.init_array` section which are treated specially by the wasm linker.
487        if self.tcx.sess.target.is_like_wasm
488            && attrs
489                .link_section
490                .map(|link_section| !link_section.as_str().starts_with(".init_array"))
491                .unwrap_or(true)
492        {
493            if let Some(section) = attrs.link_section {
494                let section = self.create_metadata(section.as_str().as_bytes());
495                assert!(alloc.provenance().ptrs().is_empty());
496
497                // The `inspect` method is okay here because we checked for provenance, and
498                // because we are doing this access to inspect the final interpreter state (not
499                // as part of the interpreter execution).
500                let bytes = alloc.inspect_with_uninit_and_ptr_outside_interpreter(0..alloc.len());
501                let alloc = self.create_metadata(bytes);
502                let data = [section, alloc];
503                self.module_add_named_metadata_node(self.llmod(), c"wasm.custom_sections", &data);
504            }
505        } else {
506            base::set_link_section(g, attrs);
507        }
508
509        base::set_variable_sanitizer_attrs(g, attrs);
510
511        if attrs.flags.contains(CodegenFnAttrFlags::USED_COMPILER) {
512            // `USED` and `USED_LINKER` can't be used together.
513            assert!(!attrs.flags.contains(CodegenFnAttrFlags::USED_LINKER));
514
515            // The semantics of #[used] in Rust only require the symbol to make it into the
516            // object file. It is explicitly allowed for the linker to strip the symbol if it
517            // is dead, which means we are allowed to use `llvm.compiler.used` instead of
518            // `llvm.used` here.
519            //
520            // Additionally, https://reviews.llvm.org/D97448 in LLVM 13 started emitting unique
521            // sections with SHF_GNU_RETAIN flag for llvm.used symbols, which may trigger bugs
522            // in the handling of `.init_array` (the static constructor list) in versions of
523            // the gold linker (prior to the one released with binutils 2.36).
524            //
525            // That said, we only ever emit these when `#[used(compiler)]` is explicitly
526            // requested. This is to avoid similar breakage on other targets, in particular
527            // MachO targets have *their* static constructor lists broken if `llvm.compiler.used`
528            // is emitted rather than `llvm.used`. However, that check happens when assigning
529            // the `CodegenFnAttrFlags` in the `codegen_fn_attrs` query, so we don't need to
530            // take care of it here.
531            self.add_compiler_used_global(g);
532        }
533        if attrs.flags.contains(CodegenFnAttrFlags::USED_LINKER) {
534            // `USED` and `USED_LINKER` can't be used together.
535            assert!(!attrs.flags.contains(CodegenFnAttrFlags::USED_COMPILER));
536
537            self.add_used_global(g);
538        }
539    }
540
541    /// Add a global value to a list to be stored in the `llvm.used` variable, an array of ptr.
542    pub(crate) fn add_used_global(&mut self, global: &'ll Value) {
543        self.used_statics.push(global);
544    }
545
546    /// Add a global value to a list to be stored in the `llvm.compiler.used` variable,
547    /// an array of ptr.
548    pub(crate) fn add_compiler_used_global(&self, global: &'ll Value) {
549        self.compiler_used_statics.borrow_mut().push(global);
550    }
551
552    // We do our best here to match what Clang does when compiling Objective-C natively.
553    // See Clang's `CGObjCCommonMac::CreateCStringLiteral`:
554    // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L4134
555    fn define_objc_classname(&self, classname: &str) -> &'ll Value {
556        assert_eq!(self.objc_abi_version(), 1);
557
558        let llval = self.null_terminate_const_bytes(classname.as_bytes());
559        let llty = self.val_ty(llval);
560        let sym = self.generate_local_symbol_name("OBJC_CLASS_NAME_");
561        let g = self.define_global(&sym, llty).unwrap_or_else(|| {
562            bug!("symbol `{}` is already defined", sym);
563        });
564        set_global_alignment(self, g, self.tcx.data_layout.i8_align);
565        llvm::set_initializer(g, llval);
566        llvm::set_linkage(g, llvm::Linkage::PrivateLinkage);
567        llvm::set_section(g, c"__TEXT,__cstring,cstring_literals");
568        llvm::LLVMSetGlobalConstant(g, llvm::TRUE);
569        llvm::LLVMSetUnnamedAddress(g, llvm::UnnamedAddr::Global);
570        self.add_compiler_used_global(g);
571
572        g
573    }
574
575    // We do our best here to match what Clang does when compiling Objective-C natively.
576    // See Clang's `ObjCNonFragileABITypesHelper`:
577    // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L6052
578    fn get_objc_class_t(&self) -> &'ll Type {
579        if let Some(class_t) = self.objc_class_t.get() {
580            return class_t;
581        }
582
583        assert_eq!(self.objc_abi_version(), 2);
584
585        // struct _class_t {
586        //     struct _class_t* isa;
587        //     struct _class_t* const superclass;
588        //     void* cache;
589        //     IMP* vtable;
590        //     struct class_ro_t* ro;
591        // }
592
593        let class_t = self.type_named_struct("struct._class_t");
594        let els = [self.type_ptr(); 5];
595        let packed = false;
596        self.set_struct_body(class_t, &els, packed);
597
598        self.objc_class_t.set(Some(class_t));
599        class_t
600    }
601
602    // We do our best here to match what Clang does when compiling Objective-C natively. We
603    // deduplicate references within a CGU, but we need a reference definition in each referencing
604    // CGU. All attempts at using external references to a single reference definition result in
605    // linker errors.
606    fn get_objc_classref(&self, classname: Symbol) -> &'ll Value {
607        let mut classrefs = self.objc_classrefs.borrow_mut();
608        if let Some(classref) = classrefs.get(&classname).copied() {
609            return classref;
610        }
611
612        let g = match self.objc_abi_version() {
613            1 => {
614                // See Clang's `CGObjCMac::EmitClassRefFromId`:
615                // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L5205
616                let llval = self.define_objc_classname(classname.as_str());
617                let llty = self.type_ptr();
618                let sym = self.generate_local_symbol_name("OBJC_CLASS_REFERENCES_");
619                let g = self.define_global(&sym, llty).unwrap_or_else(|| {
620                    bug!("symbol `{}` is already defined", sym);
621                });
622                set_global_alignment(self, g, self.tcx.data_layout.pointer_align().abi);
623                llvm::set_initializer(g, llval);
624                llvm::set_linkage(g, llvm::Linkage::PrivateLinkage);
625                llvm::set_section(g, c"__OBJC,__cls_refs,literal_pointers,no_dead_strip");
626                self.add_compiler_used_global(g);
627                g
628            }
629            2 => {
630                // See Clang's `CGObjCNonFragileABIMac::EmitClassRefFromId`:
631                // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L7423
632                let llval = {
633                    let extern_sym = format!("OBJC_CLASS_$_{}", classname.as_str());
634                    let extern_llty = self.get_objc_class_t();
635                    self.declare_global(&extern_sym, extern_llty)
636                };
637                let llty = self.type_ptr();
638                let sym = self.generate_local_symbol_name("OBJC_CLASSLIST_REFERENCES_$_");
639                let g = self.define_global(&sym, llty).unwrap_or_else(|| {
640                    bug!("symbol `{}` is already defined", sym);
641                });
642                set_global_alignment(self, g, self.tcx.data_layout.pointer_align().abi);
643                llvm::set_initializer(g, llval);
644                llvm::set_linkage(g, llvm::Linkage::InternalLinkage);
645                llvm::set_section(g, c"__DATA,__objc_classrefs,regular,no_dead_strip");
646                self.add_compiler_used_global(g);
647                g
648            }
649            _ => unreachable!(),
650        };
651
652        classrefs.insert(classname, g);
653        g
654    }
655
656    // We do our best here to match what Clang does when compiling Objective-C natively. We
657    // deduplicate references within a CGU, but we need a reference definition in each referencing
658    // CGU. All attempts at using external references to a single reference definition result in
659    // linker errors.
660    //
661    // Newer versions of Apple Clang generate calls to `@"objc_msgSend$methname"` selector stub
662    // functions. We don't currently do that. The code we generate is closer to what Apple Clang
663    // generates with the `-fno-objc-msgsend-selector-stubs` option.
664    fn get_objc_selref(&self, methname: Symbol) -> &'ll Value {
665        let mut selrefs = self.objc_selrefs.borrow_mut();
666        if let Some(selref) = selrefs.get(&methname).copied() {
667            return selref;
668        }
669
670        let abi_version = self.objc_abi_version();
671
672        // See Clang's `CGObjCCommonMac::CreateCStringLiteral`:
673        // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L4134
674        let methname_llval = self.null_terminate_const_bytes(methname.as_str().as_bytes());
675        let methname_llty = self.val_ty(methname_llval);
676        let methname_sym = self.generate_local_symbol_name("OBJC_METH_VAR_NAME_");
677        let methname_g = self.define_global(&methname_sym, methname_llty).unwrap_or_else(|| {
678            bug!("symbol `{}` is already defined", methname_sym);
679        });
680        set_global_alignment(self, methname_g, self.tcx.data_layout.i8_align);
681        llvm::set_initializer(methname_g, methname_llval);
682        llvm::set_linkage(methname_g, llvm::Linkage::PrivateLinkage);
683        llvm::set_section(
684            methname_g,
685            match abi_version {
686                1 => c"__TEXT,__cstring,cstring_literals",
687                2 => c"__TEXT,__objc_methname,cstring_literals",
688                _ => unreachable!(),
689            },
690        );
691        llvm::LLVMSetGlobalConstant(methname_g, llvm::TRUE);
692        llvm::LLVMSetUnnamedAddress(methname_g, llvm::UnnamedAddr::Global);
693        self.add_compiler_used_global(methname_g);
694
695        // See Clang's `CGObjCMac::EmitSelectorAddr`:
696        // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L5243
697        // And Clang's `CGObjCNonFragileABIMac::EmitSelectorAddr`:
698        // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L7586
699        let selref_llval = methname_g;
700        let selref_llty = self.type_ptr();
701        let selref_sym = self.generate_local_symbol_name("OBJC_SELECTOR_REFERENCES_");
702        let selref_g = self.define_global(&selref_sym, selref_llty).unwrap_or_else(|| {
703            bug!("symbol `{}` is already defined", selref_sym);
704        });
705        set_global_alignment(self, selref_g, self.tcx.data_layout.pointer_align().abi);
706        llvm::set_initializer(selref_g, selref_llval);
707        llvm::set_externally_initialized(selref_g, true);
708        llvm::set_linkage(
709            selref_g,
710            match abi_version {
711                1 => llvm::Linkage::PrivateLinkage,
712                2 => llvm::Linkage::InternalLinkage,
713                _ => unreachable!(),
714            },
715        );
716        llvm::set_section(
717            selref_g,
718            match abi_version {
719                1 => c"__OBJC,__message_refs,literal_pointers,no_dead_strip",
720                2 => c"__DATA,__objc_selrefs,literal_pointers,no_dead_strip",
721                _ => unreachable!(),
722            },
723        );
724        self.add_compiler_used_global(selref_g);
725
726        selrefs.insert(methname, selref_g);
727        selref_g
728    }
729
730    // We do our best here to match what Clang does when compiling Objective-C natively.
731    // See Clang's `ObjCTypesHelper`:
732    // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L5936
733    // And Clang's `CGObjCMac::EmitModuleInfo`:
734    // https://github.com/llvm/llvm-project/blob/llvmorg-20.1.8/clang/lib/CodeGen/CGObjCMac.cpp#L5151
735    pub(crate) fn define_objc_module_info(&mut self) {
736        assert_eq!(self.objc_abi_version(), 1);
737
738        // struct _objc_module {
739        //     long version;                // Hardcoded to 7 in Clang.
740        //     long size;                   // sizeof(struct _objc_module)
741        //     char* name;                  // Hardcoded to classname "" in Clang.
742        //     struct _objc_symtab* symtab; // Null without class or category definitions.
743        //  }
744
745        let llty = self.type_named_struct("struct._objc_module");
746        let i32_llty = self.type_i32();
747        let ptr_llty = self.type_ptr();
748        let packed = false;
749        self.set_struct_body(llty, &[i32_llty, i32_llty, ptr_llty, ptr_llty], packed);
750
751        let version = self.const_uint(i32_llty, 7);
752        let size = self.const_uint(i32_llty, 16);
753        let name = self.define_objc_classname("");
754        let symtab = self.const_null(ptr_llty);
755        let llval = crate::common::named_struct(llty, &[version, size, name, symtab]);
756
757        let sym = "OBJC_MODULES";
758        let g = self.define_global(&sym, llty).unwrap_or_else(|| {
759            bug!("symbol `{}` is already defined", sym);
760        });
761        set_global_alignment(self, g, self.tcx.data_layout.pointer_align().abi);
762        llvm::set_initializer(g, llval);
763        llvm::set_linkage(g, llvm::Linkage::PrivateLinkage);
764        llvm::set_section(g, c"__OBJC,__module_info,regular,no_dead_strip");
765
766        self.add_compiler_used_global(g);
767    }
768}
769
770impl<'ll> StaticCodegenMethods for CodegenCx<'ll, '_> {
771    /// Get a pointer to a global variable.
772    ///
773    /// The pointer will always be in the default address space. If global variables default to a
774    /// different address space, an addrspacecast is inserted.
775    fn static_addr_of(&self, cv: &'ll Value, align: Align, kind: Option<&str>) -> &'ll Value {
776        let gv = self.static_addr_of_impl(cv, align, kind);
777        // static_addr_of_impl returns the bare global variable, which might not be in the default
778        // address space. Cast to the default address space if necessary.
779        self.const_pointercast(gv, self.type_ptr())
780    }
781
782    fn codegen_static(&mut self, def_id: DefId) {
783        self.codegen_static_item(def_id)
784    }
785}