rustc_codegen_ssa/back/
metadata.rs

1//! Reading of the rustc metadata for rlibs and dylibs
2
3use std::borrow::Cow;
4use std::fs::File;
5use std::io::Write;
6use std::path::Path;
7
8use itertools::Itertools;
9use object::write::{self, StandardSegment, Symbol, SymbolSection};
10use object::{
11    Architecture, BinaryFormat, Endianness, FileFlags, Object, ObjectSection, ObjectSymbol,
12    SectionFlags, SectionKind, SymbolFlags, SymbolKind, SymbolScope, elf, pe, xcoff,
13};
14use rustc_abi::Endian;
15use rustc_data_structures::memmap::Mmap;
16use rustc_data_structures::owned_slice::{OwnedSlice, try_slice_owned};
17use rustc_metadata::EncodedMetadata;
18use rustc_metadata::creader::MetadataLoader;
19use rustc_metadata::fs::METADATA_FILENAME;
20use rustc_middle::bug;
21use rustc_session::Session;
22use rustc_span::sym;
23use rustc_target::spec::{RelocModel, Target, ef_avr_arch};
24use tracing::debug;
25
26use super::apple;
27
28/// The default metadata loader. This is used by cg_llvm and cg_clif.
29///
30/// # Metadata location
31///
32/// <dl>
33/// <dt>rlib</dt>
34/// <dd>The metadata can be found in the `lib.rmeta` file inside of the ar archive.</dd>
35/// <dt>dylib</dt>
36/// <dd>The metadata can be found in the `.rustc` section of the shared library.</dd>
37/// </dl>
38#[derive(Debug)]
39pub(crate) struct DefaultMetadataLoader;
40
41static AIX_METADATA_SYMBOL_NAME: &'static str = "__aix_rust_metadata";
42
43fn load_metadata_with(
44    path: &Path,
45    f: impl for<'a> FnOnce(&'a [u8]) -> Result<&'a [u8], String>,
46) -> Result<OwnedSlice, String> {
47    let file =
48        File::open(path).map_err(|e| format!("failed to open file '{}': {}", path.display(), e))?;
49
50    unsafe { Mmap::map(file) }
51        .map_err(|e| format!("failed to mmap file '{}': {}", path.display(), e))
52        .and_then(|mmap| try_slice_owned(mmap, |mmap| f(mmap)))
53}
54
55impl MetadataLoader for DefaultMetadataLoader {
56    fn get_rlib_metadata(&self, target: &Target, path: &Path) -> Result<OwnedSlice, String> {
57        debug!("getting rlib metadata for {}", path.display());
58        load_metadata_with(path, |data| {
59            let archive = object::read::archive::ArchiveFile::parse(&*data)
60                .map_err(|e| format!("failed to parse rlib '{}': {}", path.display(), e))?;
61
62            for entry_result in archive.members() {
63                let entry = entry_result
64                    .map_err(|e| format!("failed to parse rlib '{}': {}", path.display(), e))?;
65                if entry.name() == METADATA_FILENAME.as_bytes() {
66                    let data = entry
67                        .data(data)
68                        .map_err(|e| format!("failed to parse rlib '{}': {}", path.display(), e))?;
69                    if target.is_like_aix {
70                        return get_metadata_xcoff(path, data);
71                    } else {
72                        return search_for_section(path, data, ".rmeta");
73                    }
74                }
75            }
76
77            Err(format!("metadata not found in rlib '{}'", path.display()))
78        })
79    }
80
81    fn get_dylib_metadata(&self, target: &Target, path: &Path) -> Result<OwnedSlice, String> {
82        debug!("getting dylib metadata for {}", path.display());
83        if target.is_like_aix {
84            load_metadata_with(path, |data| {
85                let archive = object::read::archive::ArchiveFile::parse(&*data).map_err(|e| {
86                    format!("failed to parse aix dylib '{}': {}", path.display(), e)
87                })?;
88
89                match archive.members().exactly_one() {
90                    Ok(lib) => {
91                        let lib = lib.map_err(|e| {
92                            format!("failed to parse aix dylib '{}': {}", path.display(), e)
93                        })?;
94                        let data = lib.data(data).map_err(|e| {
95                            format!("failed to parse aix dylib '{}': {}", path.display(), e)
96                        })?;
97                        get_metadata_xcoff(path, data)
98                    }
99                    Err(e) => Err(format!("failed to parse aix dylib '{}': {}", path.display(), e)),
100                }
101            })
102        } else {
103            load_metadata_with(path, |data| search_for_section(path, data, ".rustc"))
104        }
105    }
106}
107
108pub(super) fn search_for_section<'a>(
109    path: &Path,
110    bytes: &'a [u8],
111    section: &str,
112) -> Result<&'a [u8], String> {
113    let Ok(file) = object::File::parse(bytes) else {
114        // The parse above could fail for odd reasons like corruption, but for
115        // now we just interpret it as this target doesn't support metadata
116        // emission in object files so the entire byte slice itself is probably
117        // a metadata file. Ideally though if necessary we could at least check
118        // the prefix of bytes to see if it's an actual metadata object and if
119        // not forward the error along here.
120        return Ok(bytes);
121    };
122    file.section_by_name(section)
123        .ok_or_else(|| format!("no `{}` section in '{}'", section, path.display()))?
124        .data()
125        .map_err(|e| format!("failed to read {} section in '{}': {}", section, path.display(), e))
126}
127
128fn add_gnu_property_note(
129    file: &mut write::Object<'static>,
130    architecture: Architecture,
131    binary_format: BinaryFormat,
132    endianness: Endianness,
133) {
134    // check bti protection
135    if binary_format != BinaryFormat::Elf
136        || !matches!(architecture, Architecture::X86_64 | Architecture::Aarch64)
137    {
138        return;
139    }
140
141    let section = file.add_section(
142        file.segment_name(StandardSegment::Data).to_vec(),
143        b".note.gnu.property".to_vec(),
144        SectionKind::Note,
145    );
146    let mut data: Vec<u8> = Vec::new();
147    let n_namsz: u32 = 4; // Size of the n_name field
148    let n_descsz: u32 = 16; // Size of the n_desc field
149    let n_type: u32 = object::elf::NT_GNU_PROPERTY_TYPE_0; // Type of note descriptor
150    let header_values = [n_namsz, n_descsz, n_type];
151    header_values.iter().for_each(|v| {
152        data.extend_from_slice(&match endianness {
153            Endianness::Little => v.to_le_bytes(),
154            Endianness::Big => v.to_be_bytes(),
155        })
156    });
157    data.extend_from_slice(b"GNU\0"); // Owner of the program property note
158    let pr_type: u32 = match architecture {
159        Architecture::X86_64 => object::elf::GNU_PROPERTY_X86_FEATURE_1_AND,
160        Architecture::Aarch64 => object::elf::GNU_PROPERTY_AARCH64_FEATURE_1_AND,
161        _ => unreachable!(),
162    };
163    let pr_datasz: u32 = 4; //size of the pr_data field
164    let pr_data: u32 = 3; //program property descriptor
165    let pr_padding: u32 = 0;
166    let property_values = [pr_type, pr_datasz, pr_data, pr_padding];
167    property_values.iter().for_each(|v| {
168        data.extend_from_slice(&match endianness {
169            Endianness::Little => v.to_le_bytes(),
170            Endianness::Big => v.to_be_bytes(),
171        })
172    });
173    file.append_section_data(section, &data, 8);
174}
175
176pub(super) fn get_metadata_xcoff<'a>(path: &Path, data: &'a [u8]) -> Result<&'a [u8], String> {
177    let Ok(file) = object::File::parse(data) else {
178        return Ok(data);
179    };
180    let info_data = search_for_section(path, data, ".info")?;
181    if let Some(metadata_symbol) =
182        file.symbols().find(|sym| sym.name() == Ok(AIX_METADATA_SYMBOL_NAME))
183    {
184        let offset = metadata_symbol.address() as usize;
185        // The offset specifies the location of rustc metadata in the .info section of XCOFF.
186        // Each string stored in .info section of XCOFF is preceded by a 4-byte length field.
187        if offset < 4 {
188            return Err(format!("Invalid metadata symbol offset: {offset}"));
189        }
190        // XCOFF format uses big-endian byte order.
191        let len = u32::from_be_bytes(info_data[(offset - 4)..offset].try_into().unwrap()) as usize;
192        if offset + len > (info_data.len() as usize) {
193            return Err(format!(
194                "Metadata at offset {offset} with size {len} is beyond .info section"
195            ));
196        }
197        Ok(&info_data[offset..(offset + len)])
198    } else {
199        Err(format!("Unable to find symbol {AIX_METADATA_SYMBOL_NAME}"))
200    }
201}
202
203pub(crate) fn create_object_file(sess: &Session) -> Option<write::Object<'static>> {
204    let endianness = match sess.target.options.endian {
205        Endian::Little => Endianness::Little,
206        Endian::Big => Endianness::Big,
207    };
208    let Some((architecture, sub_architecture)) =
209        sess.target.object_architecture(&sess.unstable_target_features)
210    else {
211        return None;
212    };
213    let binary_format = sess.target.binary_format.to_object();
214
215    let mut file = write::Object::new(binary_format, architecture, endianness);
216    file.set_sub_architecture(sub_architecture);
217    if sess.target.is_like_darwin {
218        if macho_is_arm64e(&sess.target) {
219            file.set_macho_cpu_subtype(object::macho::CPU_SUBTYPE_ARM64E);
220        }
221
222        file.set_macho_build_version(macho_object_build_version_for_target(sess))
223    }
224    if binary_format == BinaryFormat::Coff {
225        // Disable the default mangler to avoid mangling the special "@feat.00" symbol name.
226        let original_mangling = file.mangling();
227        file.set_mangling(object::write::Mangling::None);
228
229        let mut feature = 0;
230
231        if file.architecture() == object::Architecture::I386 {
232            // When linking with /SAFESEH on x86, lld requires that all linker inputs be marked as
233            // safe exception handling compatible. Metadata files masquerade as regular COFF
234            // objects and are treated as linker inputs, despite containing no actual code. Thus,
235            // they still need to be marked as safe exception handling compatible. See #96498.
236            // Reference: https://docs.microsoft.com/en-us/windows/win32/debug/pe-format
237            feature |= 1;
238        }
239
240        file.add_symbol(object::write::Symbol {
241            name: "@feat.00".into(),
242            value: feature,
243            size: 0,
244            kind: object::SymbolKind::Data,
245            scope: object::SymbolScope::Compilation,
246            weak: false,
247            section: object::write::SymbolSection::Absolute,
248            flags: object::SymbolFlags::None,
249        });
250
251        file.set_mangling(original_mangling);
252    }
253    let e_flags = elf_e_flags(architecture, sess);
254    // adapted from LLVM's `MCELFObjectTargetWriter::getOSABI`
255    let os_abi = elf_os_abi(sess);
256    let abi_version = 0;
257    add_gnu_property_note(&mut file, architecture, binary_format, endianness);
258    file.flags = FileFlags::Elf { os_abi, abi_version, e_flags };
259    Some(file)
260}
261
262pub(super) fn elf_os_abi(sess: &Session) -> u8 {
263    match sess.target.options.os.as_ref() {
264        "hermit" => elf::ELFOSABI_STANDALONE,
265        "freebsd" => elf::ELFOSABI_FREEBSD,
266        "solaris" => elf::ELFOSABI_SOLARIS,
267        _ => elf::ELFOSABI_NONE,
268    }
269}
270
271pub(super) fn elf_e_flags(architecture: Architecture, sess: &Session) -> u32 {
272    match architecture {
273        Architecture::Mips | Architecture::Mips64 | Architecture::Mips64_N32 => {
274            // "N32" indicates an "ILP32" data model on a 64-bit MIPS CPU
275            // like SPARC's "v8+", x86_64's "x32", or the watchOS "arm64_32".
276            let is_32bit = architecture == Architecture::Mips;
277            let mut e_flags = match sess.target.options.cpu.as_ref() {
278                "mips1" if is_32bit => elf::EF_MIPS_ARCH_1,
279                "mips2" if is_32bit => elf::EF_MIPS_ARCH_2,
280                "mips3" => elf::EF_MIPS_ARCH_3,
281                "mips4" => elf::EF_MIPS_ARCH_4,
282                "mips5" => elf::EF_MIPS_ARCH_5,
283                "mips32r2" if is_32bit => elf::EF_MIPS_ARCH_32R2,
284                "mips32r6" if is_32bit => elf::EF_MIPS_ARCH_32R6,
285                "mips64r2" if !is_32bit => elf::EF_MIPS_ARCH_64R2,
286                "mips64r6" if !is_32bit => elf::EF_MIPS_ARCH_64R6,
287                s if s.starts_with("mips32") && !is_32bit => {
288                    sess.dcx().fatal(format!("invalid CPU `{}` for 64-bit MIPS target", s))
289                }
290                s if s.starts_with("mips64") && is_32bit => {
291                    sess.dcx().fatal(format!("invalid CPU `{}` for 32-bit MIPS target", s))
292                }
293                _ if is_32bit => elf::EF_MIPS_ARCH_32R2,
294                _ => elf::EF_MIPS_ARCH_64R2,
295            };
296
297            // If the ABI is explicitly given, use it, or default to O32 on 32-bit MIPS,
298            // which is the only "true" 32-bit option that LLVM supports.
299            match sess.target.options.llvm_abiname.as_ref() {
300                "o32" if is_32bit => e_flags |= elf::EF_MIPS_ABI_O32,
301                "n32" if !is_32bit => e_flags |= elf::EF_MIPS_ABI2,
302                "n64" if !is_32bit => {}
303                "" if is_32bit => e_flags |= elf::EF_MIPS_ABI_O32,
304                "" => sess.dcx().fatal("LLVM ABI must be specifed for 64-bit MIPS targets"),
305                s if is_32bit => {
306                    sess.dcx().fatal(format!("invalid LLVM ABI `{}` for 32-bit MIPS target", s))
307                }
308                s => sess.dcx().fatal(format!("invalid LLVM ABI `{}` for 64-bit MIPS target", s)),
309            };
310
311            if sess.target.options.relocation_model != RelocModel::Static {
312                // PIC means position-independent code. CPIC means "calls PIC".
313                // CPIC was mutually exclusive with PIC according to
314                // the SVR4 MIPS ABI https://refspecs.linuxfoundation.org/elf/mipsabi.pdf
315                // and should have only appeared on static objects with dynamically calls.
316                // At some point someone (GCC?) decided to set CPIC even for PIC.
317                // Nowadays various things expect both set on the same object file
318                // and may even error if you mix CPIC and non-CPIC object files,
319                // despite that being the entire point of the CPIC ABI extension!
320                // As we are in Rome, we do as the Romans do.
321                e_flags |= elf::EF_MIPS_PIC | elf::EF_MIPS_CPIC;
322            }
323            if sess.target.options.cpu.contains("r6") {
324                e_flags |= elf::EF_MIPS_NAN2008;
325            }
326            e_flags
327        }
328        Architecture::Riscv32 | Architecture::Riscv64 => {
329            // Source: https://github.com/riscv-non-isa/riscv-elf-psabi-doc/blob/079772828bd10933d34121117a222b4cc0ee2200/riscv-elf.adoc
330            let mut e_flags: u32 = 0x0;
331
332            // Check if compressed is enabled
333            // `unstable_target_features` is used here because "c" is gated behind riscv_target_feature.
334            if sess.unstable_target_features.contains(&sym::c) {
335                e_flags |= elf::EF_RISCV_RVC;
336            }
337
338            // Set the appropriate flag based on ABI
339            // This needs to match LLVM `RISCVELFStreamer.cpp`
340            match &*sess.target.llvm_abiname {
341                "ilp32" | "lp64" => (),
342                "ilp32f" | "lp64f" => e_flags |= elf::EF_RISCV_FLOAT_ABI_SINGLE,
343                "ilp32d" | "lp64d" => e_flags |= elf::EF_RISCV_FLOAT_ABI_DOUBLE,
344                // Note that the `lp64e` is still unstable as it's not (yet) part of the ELF psABI.
345                "ilp32e" | "lp64e" => e_flags |= elf::EF_RISCV_RVE,
346                _ => bug!("unknown RISC-V ABI name"),
347            }
348
349            e_flags
350        }
351        Architecture::LoongArch64 => {
352            // Source: https://github.com/loongson/la-abi-specs/blob/release/laelf.adoc#e_flags-identifies-abi-type-and-version
353            let mut e_flags: u32 = elf::EF_LARCH_OBJABI_V1;
354
355            // Set the appropriate flag based on ABI
356            // This needs to match LLVM `LoongArchELFStreamer.cpp`
357            match &*sess.target.llvm_abiname {
358                "ilp32s" | "lp64s" => e_flags |= elf::EF_LARCH_ABI_SOFT_FLOAT,
359                "ilp32f" | "lp64f" => e_flags |= elf::EF_LARCH_ABI_SINGLE_FLOAT,
360                "ilp32d" | "lp64d" => e_flags |= elf::EF_LARCH_ABI_DOUBLE_FLOAT,
361                _ => bug!("unknown LoongArch ABI name"),
362            }
363
364            e_flags
365        }
366        Architecture::Avr => {
367            // Resolve the ISA revision and set
368            // the appropriate EF_AVR_ARCH flag.
369            if let Some(ref cpu) = sess.opts.cg.target_cpu {
370                ef_avr_arch(cpu)
371            } else {
372                bug!("AVR CPU not explicitly specified")
373            }
374        }
375        Architecture::Csky => {
376            let e_flags = match sess.target.options.abi.as_ref() {
377                "abiv2" => elf::EF_CSKY_ABIV2,
378                _ => elf::EF_CSKY_ABIV1,
379            };
380            e_flags
381        }
382        _ => 0,
383    }
384}
385
386/// Mach-O files contain information about:
387/// - The platform/OS they were built for (macOS/watchOS/Mac Catalyst/iOS simulator etc).
388/// - The minimum OS version / deployment target.
389/// - The version of the SDK they were targetting.
390///
391/// In the past, this was accomplished using the LC_VERSION_MIN_MACOSX, LC_VERSION_MIN_IPHONEOS,
392/// LC_VERSION_MIN_TVOS or LC_VERSION_MIN_WATCHOS load commands, which each contain information
393/// about the deployment target and SDK version, and implicitly, by their presence, which OS they
394/// target. Simulator targets were determined if the architecture was x86_64, but there was e.g. a
395/// LC_VERSION_MIN_IPHONEOS present.
396///
397/// This is of course brittle and limited, so modern tooling emit the LC_BUILD_VERSION load
398/// command (which contains all three pieces of information in one) when the deployment target is
399/// high enough, or the target is something that wouldn't be encodable with the old load commands
400/// (such as Mac Catalyst, or Aarch64 iOS simulator).
401///
402/// Since Xcode 15, Apple's LD apparently requires object files to use this load command, so this
403/// returns the `MachOBuildVersion` for the target to do so.
404fn macho_object_build_version_for_target(sess: &Session) -> object::write::MachOBuildVersion {
405    /// The `object` crate demands "X.Y.Z encoded in nibbles as xxxx.yy.zz"
406    /// e.g. minOS 14.0 = 0x000E0000, or SDK 16.2 = 0x00100200
407    fn pack_version(apple::OSVersion { major, minor, patch }: apple::OSVersion) -> u32 {
408        let (major, minor, patch) = (major as u32, minor as u32, patch as u32);
409        (major << 16) | (minor << 8) | patch
410    }
411
412    let platform = apple::macho_platform(&sess.target);
413    let min_os = sess.apple_deployment_target();
414
415    let mut build_version = object::write::MachOBuildVersion::default();
416    build_version.platform = platform;
417    build_version.minos = pack_version(min_os);
418    // The version here does not _really_ matter, since it is only used at runtime, and we specify
419    // it when linking the final binary, so we will omit the version. This is also what LLVM does,
420    // and the tooling also allows this (and shows the SDK version as `n/a`). Finally, it is the
421    // semantically correct choice, as the SDK has not influenced the binary generated by rustc at
422    // this point in time.
423    build_version.sdk = 0;
424
425    build_version
426}
427
428/// Is Apple's CPU subtype `arm64e`s
429fn macho_is_arm64e(target: &Target) -> bool {
430    target.llvm_target.starts_with("arm64e")
431}
432
433pub(crate) enum MetadataPosition {
434    First,
435    Last,
436}
437
438/// For rlibs we "pack" rustc metadata into a dummy object file.
439///
440/// Historically it was needed because rustc linked rlibs as whole-archive in some cases.
441/// In that case linkers try to include all files located in an archive, so if metadata is stored
442/// in an archive then it needs to be of a form that the linker is able to process.
443/// Now it's not clear whether metadata still needs to be wrapped into an object file or not.
444///
445/// Note, though, that we don't actually want this metadata to show up in any
446/// final output of the compiler. Instead this is purely for rustc's own
447/// metadata tracking purposes.
448///
449/// With the above in mind, each "flavor" of object format gets special
450/// handling here depending on the target:
451///
452/// * MachO - macos-like targets will insert the metadata into a section that
453///   is sort of fake dwarf debug info. Inspecting the source of the macos
454///   linker this causes these sections to be skipped automatically because
455///   it's not in an allowlist of otherwise well known dwarf section names to
456///   go into the final artifact.
457///
458/// * WebAssembly - this uses wasm files themselves as the object file format
459///   so an empty file with no linking metadata but a single custom section is
460///   created holding our metadata.
461///
462/// * COFF - Windows-like targets create an object with a section that has
463///   the `IMAGE_SCN_LNK_REMOVE` flag set which ensures that if the linker
464///   ever sees the section it doesn't process it and it's removed.
465///
466/// * ELF - All other targets are similar to Windows in that there's a
467///   `SHF_EXCLUDE` flag we can set on sections in an object file to get
468///   automatically removed from the final output.
469pub(crate) fn create_wrapper_file(
470    sess: &Session,
471    section_name: String,
472    data: &[u8],
473) -> (Vec<u8>, MetadataPosition) {
474    let Some(mut file) = create_object_file(sess) else {
475        if sess.target.is_like_wasm {
476            return (
477                create_metadata_file_for_wasm(sess, data, &section_name),
478                MetadataPosition::First,
479            );
480        }
481
482        // Targets using this branch don't have support implemented here yet or
483        // they're not yet implemented in the `object` crate and will likely
484        // fill out this module over time.
485        return (data.to_vec(), MetadataPosition::Last);
486    };
487    let section = if file.format() == BinaryFormat::Xcoff {
488        file.add_section(Vec::new(), b".info".to_vec(), SectionKind::Debug)
489    } else {
490        file.add_section(
491            file.segment_name(StandardSegment::Debug).to_vec(),
492            section_name.into_bytes(),
493            SectionKind::Debug,
494        )
495    };
496    match file.format() {
497        BinaryFormat::Coff => {
498            file.section_mut(section).flags =
499                SectionFlags::Coff { characteristics: pe::IMAGE_SCN_LNK_REMOVE };
500        }
501        BinaryFormat::Elf => {
502            file.section_mut(section).flags =
503                SectionFlags::Elf { sh_flags: elf::SHF_EXCLUDE as u64 };
504        }
505        BinaryFormat::Xcoff => {
506            // AIX system linker may aborts if it meets a valid XCOFF file in archive with no .text, no .data and no .bss.
507            file.add_section(Vec::new(), b".text".to_vec(), SectionKind::Text);
508            file.section_mut(section).flags =
509                SectionFlags::Xcoff { s_flags: xcoff::STYP_INFO as u32 };
510            // Encode string stored in .info section of XCOFF.
511            // FIXME: The length of data here is not guaranteed to fit in a u32.
512            // We may have to split the data into multiple pieces in order to
513            // store in .info section.
514            let len: u32 = data.len().try_into().unwrap();
515            let offset = file.append_section_data(section, &len.to_be_bytes(), 1);
516            // Add a symbol referring to the data in .info section.
517            file.add_symbol(Symbol {
518                name: AIX_METADATA_SYMBOL_NAME.into(),
519                value: offset + 4,
520                size: 0,
521                kind: SymbolKind::Unknown,
522                scope: SymbolScope::Compilation,
523                weak: false,
524                section: SymbolSection::Section(section),
525                flags: SymbolFlags::Xcoff {
526                    n_sclass: xcoff::C_INFO,
527                    x_smtyp: xcoff::C_HIDEXT,
528                    x_smclas: xcoff::C_HIDEXT,
529                    containing_csect: None,
530                },
531            });
532        }
533        _ => {}
534    };
535    file.append_section_data(section, data, 1);
536    (file.write().unwrap(), MetadataPosition::First)
537}
538
539// Historical note:
540//
541// When using link.exe it was seen that the section name `.note.rustc`
542// was getting shortened to `.note.ru`, and according to the PE and COFF
543// specification:
544//
545// > Executable images do not use a string table and do not support
546// > section names longer than 8 characters
547//
548// https://docs.microsoft.com/en-us/windows/win32/debug/pe-format
549//
550// As a result, we choose a slightly shorter name! As to why
551// `.note.rustc` works on MinGW, see
552// https://github.com/llvm/llvm-project/blob/llvmorg-12.0.0/lld/COFF/Writer.cpp#L1190-L1197
553pub fn create_compressed_metadata_file(
554    sess: &Session,
555    metadata: &EncodedMetadata,
556    symbol_name: &str,
557) -> Vec<u8> {
558    let mut packed_metadata = rustc_metadata::METADATA_HEADER.to_vec();
559    packed_metadata.write_all(&(metadata.stub_or_full().len() as u64).to_le_bytes()).unwrap();
560    packed_metadata.extend(metadata.stub_or_full());
561
562    let Some(mut file) = create_object_file(sess) else {
563        if sess.target.is_like_wasm {
564            return create_metadata_file_for_wasm(sess, &packed_metadata, ".rustc");
565        }
566        return packed_metadata.to_vec();
567    };
568    if file.format() == BinaryFormat::Xcoff {
569        return create_compressed_metadata_file_for_xcoff(file, &packed_metadata, symbol_name);
570    }
571    let section = file.add_section(
572        file.segment_name(StandardSegment::Data).to_vec(),
573        b".rustc".to_vec(),
574        SectionKind::ReadOnlyData,
575    );
576    match file.format() {
577        BinaryFormat::Elf => {
578            // Explicitly set no flags to avoid SHF_ALLOC default for data section.
579            file.section_mut(section).flags = SectionFlags::Elf { sh_flags: 0 };
580        }
581        _ => {}
582    };
583    let offset = file.append_section_data(section, &packed_metadata, 1);
584
585    // For MachO and probably PE this is necessary to prevent the linker from throwing away the
586    // .rustc section. For ELF this isn't necessary, but it also doesn't harm.
587    file.add_symbol(Symbol {
588        name: symbol_name.as_bytes().to_vec(),
589        value: offset,
590        size: packed_metadata.len() as u64,
591        kind: SymbolKind::Data,
592        scope: SymbolScope::Dynamic,
593        weak: false,
594        section: SymbolSection::Section(section),
595        flags: SymbolFlags::None,
596    });
597
598    file.write().unwrap()
599}
600
601/// * Xcoff - On AIX, custom sections are merged into predefined sections,
602///   so custom .rustc section is not preserved during linking.
603///   For this reason, we store metadata in predefined .info section, and
604///   define a symbol to reference the metadata. To preserve metadata during
605///   linking on AIX, we have to
606///   1. Create an empty .text section, a empty .data section.
607///   2. Define an empty symbol named `symbol_name` inside .data section.
608///   3. Define an symbol named `AIX_METADATA_SYMBOL_NAME` referencing
609///      data inside .info section.
610///   From XCOFF's view, (2) creates a csect entry in the symbol table, the
611///   symbol created by (3) is a info symbol for the preceding csect. Thus
612///   two symbols are preserved during linking and we can use the second symbol
613///   to reference the metadata.
614pub fn create_compressed_metadata_file_for_xcoff(
615    mut file: write::Object<'_>,
616    data: &[u8],
617    symbol_name: &str,
618) -> Vec<u8> {
619    assert!(file.format() == BinaryFormat::Xcoff);
620    // AIX system linker may aborts if it meets a valid XCOFF file in archive with no .text, no .data and no .bss.
621    file.add_section(Vec::new(), b".text".to_vec(), SectionKind::Text);
622    let data_section = file.add_section(Vec::new(), b".data".to_vec(), SectionKind::Data);
623    let section = file.add_section(Vec::new(), b".info".to_vec(), SectionKind::Debug);
624    file.add_file_symbol("lib.rmeta".into());
625    file.section_mut(section).flags = SectionFlags::Xcoff { s_flags: xcoff::STYP_INFO as u32 };
626    // Add a global symbol to data_section.
627    file.add_symbol(Symbol {
628        name: symbol_name.as_bytes().into(),
629        value: 0,
630        size: 0,
631        kind: SymbolKind::Data,
632        scope: SymbolScope::Dynamic,
633        weak: true,
634        section: SymbolSection::Section(data_section),
635        flags: SymbolFlags::None,
636    });
637    let len: u32 = data.len().try_into().unwrap();
638    let offset = file.append_section_data(section, &len.to_be_bytes(), 1);
639    // Add a symbol referring to the rustc metadata.
640    file.add_symbol(Symbol {
641        name: AIX_METADATA_SYMBOL_NAME.into(),
642        value: offset + 4, // The metadata is preceded by a 4-byte length field.
643        size: 0,
644        kind: SymbolKind::Unknown,
645        scope: SymbolScope::Dynamic,
646        weak: false,
647        section: SymbolSection::Section(section),
648        flags: SymbolFlags::Xcoff {
649            n_sclass: xcoff::C_INFO,
650            x_smtyp: xcoff::C_HIDEXT,
651            x_smclas: xcoff::C_HIDEXT,
652            containing_csect: None,
653        },
654    });
655    file.append_section_data(section, data, 1);
656    file.write().unwrap()
657}
658
659/// Creates a simple WebAssembly object file, which is itself a wasm module,
660/// that contains a custom section of the name `section_name` with contents
661/// `data`.
662///
663/// NB: the `object` crate does not yet have support for writing the wasm
664/// object file format. In lieu of that the `wasm-encoder` crate is used to
665/// build a wasm file by hand.
666///
667/// The wasm object file format is defined at
668/// <https://github.com/WebAssembly/tool-conventions/blob/main/Linking.md>
669/// and mainly consists of a `linking` custom section. In this case the custom
670/// section there is empty except for a version marker indicating what format
671/// it's in.
672///
673/// The main purpose of this is to contain a custom section with `section_name`,
674/// which is then appended after `linking`.
675///
676/// As a further detail the object needs to have a 64-bit memory if `wasm64` is
677/// the target or otherwise it's interpreted as a 32-bit object which is
678/// incompatible with 64-bit ones.
679pub fn create_metadata_file_for_wasm(sess: &Session, data: &[u8], section_name: &str) -> Vec<u8> {
680    assert!(sess.target.is_like_wasm);
681    let mut module = wasm_encoder::Module::new();
682    let mut imports = wasm_encoder::ImportSection::new();
683
684    if sess.target.pointer_width == 64 {
685        imports.import(
686            "env",
687            "__linear_memory",
688            wasm_encoder::MemoryType {
689                minimum: 0,
690                maximum: None,
691                memory64: true,
692                shared: false,
693                page_size_log2: None,
694            },
695        );
696    }
697
698    if imports.len() > 0 {
699        module.section(&imports);
700    }
701    module.section(&wasm_encoder::CustomSection {
702        name: "linking".into(),
703        data: Cow::Borrowed(&[2]),
704    });
705    module.section(&wasm_encoder::CustomSection { name: section_name.into(), data: data.into() });
706    module.finish()
707}