// SPDX-License-Identifier: Apache-2.0 use std::env; use std::fs::File; use std::io::{self, Error, ErrorKind, Read, Seek, SeekFrom}; use std::path::{Path, PathBuf}; use super::common; //================================================ // Validation //================================================ /// Extracts the ELF class from the ELF header in a shared library. fn parse_elf_header(path: &Path) -> io::Result { let mut file = File::open(path)?; let mut buffer = [0; 5]; file.read_exact(&mut buffer)?; if buffer[..4] == [127, 69, 76, 70] { Ok(buffer[4]) } else { Err(Error::new(ErrorKind::InvalidData, "invalid ELF header")) } } /// Extracts the magic number and machine type from the PE header in a shared library. fn parse_pe_header(path: &Path) -> io::Result<(u16, u16)> { let mut file = File::open(path)?; // Extract the header offset. let mut buffer = [0; 4]; let start = SeekFrom::Start(0x3C); file.seek(start)?; file.read_exact(&mut buffer)?; let offset = i32::from_le_bytes(buffer); // Check the validity of the header. file.seek(SeekFrom::Start(offset as u64))?; file.read_exact(&mut buffer)?; if buffer != [80, 69, 0, 0] { return Err(Error::new(ErrorKind::InvalidData, "invalid PE header")); } // Extract the magic number. let mut buffer = [0; 2]; file.seek(SeekFrom::Current(20))?; file.read_exact(&mut buffer)?; let magic_number = u16::from_le_bytes(buffer); // Extract the machine type. let mut buffer = [0; 2]; file.seek(SeekFrom::Current(-22))?; file.read_exact(&mut buffer)?; let machine_type = u16::from_le_bytes(buffer); return Ok((magic_number, machine_type)); } /// Checks that a `libclang` shared library matches the target platform. fn validate_library(path: &Path) -> Result<(), String> { if target_os!("linux") || target_os!("freebsd") { let class = parse_elf_header(path).map_err(|e| e.to_string())?; if target_pointer_width!("32") && class != 1 { return Err("invalid ELF class (64-bit)".into()); } if target_pointer_width!("64") && class != 2 { return Err("invalid ELF class (32-bit)".into()); } Ok(()) } else if target_os!("windows") { let (magic, machine_type) = parse_pe_header(path).map_err(|e| e.to_string())?; if target_pointer_width!("32") && magic != 267 { return Err("invalid DLL (64-bit)".into()); } if target_pointer_width!("64") && magic != 523 { return Err("invalid DLL (32-bit)".into()); } let arch_mismatch = match machine_type { 0x014C if !target_arch!("x86") => Some("x86"), 0x8664 if !target_arch!("x86_64") => Some("x86-64"), 0xAA64 if !target_arch!("aarch64") => Some("ARM64"), _ => None, }; if let Some(arch) = arch_mismatch { Err(format!("invalid DLL ({arch})")) } else { Ok(()) } } else { Ok(()) } } //================================================ // Searching //================================================ /// Extracts the version components in a `libclang` shared library filename. fn parse_version(filename: &str) -> Vec { let version = if let Some(version) = filename.strip_prefix("libclang.so.") { version } else if filename.starts_with("libclang-") { &filename[9..filename.len() - 3] } else { return vec![]; }; version.split('.').map(|s| s.parse().unwrap_or(0)).collect() } /// Finds `libclang` shared libraries and returns the paths to, filenames of, /// and versions of those shared libraries. fn search_libclang_directories(runtime: bool) -> Result)>, String> { let mut files = vec![format!( "{}clang{}", env::consts::DLL_PREFIX, env::consts::DLL_SUFFIX )]; if target_os!("linux") { // Some Linux distributions don't create a `libclang.so` symlink, so we // need to look for versioned files (e.g., `libclang-3.9.so`). files.push("libclang-*.so".into()); // Some Linux distributions don't create a `libclang.so` symlink and // don't have versioned files as described above, so we need to look for // suffix versioned files (e.g., `libclang.so.1`). However, `ld` cannot // link to these files, so this will only be included when linking at // runtime. if runtime { files.push("libclang.so.*".into()); files.push("libclang-*.so.*".into()); } } if target_os!("freebsd") || target_os!("haiku") || target_os!("netbsd") || target_os!("openbsd") { // Some BSD distributions don't create a `libclang.so` symlink either, // but use a different naming scheme for versioned files (e.g., // `libclang.so.7.0`). files.push("libclang.so.*".into()); } if target_os!("windows") { // The official LLVM build uses `libclang.dll` on Windows instead of // `clang.dll`. However, unofficial builds such as MinGW use `clang.dll`. files.push("libclang.dll".into()); } // Find and validate `libclang` shared libraries and collect the versions. let mut valid = vec![]; let mut invalid = vec![]; for (directory, filename) in common::search_libclang_directories(&files, "LIBCLANG_PATH") { let path = directory.join(&filename); match validate_library(&path) { Ok(()) => { let version = parse_version(&filename); valid.push((directory, filename, version)) } Err(message) => invalid.push(format!("({}: {})", path.display(), message)), } } if !valid.is_empty() { return Ok(valid); } let message = format!( "couldn't find any valid shared libraries matching: [{}], set the \ `LIBCLANG_PATH` environment variable to a path where one of these files \ can be found (invalid: [{}])", files .iter() .map(|f| format!("'{}'", f)) .collect::>() .join(", "), invalid.join(", "), ); Err(message) } /// Finds the "best" `libclang` shared library and returns the directory and /// filename of that library. pub fn find(runtime: bool) -> Result<(PathBuf, String), String> { search_libclang_directories(runtime)? .iter() // We want to find the `libclang` shared library with the highest // version number, hence `max_by_key` below. // // However, in the case where there are multiple such `libclang` shared // libraries, we want to use the order in which they appeared in the // list returned by `search_libclang_directories` as a tiebreaker since // that function returns `libclang` shared libraries in descending order // of preference by how they were found. // // `max_by_key`, perhaps surprisingly, returns the *last* item with the // maximum key rather than the first which results in the opposite of // the tiebreaking behavior we want. This is easily fixed by reversing // the list first. .rev() .max_by_key(|f| &f.2) .cloned() .map(|(path, filename, _)| (path, filename)) .ok_or_else(|| "unreachable".into()) } //================================================ // Linking //================================================ /// Finds and links to a `libclang` shared library. #[cfg(not(feature = "runtime"))] pub fn link() { let cep = common::CommandErrorPrinter::default(); use std::fs; let (directory, filename) = find(false).unwrap(); println!("cargo:rustc-link-search={}", directory.display()); if cfg!(all(target_os = "windows", target_env = "msvc")) { // Find the `libclang` stub static library required for the MSVC // toolchain. let lib = if !directory.ends_with("bin") { directory } else { directory.parent().unwrap().join("lib") }; if lib.join("libclang.lib").exists() { println!("cargo:rustc-link-search={}", lib.display()); } else if lib.join("libclang.dll.a").exists() { // MSYS and MinGW use `libclang.dll.a` instead of `libclang.lib`. // It is linkable with the MSVC linker, but Rust doesn't recognize // the `.a` suffix, so we need to copy it with a different name. // // FIXME: Maybe we can just hardlink or symlink it? let out = env::var("OUT_DIR").unwrap(); fs::copy( lib.join("libclang.dll.a"), Path::new(&out).join("libclang.lib"), ) .unwrap(); println!("cargo:rustc-link-search=native={}", out); } else { panic!( "using '{}', so 'libclang.lib' or 'libclang.dll.a' must be \ available in {}", filename, lib.display(), ); } println!("cargo:rustc-link-lib=dylib=libclang"); } else { let name = filename.trim_start_matches("lib"); // Strip extensions and trailing version numbers (e.g., the `.so.7.0` in // `libclang.so.7.0`) and also `.dll` for MinGW / MSYS. let name = match name.find(".dylib").or_else(|| name.find(".so")).or_else(|| name.find(".dll")) { Some(index) => &name[0..index], None => name, }; println!("cargo:rustc-link-lib=dylib={}", name); } cep.discard(); }