use crate::config::LLVM;
use crate::config::OptimizationStyle;
use crate::translator::FuncTrampoline;
use crate::translator::FuncTranslator;
use rayon::ThreadPoolBuilder;
use rayon::prelude::{IntoParallelRefIterator, ParallelIterator};
use std::{
borrow::Cow,
collections::{HashMap, HashSet},
sync::Arc,
};
use wasmer_compiler::progress::ProgressContext;
use wasmer_compiler::types::function::{Compilation, UnwindInfo};
use wasmer_compiler::types::module::CompileModuleInfo;
use wasmer_compiler::types::relocation::RelocationKind;
use wasmer_compiler::{
Compiler, FunctionBodyData, ModuleMiddleware, ModuleTranslationState,
types::{
relocation::RelocationTarget,
section::{CustomSection, CustomSectionProtection, SectionBody, SectionIndex},
symbols::{Symbol, SymbolRegistry},
},
};
use wasmer_compiler::{
WASM_LARGE_FUNCTION_THRESHOLD, WASM_TRAMPOLINE_ESTIMATED_BODY_SIZE, build_function_buckets,
translate_function_buckets,
};
use wasmer_types::ExportIndex;
use wasmer_types::entity::{EntityRef, PrimaryMap};
use wasmer_types::target::Target;
use wasmer_types::{
CompilationProgressCallback, CompileError, FunctionIndex, LocalFunctionIndex, ModuleInfo,
SignatureIndex,
};
use wasmer_vm::LibCall;
#[derive(Debug)]
pub struct LLVMCompiler {
config: LLVM,
}
impl LLVMCompiler {
pub fn new(config: LLVM) -> LLVMCompiler {
LLVMCompiler { config }
}
fn config(&self) -> &LLVM {
&self.config
}
}
struct ShortNames {}
impl SymbolRegistry for ShortNames {
fn symbol_to_name(&self, symbol: Symbol) -> String {
match symbol {
Symbol::Metadata => "M".to_string(),
Symbol::LocalFunction(index) => format!("f{}", index.index()),
Symbol::Section(index) => format!("s{}", index.index()),
Symbol::FunctionCallTrampoline(index) => format!("t{}", index.index()),
Symbol::DynamicFunctionTrampoline(index) => format!("d{}", index.index()),
}
}
fn name_to_symbol(&self, name: &str) -> Option<Symbol> {
if name.len() < 2 {
return None;
}
let (ty, idx) = name.split_at(1);
if ty.starts_with('M') {
return Some(Symbol::Metadata);
}
let idx = idx.parse::<u32>().ok()?;
match ty.chars().next().unwrap() {
'f' => Some(Symbol::LocalFunction(LocalFunctionIndex::from_u32(idx))),
's' => Some(Symbol::Section(SectionIndex::from_u32(idx))),
't' => Some(Symbol::FunctionCallTrampoline(SignatureIndex::from_u32(
idx,
))),
'd' => Some(Symbol::DynamicFunctionTrampoline(FunctionIndex::from_u32(
idx,
))),
_ => None,
}
}
}
pub(crate) struct ModuleBasedSymbolRegistry {
wasm_module: Arc<ModuleInfo>,
local_func_names: HashMap<String, LocalFunctionIndex>,
short_names: ShortNames,
}
impl ModuleBasedSymbolRegistry {
const PROBLEMATIC_PREFIXES: &[&'static str] = &[
".L", "llvm.", ];
fn new(wasm_module: Arc<ModuleInfo>) -> Self {
let local_func_names = HashMap::from_iter(
wasm_module
.function_names
.iter()
.map(|(f, v)| (wasm_module.local_func_index(*f), v))
.filter(|(f, _)| f.is_some())
.map(|(f, v)| (format!("{}_{}", v.clone(), f.unwrap().as_u32()), f.unwrap())),
);
Self {
wasm_module,
local_func_names,
short_names: ShortNames {},
}
}
fn fixup_problematic_name(name: &str) -> Cow<'_, str> {
for prefix in Self::PROBLEMATIC_PREFIXES {
if name.starts_with(prefix) {
return format!("_{name}").into();
}
}
name.into()
}
fn unfixup_problematic_name(name: &str) -> &str {
if let Some(stripped_name) = name.strip_prefix('_') {
for prefix in Self::PROBLEMATIC_PREFIXES {
if stripped_name.starts_with(prefix) {
return stripped_name;
}
}
}
name
}
}
impl SymbolRegistry for ModuleBasedSymbolRegistry {
fn symbol_to_name(&self, symbol: Symbol) -> String {
match symbol {
Symbol::LocalFunction(index) => self
.wasm_module
.function_names
.get(&self.wasm_module.func_index(index))
.map(|name| format!("{}_{}", Self::fixup_problematic_name(name), index.as_u32()))
.unwrap_or(self.short_names.symbol_to_name(symbol)),
_ => self.short_names.symbol_to_name(symbol),
}
}
fn name_to_symbol(&self, name: &str) -> Option<Symbol> {
let name = Self::unfixup_problematic_name(name);
if let Some(idx) = self.local_func_names.get(name) {
Some(Symbol::LocalFunction(*idx))
} else {
self.short_names.name_to_symbol(name)
}
}
}
impl Compiler for LLVMCompiler {
fn name(&self) -> &str {
"llvm"
}
fn get_perfmap_enabled(&self) -> bool {
self.config.enable_perfmap
}
fn deterministic_id(&self) -> String {
format!(
"llvm-{}",
match self.config.opt_level {
inkwell::OptimizationLevel::None => "opt0",
inkwell::OptimizationLevel::Less => "optl",
inkwell::OptimizationLevel::Default => "optd",
inkwell::OptimizationLevel::Aggressive => "opta",
}
)
}
fn get_middlewares(&self) -> &[Arc<dyn ModuleMiddleware>] {
&self.config.middlewares
}
fn compile_module(
&self,
target: &Target,
compile_info: &CompileModuleInfo,
module_translation: &ModuleTranslationState,
function_body_inputs: PrimaryMap<LocalFunctionIndex, FunctionBodyData<'_>>,
progress_callback: Option<&CompilationProgressCallback>,
) -> Result<Compilation, CompileError> {
let binary_format = self.config.target_binary_format(target);
let module = &compile_info.module;
let module_hash = module.hash_string();
let total_function_call_trampolines = module.signatures.len();
let total_dynamic_trampolines = module.num_imported_functions;
let total_steps = WASM_TRAMPOLINE_ESTIMATED_BODY_SIZE
* ((total_dynamic_trampolines + total_function_call_trampolines) as u64)
+ function_body_inputs
.iter()
.map(|(_, body)| body.data.len() as u64)
.sum::<u64>();
let progress = progress_callback
.cloned()
.map(|cb| ProgressContext::new(cb, total_steps, "Compiling functions"));
let mut module_custom_sections = PrimaryMap::new();
let mut eh_frame_section_bytes = vec![];
let mut eh_frame_section_relocations = vec![];
let mut compact_unwind_section_bytes = vec![];
let mut compact_unwind_section_relocations = vec![];
let mut got_targets: HashSet<wasmer_compiler::types::relocation::RelocationTarget> = if matches!(
target.triple().binary_format,
target_lexicon::BinaryFormat::Macho
) {
HashSet::from_iter(vec![RelocationTarget::LibCall(LibCall::EHPersonality)])
} else {
HashSet::default()
};
let symbol_registry = ModuleBasedSymbolRegistry::new(module.clone());
let module = &compile_info.module;
let memory_styles = &compile_info.memory_styles;
let table_styles = &compile_info.table_styles;
let pool = ThreadPoolBuilder::new()
.num_threads(self.config.num_threads.get())
.build()
.map_err(|e| CompileError::Resource(e.to_string()))?;
let buckets =
build_function_buckets(&function_body_inputs, WASM_LARGE_FUNCTION_THRESHOLD / 3);
let largest_bucket = buckets.first().map(|b| b.size).unwrap_or_default();
tracing::debug!(buckets = buckets.len(), largest_bucket, "buckets built");
let functions = translate_function_buckets(
&pool,
|| {
let compiler = &self;
let target_machines = enum_iterator::all::<OptimizationStyle>()
.map(|style| {
(
style,
compiler.config().target_machine_with_opt(target, style),
)
})
.collect();
let pointer_width = target.triple().pointer_width().unwrap().bytes();
FuncTranslator::new(
target.triple().clone(),
target_machines,
binary_format,
pointer_width,
*target.cpu_features(),
self.config.enable_non_volatile_memops,
module
.exports
.get("__wasm_apply_data_relocs")
.and_then(|export| {
if let ExportIndex::Function(index) = export {
Some(*index)
} else {
None
}
}),
)
.unwrap()
},
|func_translator, i, input| {
func_translator.translate(
module,
module_translation,
i,
input,
self.config(),
memory_styles,
table_styles,
&symbol_registry,
target.triple(),
)
},
progress.clone(),
&buckets,
)?;
let functions = functions
.into_iter()
.map(|mut compiled_function| {
let first_section = module_custom_sections.len() as u32;
for (section_index, custom_section) in compiled_function.custom_sections.iter() {
let mut custom_section = custom_section.clone();
for reloc in &mut custom_section.relocations {
if let RelocationTarget::CustomSection(index) = reloc.reloc_target {
reloc.reloc_target = RelocationTarget::CustomSection(
SectionIndex::from_u32(first_section + index.as_u32()),
)
}
if reloc.kind.needs_got() {
got_targets.insert(reloc.reloc_target);
}
}
if compiled_function
.eh_frame_section_indices
.contains(§ion_index)
{
let offset = eh_frame_section_bytes.len() as u32;
for reloc in &mut custom_section.relocations {
reloc.offset += offset;
}
eh_frame_section_bytes.extend_from_slice(custom_section.bytes.as_slice());
eh_frame_section_bytes.extend_from_slice(&[0, 0, 0, 0]);
eh_frame_section_relocations.extend(custom_section.relocations);
module_custom_sections.push(CustomSection {
protection: CustomSectionProtection::Read,
alignment: None,
bytes: SectionBody::new_with_vec(vec![]),
relocations: vec![],
});
} else if compiled_function
.compact_unwind_section_indices
.contains(§ion_index)
{
let offset = compact_unwind_section_bytes.len() as u32;
for reloc in &mut custom_section.relocations {
reloc.offset += offset;
}
compact_unwind_section_bytes
.extend_from_slice(custom_section.bytes.as_slice());
compact_unwind_section_relocations.extend(custom_section.relocations);
module_custom_sections.push(CustomSection {
protection: CustomSectionProtection::Read,
alignment: None,
bytes: SectionBody::new_with_vec(vec![]),
relocations: vec![],
});
} else {
module_custom_sections.push(custom_section);
}
}
for reloc in &mut compiled_function.compiled_function.relocations {
if let RelocationTarget::CustomSection(index) = reloc.reloc_target {
reloc.reloc_target = RelocationTarget::CustomSection(
SectionIndex::from_u32(first_section + index.as_u32()),
)
}
if reloc.kind.needs_got() {
got_targets.insert(reloc.reloc_target);
}
}
compiled_function.compiled_function
})
.collect::<PrimaryMap<LocalFunctionIndex, _>>();
let progress = progress.clone();
let function_call_trampolines = pool.install(|| {
module
.signatures
.values()
.collect::<Vec<_>>()
.par_iter()
.map_init(
|| {
let target_machine = self.config().target_machine(target);
FuncTrampoline::new(target_machine, target.triple().clone(), binary_format)
.unwrap()
},
|func_trampoline, sig| {
let trampoline =
func_trampoline.trampoline(sig, self.config(), "", compile_info);
if let Some(progress) = progress.as_ref() {
progress.notify_steps(WASM_TRAMPOLINE_ESTIMATED_BODY_SIZE)?;
}
trampoline
},
)
.collect::<Vec<_>>()
.into_iter()
.collect::<Result<PrimaryMap<_, _>, CompileError>>()
})?;
let dynamic_function_trampolines = {
let progress = progress.clone();
let target_machine = self.config().target_machine(target);
let func_trampoline =
FuncTrampoline::new(target_machine, target.triple().clone(), binary_format)
.unwrap();
module
.imported_function_types()
.collect::<Vec<_>>()
.into_iter()
.enumerate()
.map(|(index, func_type)| {
let trampoline = func_trampoline.dynamic_trampoline(
&func_type,
self.config(),
"",
index as u32,
&mut module_custom_sections,
&mut eh_frame_section_bytes,
&mut eh_frame_section_relocations,
&mut compact_unwind_section_bytes,
&mut compact_unwind_section_relocations,
&module_hash,
)?;
if let Some(progress) = progress.as_ref() {
progress.notify_steps(WASM_TRAMPOLINE_ESTIMATED_BODY_SIZE)?;
}
Ok(trampoline)
})
.collect::<Vec<_>>()
.into_iter()
.collect::<Result<PrimaryMap<_, _>, CompileError>>()?
};
let mut unwind_info = UnwindInfo::default();
if !eh_frame_section_bytes.is_empty() {
let eh_frame_idx = SectionIndex::from_u32(module_custom_sections.len() as u32);
module_custom_sections.push(CustomSection {
protection: CustomSectionProtection::Read,
alignment: None,
bytes: SectionBody::new_with_vec(eh_frame_section_bytes),
relocations: eh_frame_section_relocations,
});
unwind_info.eh_frame = Some(eh_frame_idx);
}
if !compact_unwind_section_bytes.is_empty() {
let cu_index = SectionIndex::from_u32(module_custom_sections.len() as u32);
module_custom_sections.push(CustomSection {
protection: CustomSectionProtection::Read,
alignment: None,
bytes: SectionBody::new_with_vec(compact_unwind_section_bytes),
relocations: compact_unwind_section_relocations,
});
unwind_info.compact_unwind = Some(cu_index);
}
let mut got = wasmer_compiler::types::function::GOT::empty();
if !got_targets.is_empty() {
let pointer_width = target
.triple()
.pointer_width()
.map_err(|_| CompileError::Codegen("Could not get pointer width".to_string()))?;
let got_entry_size = match pointer_width {
target_lexicon::PointerWidth::U64 => 8,
target_lexicon::PointerWidth::U32 => 4,
target_lexicon::PointerWidth::U16 => todo!(),
};
let got_entry_reloc_kind = match pointer_width {
target_lexicon::PointerWidth::U64 => RelocationKind::Abs8,
target_lexicon::PointerWidth::U32 => RelocationKind::Abs4,
target_lexicon::PointerWidth::U16 => todo!(),
};
let got_data: Vec<u8> = vec![0; got_targets.len() * got_entry_size];
let mut got_relocs = vec![];
for (i, target) in got_targets.into_iter().enumerate() {
got_relocs.push(wasmer_compiler::types::relocation::Relocation {
kind: got_entry_reloc_kind,
reloc_target: target,
offset: (i * got_entry_size) as u32,
addend: 0,
});
}
let got_idx = SectionIndex::from_u32(module_custom_sections.len() as u32);
module_custom_sections.push(CustomSection {
protection: CustomSectionProtection::Read,
alignment: None,
bytes: SectionBody::new_with_vec(got_data),
relocations: got_relocs,
});
got.index = Some(got_idx);
};
Ok(Compilation {
functions,
custom_sections: module_custom_sections,
function_call_trampolines,
dynamic_function_trampolines,
unwind_info,
got,
})
}
fn with_opts(
&mut self,
_suggested_compiler_opts: &wasmer_types::target::UserCompilerOptimizations,
) -> Result<(), CompileError> {
Ok(())
}
}