mod callgraph;
mod debug;
mod errors;
mod library;
mod module;
mod resolver;
mod rewrites;
mod symbols;
use alloc::{boxed::Box, collections::BTreeMap, string::ToString, sync::Arc, vec::Vec};
use core::{
cell::{Cell, RefCell},
ops::{ControlFlow, Index},
};
use miden_assembly_syntax::{
ast::{
self, Alias, AttributeSet, GlobalItemIndex, InvocationTarget, InvokeKind, ItemIndex,
Module, ModuleIndex, Path, SymbolResolution, Visibility, types,
},
debuginfo::{SourceManager, SourceSpan, Span, Spanned},
library::{ItemInfo, ModuleInfo},
};
use miden_core::{Word, advice::AdviceMap, program::Kernel};
use miden_project::Linkage;
use smallvec::{SmallVec, smallvec};
pub use self::{
callgraph::{CallGraph, CycleError},
errors::LinkerError,
library::{LinkLibrary, LinkLibraryKind},
resolver::{ResolverCache, SymbolResolutionContext, SymbolResolver},
symbols::{Symbol, SymbolItem},
};
use self::{
module::{LinkModule, ModuleSource},
resolver::*,
};
#[derive(Debug, Default, Copy, Clone, PartialEq, Eq)]
pub enum LinkStatus {
#[default]
Unlinked,
PartiallyLinked,
Linked,
}
#[derive(Clone)]
pub struct Linker {
libraries: BTreeMap<Word, LinkLibrary>,
modules: Vec<LinkModule>,
callgraph: CallGraph,
procedures_by_mast_root: BTreeMap<Word, SmallVec<[GlobalItemIndex; 1]>>,
kernel_index: Option<ModuleIndex>,
kernel: Kernel,
source_manager: Arc<dyn SourceManager>,
}
impl Linker {
pub fn new(source_manager: Arc<dyn SourceManager>) -> Self {
Self {
libraries: Default::default(),
modules: Default::default(),
callgraph: Default::default(),
procedures_by_mast_root: Default::default(),
kernel_index: None,
kernel: Default::default(),
source_manager,
}
}
pub fn link_library(&mut self, library: LinkLibrary) -> Result<(), LinkerError> {
use alloc::collections::btree_map::Entry;
match self.libraries.entry(library.mast.commitment()) {
Entry::Vacant(entry) => {
entry.insert(library.clone());
self.link_assembled_modules(library.module_infos)
},
Entry::Occupied(mut entry) => {
let prev = entry.get_mut();
if matches!(prev.linkage, Linkage::Dynamic) {
prev.linkage = library.linkage;
}
Ok(())
},
}
}
pub fn link_assembled_modules(
&mut self,
modules: impl IntoIterator<Item = ModuleInfo>,
) -> Result<(), LinkerError> {
for module in modules {
self.link_assembled_module(module)?;
}
Ok(())
}
pub fn link_assembled_module(
&mut self,
module: ModuleInfo,
) -> Result<ModuleIndex, LinkerError> {
log::debug!(target: "linker", "adding pre-assembled module {} to module graph", module.path());
let module_path = module.path();
let is_duplicate = self.find_module_index(module_path).is_some();
if is_duplicate {
return Err(LinkerError::DuplicateModule {
path: module_path.to_path_buf().into_boxed_path().into(),
});
}
let module_index = self.next_module_id();
let items = module.items();
let mut symbols = Vec::with_capacity(items.len());
for (idx, item) in items {
let gid = module_index + idx;
self.callgraph.get_or_insert_node(gid);
match &item {
ItemInfo::Procedure(item) => {
self.register_procedure_root(gid, item.digest)?;
},
ItemInfo::Constant(_) | ItemInfo::Type(_) => (),
}
symbols.push(Symbol::new(
item.name().clone(),
Visibility::Public,
LinkStatus::Linked,
SymbolItem::Compiled(item.clone()),
));
}
let link_module = LinkModule::new(
module_index,
ast::ModuleKind::Library,
LinkStatus::Linked,
ModuleSource::Mast,
module_path.into(),
)
.with_symbols(symbols);
self.modules.push(link_module);
Ok(module_index)
}
pub fn link_modules(
&mut self,
modules: impl IntoIterator<Item = Box<Module>>,
) -> Result<Vec<ModuleIndex>, LinkerError> {
modules.into_iter().map(|mut m| self.link_module(&mut m)).collect()
}
pub fn link_module(&mut self, module: &mut Module) -> Result<ModuleIndex, LinkerError> {
log::debug!(target: "linker", "adding unprocessed module {}", module.path());
let is_duplicate = self.find_module_index(module.path()).is_some();
if is_duplicate {
return Err(LinkerError::DuplicateModule { path: module.path().into() });
}
let module_index = self.next_module_id();
let symbols = {
core::mem::take(module.items_mut())
.into_iter()
.enumerate()
.map(|(idx, item)| {
let gid = module_index + ast::ItemIndex::new(idx);
self.callgraph.get_or_insert_node(gid);
Symbol::new(
item.name().clone(),
item.visibility(),
LinkStatus::Unlinked,
match item {
ast::Export::Alias(alias) => {
SymbolItem::Alias { alias, resolved: Cell::new(None) }
},
ast::Export::Type(item) => SymbolItem::Type(item),
ast::Export::Constant(item) => SymbolItem::Constant(item),
ast::Export::Procedure(item) => {
SymbolItem::Procedure(RefCell::new(Box::new(item)))
},
},
)
})
.collect()
};
let link_module = LinkModule::new(
module_index,
module.kind(),
LinkStatus::Unlinked,
ModuleSource::Ast,
module.path().into(),
)
.with_advice_map(module.advice_map().clone())
.with_symbols(symbols);
self.modules.push(link_module);
Ok(module_index)
}
#[inline]
fn next_module_id(&self) -> ModuleIndex {
ModuleIndex::new(self.modules.len())
}
}
impl Linker {
pub(super) fn with_kernel(
source_manager: Arc<dyn SourceManager>,
kernel: Kernel,
kernel_module: ModuleInfo,
) -> Self {
assert!(!kernel.is_empty());
assert!(
kernel_module.path().is_kernel_path(),
"invalid root kernel module path: {}",
kernel_module.path()
);
log::debug!(target: "linker", "instantiating linker with kernel {}", kernel_module.path());
let mut graph = Self::new(source_manager);
let kernel_index = graph
.link_assembled_module(kernel_module)
.expect("failed to add kernel module to the module graph");
graph.kernel_index = Some(kernel_index);
graph.kernel = kernel;
graph
}
pub(super) fn link_with_kernel(
&mut self,
kernel: Kernel,
kernel_module: ModuleInfo,
) -> Result<(), LinkerError> {
assert!(self.kernel.is_empty());
assert!(!kernel.is_empty());
assert!(
kernel_module.path().is_kernel_path(),
"invalid root kernel module path: {}",
kernel_module.path()
);
log::debug!(target: "linker", "modifying linker with kernel {}", kernel_module.path());
let kernel_index = self.link_assembled_module(kernel_module)?;
self.kernel_index = Some(kernel_index);
self.kernel = kernel;
Ok(())
}
pub fn kernel(&self) -> &Kernel {
&self.kernel
}
pub fn has_nonempty_kernel(&self) -> bool {
self.kernel_index.is_some() || !self.kernel.is_empty()
}
}
impl Linker {
pub fn link(
&mut self,
modules: impl IntoIterator<Item = Box<Module>>,
) -> Result<Vec<ModuleIndex>, LinkerError> {
let module_indices = self.link_modules(modules)?;
self.link_and_rewrite()?;
Ok(module_indices)
}
pub fn link_kernel(
&mut self,
mut kernel: Box<Module>,
) -> Result<Vec<ModuleIndex>, LinkerError> {
let module_index = self.link_module(&mut kernel)?;
for module in self.modules.iter_mut().take(module_index.as_usize()) {
if matches!(module.source(), ModuleSource::Ast) {
module.set_kind(ast::ModuleKind::Kernel);
}
}
self.kernel_index = Some(module_index);
self.link_and_rewrite()?;
Ok(vec![module_index])
}
fn link_and_rewrite(&mut self) -> Result<(), LinkerError> {
log::debug!(
target: "linker",
"processing {} unlinked/partially-linked modules, and recomputing module graph",
self.modules.iter().filter(|m| !m.is_linked()).count()
);
if self.modules.is_empty() {
return Err(LinkerError::Empty);
}
if self.modules.iter().all(|m| m.is_linked()) {
return Ok(());
}
let resolver = SymbolResolver::new(self);
let mut edges = Vec::new();
let mut cache = ResolverCache::default();
for (module_index, module) in self.modules.iter().enumerate() {
if !module.is_unlinked() {
continue;
}
let module_index = ModuleIndex::new(module_index);
for (symbol_idx, symbol) in module.symbols().enumerate() {
assert!(
symbol.is_unlinked(),
"an unlinked module should only have unlinked symbols"
);
let gid = module_index + ItemIndex::new(symbol_idx);
rewrites::rewrite_symbol(gid, symbol, &resolver, &mut cache)?;
match symbol.item() {
SymbolItem::Compiled(_) | SymbolItem::Type(_) | SymbolItem::Constant(_) => (),
SymbolItem::Alias { alias, resolved } => {
if let Some(resolved) = resolved.get() {
log::debug!(target: "linker", " | resolved alias {} to item {resolved}", alias.target());
if self[resolved].is_procedure() {
edges.push((gid, resolved));
}
} else {
log::debug!(target: "linker", " | resolving alias {}..", alias.target());
let context = SymbolResolutionContext {
span: alias.target().span(),
module: module_index,
kind: None,
};
if let Some(callee) =
resolver.resolve_alias_target(&context, alias)?.into_global_id()
{
log::debug!(
target: "linker",
" | resolved alias to gid {:?}:{:?}",
callee.module,
callee.index
);
edges.push((gid, callee));
resolved.set(Some(callee));
}
}
},
SymbolItem::Procedure(proc) => {
let proc = proc.borrow();
for invoke in proc.invoked() {
log::debug!(target: "linker", " | recording {} dependency on {}", invoke.kind, &invoke.target);
let context = SymbolResolutionContext {
span: invoke.span(),
module: module_index,
kind: None,
};
if let Some(callee) = resolver
.resolve_invoke_target(&context, &invoke.target)?
.into_global_id()
{
log::debug!(
target: "linker",
" | resolved dependency to gid {}:{}",
callee.module.as_usize(),
callee.index.as_usize()
);
edges.push((gid, callee));
}
}
},
}
}
module.set_status(LinkStatus::Linked);
}
edges
.into_iter()
.for_each(|(caller, callee)| self.callgraph.add_edge(caller, callee));
self.callgraph.toposort().map_err(|cycle| {
let iter = cycle.into_node_ids();
let mut nodes = Vec::with_capacity(iter.len());
for node in iter {
let module = self[node.module].path();
let item = self[node].name();
nodes.push(module.join(item).to_string());
}
LinkerError::Cycle { nodes: nodes.into() }
})?;
Ok(())
}
}
impl Linker {
pub fn libraries(&self) -> impl Iterator<Item = &LinkLibrary> {
self.libraries.values()
}
pub fn topological_sort_from_root(
&self,
caller: GlobalItemIndex,
) -> Result<Vec<GlobalItemIndex>, CycleError> {
self.callgraph.toposort_caller(caller)
}
pub fn get_procedure_index_by_digest(
&self,
procedure_digest: &Word,
) -> Option<GlobalItemIndex> {
self.procedures_by_mast_root.get(procedure_digest).map(|indices| indices[0])
}
pub fn resolve_invoke_target(
&self,
caller: &SymbolResolutionContext,
target: &InvocationTarget,
) -> Result<SymbolResolution, LinkerError> {
let resolver = SymbolResolver::new(self);
resolver.resolve_invoke_target(caller, target)
}
pub fn resolve_alias_target(
&self,
caller: &SymbolResolutionContext,
target: &Alias,
) -> Result<SymbolResolution, LinkerError> {
let resolver = SymbolResolver::new(self);
resolver.resolve_alias_target(caller, target)
}
pub fn resolve_path(
&self,
caller: &SymbolResolutionContext,
path: &Path,
) -> Result<SymbolResolution, LinkerError> {
let resolver = SymbolResolver::new(self);
resolver.resolve_path(caller, Span::new(caller.span, path))
}
pub(super) fn resolve_signature(
&self,
gid: GlobalItemIndex,
) -> Result<Option<Arc<types::FunctionType>>, LinkerError> {
match self[gid].item() {
SymbolItem::Compiled(ItemInfo::Procedure(proc)) => Ok(proc.signature.clone()),
SymbolItem::Procedure(proc) => {
let proc = proc.borrow();
match proc.signature() {
Some(ty) => self.translate_function_type(gid.module, ty).map(Some),
None => Ok(None),
}
},
SymbolItem::Alias { alias, resolved } => {
if let Some(resolved) = resolved.get() {
return self.resolve_signature(resolved);
}
let context = SymbolResolutionContext {
span: alias.target().span(),
module: gid.module,
kind: Some(InvokeKind::ProcRef),
};
let resolution = self.resolve_alias_target(&context, alias)?;
match resolution {
SymbolResolution::MastRoot(_) => Ok(None),
SymbolResolution::Exact { gid, .. } => self.resolve_signature(gid),
SymbolResolution::Module { .. }
| SymbolResolution::Local(_)
| SymbolResolution::External(_) => unreachable!(),
}
},
SymbolItem::Compiled(_) | SymbolItem::Constant(_) | SymbolItem::Type(_) => {
panic!("procedure index unexpectedly refers to non-procedure item")
},
}
}
fn translate_function_type(
&self,
module_index: ModuleIndex,
ty: &ast::FunctionType,
) -> Result<Arc<types::FunctionType>, LinkerError> {
use miden_assembly_syntax::ast::TypeResolver;
let cc = ty.cc;
let mut args = Vec::with_capacity(ty.args.len());
let symbol_resolver = SymbolResolver::new(self);
let mut cache = ResolverCache::default();
let mut resolver = Resolver {
resolver: &symbol_resolver,
cache: &mut cache,
current_module: module_index,
};
for arg in ty.args.iter() {
if let Some(arg) = resolver.resolve(arg)? {
args.push(arg);
} else {
let span = arg.span();
return Err(LinkerError::UndefinedType {
span,
source_file: self.source_manager.get(span.source_id()).ok(),
});
}
}
let mut results = Vec::with_capacity(ty.results.len());
for result in ty.results.iter() {
if let Some(result) = resolver.resolve(result)? {
results.push(result);
} else {
let span = result.span();
return Err(LinkerError::UndefinedType {
span,
source_file: self.source_manager.get(span.source_id()).ok(),
});
}
}
Ok(Arc::new(types::FunctionType::new(cc, args, results)))
}
pub(super) fn resolve_attributes(
&self,
gid: GlobalItemIndex,
) -> Result<AttributeSet, LinkerError> {
match self[gid].item() {
SymbolItem::Compiled(ItemInfo::Procedure(proc)) => Ok(proc.attributes.clone()),
SymbolItem::Procedure(proc) => {
let proc = proc.borrow();
Ok(proc.attributes().clone())
},
SymbolItem::Alias { alias, resolved } => {
if let Some(resolved) = resolved.get() {
return self.resolve_attributes(resolved);
}
let context = SymbolResolutionContext {
span: alias.target().span(),
module: gid.module,
kind: Some(InvokeKind::ProcRef),
};
let resolution = self.resolve_alias_target(&context, alias)?;
match resolution {
SymbolResolution::MastRoot(_)
| SymbolResolution::Local(_)
| SymbolResolution::External(_) => Ok(AttributeSet::default()),
SymbolResolution::Exact { gid, .. } => self.resolve_attributes(gid),
SymbolResolution::Module { .. } => {
unreachable!("expected resolver to raise error")
},
}
},
SymbolItem::Compiled(_) | SymbolItem::Constant(_) | SymbolItem::Type(_) => {
panic!("procedure index unexpectedly refers to non-procedure item")
},
}
}
pub(super) fn resolve_type(
&self,
span: SourceSpan,
gid: GlobalItemIndex,
) -> Result<ast::types::Type, LinkerError> {
use miden_assembly_syntax::ast::TypeResolver;
let symbol_resolver = SymbolResolver::new(self);
let mut cache = ResolverCache::default();
let mut resolver = Resolver {
cache: &mut cache,
resolver: &symbol_resolver,
current_module: gid.module,
};
resolver.get_type(span, gid)
}
pub(crate) fn register_procedure_root(
&mut self,
id: GlobalItemIndex,
procedure_mast_root: Word,
) -> Result<(), LinkerError> {
use alloc::collections::btree_map::Entry;
match self.procedures_by_mast_root.entry(procedure_mast_root) {
Entry::Occupied(ref mut entry) => {
let prev_id = entry.get()[0];
if prev_id != id {
entry.get_mut().push(id);
}
},
Entry::Vacant(entry) => {
entry.insert(smallvec![id]);
},
}
Ok(())
}
pub fn find_module_index(&self, path: &Path) -> Option<ModuleIndex> {
self.modules.iter().position(|m| path == m.path()).map(ModuleIndex::new)
}
pub fn find_module(&self, path: &Path) -> Option<&LinkModule> {
self.modules.iter().find(|m| path == m.path())
}
}
impl Linker {
pub(super) fn const_eval(
&self,
gid: GlobalItemIndex,
expr: &ast::ConstantExpr,
cache: &mut ResolverCache,
) -> Result<ast::ConstantValue, LinkerError> {
let symbol_resolver = SymbolResolver::new(self);
let mut resolver = Resolver {
resolver: &symbol_resolver,
cache,
current_module: gid.module,
};
ast::constants::eval::expr(expr, &mut resolver).map(|expr| expr.expect_value())
}
}
impl Index<ModuleIndex> for Linker {
type Output = LinkModule;
fn index(&self, index: ModuleIndex) -> &Self::Output {
&self.modules[index.as_usize()]
}
}
impl Index<GlobalItemIndex> for Linker {
type Output = Symbol;
fn index(&self, index: GlobalItemIndex) -> &Self::Output {
&self.modules[index.module.as_usize()][index.index]
}
}