miden_assembly/ast/ident.rs
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185
use alloc::{string::ToString, sync::Arc};
use core::{
fmt,
hash::{Hash, Hasher},
str::FromStr,
};
use crate::{SourceSpan, Span, Spanned};
/// Represents the types of errors that can occur when parsing/validating an [Ident]
///
/// NOTE(review): several messages below say "lowercase", but [Ident::validate] accepts any ASCII
/// alphabetic character (upper- or lowercase). Confirm which of the two is the intended rule.
#[derive(Debug, thiserror::Error, PartialEq, Eq)]
pub enum IdentError {
/// The identifier was the empty string.
///
/// Returned by [Ident::validate] when its input contains no characters.
#[error("invalid identifier: cannot be empty")]
Empty,
/// The identifier contains a character outside the accepted set.
///
/// Returned by [Ident::validate] when any character is neither ASCII alphabetic, an ASCII
/// digit, nor an underscore. `ident` carries a copy of the rejected input.
#[error("invalid identifier '{ident}': must contain only lowercase, ascii alphanumeric characters, or underscores")]
InvalidChars { ident: Arc<str> },
/// The first character of the identifier is not allowed in leading position.
///
/// Returned by [Ident::validate] when the input does not start with an ASCII alphabetic
/// character.
#[error("invalid identifier: must start with lowercase ascii alphabetic character")]
InvalidStart,
/// The identifier is longer than `max` bytes.
///
/// Not produced by [Ident::validate]; presumably raised by other identifier types that
/// enforce a length limit (verify against callers).
#[error("invalid identifier: length exceeds the maximum of {max} bytes")]
InvalidLength { max: usize },
/// The identifier does not follow the casing convention described by the wrapped
/// [CaseKindError].
///
/// Not produced by [Ident::validate]; presumably raised by callers that expect a specific
/// casing (verify against callers).
#[error("invalid identifier: {0}")]
Casing(CaseKindError),
}
/// Represents the various types of casing errors that can occur, e.g. using an identifier
/// with `SCREAMING_CASE` where one with `snake_case` is expected.
///
/// Each variant names the casing convention that was expected; its message describes the
/// characters that convention permits. Values of this type are wrapped by
/// [IdentError::Casing].
#[derive(Debug, thiserror::Error, PartialEq, Eq)]
pub enum CaseKindError {
/// An identifier in `SCREAMING_CASE` was expected: uppercase characters or underscores,
/// starting with an alphabetic character.
#[error("only uppercase characters or underscores are allowed, and must start with an alphabetic character")]
Screaming,
/// An identifier in `snake_case` was expected: lowercase characters or underscores, starting
/// with an alphabetic character.
#[error("only lowercase characters or underscores are allowed, and must start with an alphabetic character")]
Snake,
/// An identifier in `camelCase` was expected: alphanumeric characters only, starting with a
/// lowercase alphabetic character.
#[error("only alphanumeric characters are allowed, and must start with a lowercase alphabetic character")]
Camel,
}
/// Represents a generic identifier in Miden Assembly source code.
///
/// This type is used internally by all other specialized identifier types, e.g.
/// [super::ProcedureName], and enforces the baseline rules for bare identifiers in Miden Assembly.
/// Higher-level types, such as `ProcedureName`, can implement their own variations on these rules,
/// and construct an [Ident] using [Ident::new_unchecked].
///
/// All identifiers are associated with a source span, and are interned to the extent possible, i.e.
/// rather than allocating a new `String` for every use of the same identifier, we attempt to have
/// all such uses share a single reference-counted allocation. This interning is not perfect or
/// guaranteed globally, but generally holds within a given module. In the future we may make these
/// actually interned strings with a global interner, but for now it is simply best-effort.
///
/// NOTE: The `PartialEq`, `Ord`, and `Hash` implementations for this type consider only the
/// identifier's name; the source span is ignored, so the same name used at two different
/// locations compares equal. The `Debug` output likewise shows only the name.
#[derive(Clone)]
pub struct Ident {
/// The source span associated with this identifier.
///
/// NOTE: To make use of this span, we need to know the context in which it was used, i.e.,
/// either the containing module or procedure, both of which have a source file which we can
/// use to render a source snippet for this span.
///
/// If a span is not known, the default value is used, which has zero-length and thus will not
/// be rendered as a source snippet.
span: SourceSpan,
/// The actual content of the identifier
///
/// Stored as a reference-counted string so that cloning an [Ident] shares the allocation
/// instead of copying the text.
name: Arc<str>,
}
impl Ident {
/// Parses an [Ident] from `source`.
pub fn new(source: impl AsRef<str>) -> Result<Self, IdentError> {
source.as_ref().parse()
}
/// Parses an [Ident] from `source`.
pub fn new_with_span(span: SourceSpan, source: impl AsRef<str>) -> Result<Self, IdentError> {
source.as_ref().parse::<Self>().map(|id| id.with_span(span))
}
/// Sets the span for this identifier.
pub fn with_span(mut self, span: SourceSpan) -> Self {
self.span = span;
self
}
/// This allows constructing an [Ident] directly from a ref-counted string that is known to be
/// a valid identifier, and so does not require re-parsing/re-validating. This must _not_ be
/// used to bypass validation when you have an identifier that is not valid, and such
/// identifiers will be caught during compilation and result in a panic being raised.
///
/// NOTE: This function is perma-unstable, it may be removed or modified at any time.
pub fn new_unchecked(name: Span<Arc<str>>) -> Self {
let (span, name) = name.into_parts();
Self { span, name }
}
/// Unwraps this [Ident], extracting the inner [`Arc<str>`].
pub fn into_inner(self) -> Arc<str> {
self.name
}
/// Returns the content of this identifier as a `str`.
pub fn as_str(&self) -> &str {
self.name.as_ref()
}
/// Applies the default [Ident] validation rules to `source`.
pub fn validate(source: impl AsRef<str>) -> Result<(), IdentError> {
let source = source.as_ref();
if source.is_empty() {
return Err(IdentError::Empty);
}
if !source.starts_with(|c: char| c.is_ascii_alphabetic()) {
return Err(IdentError::InvalidStart);
}
if !source.chars().all(|c| c.is_ascii_alphabetic() || matches!(c, '_' | '0'..='9')) {
return Err(IdentError::InvalidChars { ident: source.into() });
}
Ok(())
}
}
/// Debug output has the shape of a tuple struct, `Ident(<name>)`; the span is not shown.
impl fmt::Debug for Ident {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let mut tuple = f.debug_tuple("Ident");
        tuple.field(&self.name);
        tuple.finish()
    }
}
/// Two identifiers are equal when their names are equal; spans do not participate.
impl PartialEq for Ident {
    fn eq(&self, other: &Self) -> bool {
        let (Self { name: lhs, .. }, Self { name: rhs, .. }) = (self, other);
        lhs == rhs
    }
}

impl Eq for Ident {}
/// Identifiers are ordered by their names, using the ordering of `str`; spans do not
/// participate.
impl Ord for Ident {
    fn cmp(&self, other: &Self) -> core::cmp::Ordering {
        let lhs: &str = &self.name;
        let rhs: &str = &other.name;
        lhs.cmp(rhs)
    }
}
/// The partial order is the total order given by the [Ord] implementation, so the result is
/// always `Some`.
impl PartialOrd for Ident {
    fn partial_cmp(&self, other: &Self) -> Option<core::cmp::Ordering> {
        Some(Ord::cmp(self, other))
    }
}
/// Only the name is fed to the hasher, matching the [PartialEq] implementation, which also
/// ignores the span.
impl Hash for Ident {
    fn hash<H: Hasher>(&self, state: &mut H) {
        let Self { name, .. } = self;
        name.hash(state);
    }
}
/// Exposes the source span stored alongside the identifier's name.
impl Spanned for Ident {
    fn span(&self) -> SourceSpan {
        let Self { span, .. } = self;
        *span
    }
}
/// Lets an [Ident] be used wherever a `&str` is expected by dereferencing to its name.
impl core::ops::Deref for Ident {
    type Target = str;

    fn deref(&self) -> &Self::Target {
        &*self.name
    }
}
/// Borrows the identifier's name as a `str`.
impl AsRef<str> for Ident {
    #[inline]
    fn as_ref(&self) -> &str {
        self.as_str()
    }
}
/// Displays the identifier's name exactly as `str` would be displayed, honoring any formatter
/// flags; the span is not shown.
impl fmt::Display for Ident {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let text: &str = &self.name;
        fmt::Display::fmt(text, f)
    }
}
impl FromStr for Ident {
type Err = IdentError;
fn from_str(s: &str) -> Result<Self, Self::Err> {
Self::validate(s)?;
let name = Arc::from(s.to_string().into_boxed_str());
Ok(Self { span: SourceSpan::default(), name })
}
}