// typst_syntax/span.rs
use std::fmt::{self, Debug, Formatter};
use std::num::NonZeroU64;
use std::ops::Range;
use ecow::EcoString;
use crate::FileId;
/// A unique identifier for a syntax node.
///
/// This is used throughout the compiler to track which source section an error
/// or element stems from. It can be [mapped back](crate::Source::range) to a
/// byte range for user-facing display.
///
/// During editing, the span values stay mostly stable, even for nodes behind an
/// insertion. This is not true for simple ranges, as they would shift. Spans can
/// therefore be used as inputs to memoized functions without hurting cache
/// performance when text is inserted somewhere in the document other than the
/// end.
///
/// Span ids are ordered in the syntax tree to enable quickly finding the node
/// with some id:
/// - The id of a parent is always smaller than the ids of any of its children.
/// - The id of a node is always greater than any id in the subtrees of any left
///   sibling and smaller than any id in the subtrees of any right sibling.
///
/// One raw value is reserved for the *detached* span, which does not point
/// into any source file (see [`Span::detached`]).
///
/// This type takes up 8 bytes and is null-optimized (i.e. `Option<Span>` also
/// takes 8 bytes), because the wrapped integer is a `NonZeroU64`.
#[derive(Debug, Copy, Clone, Eq, PartialEq, Hash)]
pub struct Span(NonZeroU64);
impl Span {
    /// The full range of numbers available for span numbering.
    ///
    /// Starts at 2 so that a regular span never collides with the raw value
    /// reserved for the detached span.
    pub(super) const FULL: Range<u64> = 2..(1 << Self::BITS);

    /// The value reserved for the detached span.
    const DETACHED: u64 = 1;

    /// The number of low bits that store the span number.
    ///
    /// Data layout:
    /// | 16 bits source id | 48 bits number |
    const BITS: usize = 48;

    /// Create a new span from a source id and a unique number.
    ///
    /// Returns `None` if `number` is not contained in `FULL`.
    pub(super) const fn new(id: FileId, number: u64) -> Option<Self> {
        // `Range::contains` is not usable in a `const fn`, so compare manually.
        let in_range = Self::FULL.start <= number && number < Self::FULL.end;
        if !in_range {
            return None;
        }

        // The file id occupies the high bits, the number the low bits.
        let file_bits = (id.into_raw() as u64) << Self::BITS;
        if let Some(raw) = NonZeroU64::new(file_bits | number) {
            Some(Self(raw))
        } else {
            // `number` is at least `FULL.start`, so the packed value is nonzero.
            unreachable!()
        }
    }

    /// Create a span that does not point into any source file.
    pub const fn detached() -> Self {
        if let Some(raw) = NonZeroU64::new(Self::DETACHED) {
            Self(raw)
        } else {
            // `DETACHED` is a nonzero constant.
            unreachable!()
        }
    }

    /// Whether the span is detached.
    pub const fn is_detached(self) -> bool {
        Self::DETACHED == self.0.get()
    }

    /// The id of the source file the span points into.
    ///
    /// Returns `None` if the span is detached.
    pub const fn id(self) -> Option<FileId> {
        if self.is_detached() {
            None
        } else {
            // Shift the number away; what remains is the 16-bit file id.
            let raw_id = (self.0.get() >> Self::BITS) as u16;
            Some(FileId::from_raw(raw_id))
        }
    }

    /// The unique number of the span within its [`Source`](crate::Source).
    pub const fn number(self) -> u64 {
        // Keep only the low `BITS` bits.
        let mask: u64 = (1 << Self::BITS) - 1;
        self.0.get() & mask
    }

    /// Return `other` if `self` is detached and `self` otherwise.
    pub fn or(self, other: Self) -> Self {
        match self.is_detached() {
            true => other,
            false => self,
        }
    }

    /// Find the first non-detached span in the iterator.
    ///
    /// Returns the detached span if the iterator yields no attached span.
    pub fn find(iter: impl IntoIterator<Item = Self>) -> Self {
        for candidate in iter {
            if !candidate.is_detached() {
                return candidate;
            }
        }
        Self::detached()
    }

    /// Resolve a file location relative to this span's source.
    ///
    /// Returns an error message if the span is detached, since there is then
    /// no file to resolve against.
    pub fn resolve_path(self, path: &str) -> Result<FileId, EcoString> {
        match self.id() {
            Some(file) => Ok(file.join(path)),
            None => Err("cannot access file system from here".into()),
        }
    }
}
/// A value with a span locating it in the source code.
///
/// `Debug` is intentionally not derived: it is implemented by hand for this
/// type and prints only the wrapped value, omitting the span.
#[derive(Copy, Clone, Eq, PartialEq, Hash)]
pub struct Spanned<T> {
    /// The spanned value.
    pub v: T,
    /// The value's location in source code.
    pub span: Span,
}
impl<T> Spanned<T> {
/// Create a new instance from a value and its span.
pub fn new(v: T, span: Span) -> Self {
Self { v, span }
}
/// Convert from `&Spanned<T>` to `Spanned<&T>`
pub fn as_ref(&self) -> Spanned<&T> {
Spanned { v: &self.v, span: self.span }
}
/// Map the value using a function.
pub fn map<F, U>(self, f: F) -> Spanned<U>
where
F: FnOnce(T) -> U,
{
Spanned { v: f(self.v), span: self.span }
}
}
/// Debug-formats only the wrapped value; the span is not printed.
impl<T> Debug for Spanned<T>
where
    T: Debug,
{
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        Debug::fmt(&self.v, f)
    }
}
#[cfg(test)]
mod tests {
    use crate::{FileId, Span};

    /// A span must round-trip the file id and number it was built from.
    #[test]
    fn test_span_encoding() {
        let id = FileId::from_raw(5);
        let span = Span::new(id, 10).unwrap();
        assert_eq!(span.id(), Some(id));
        assert_eq!(span.number(), 10);
    }

    /// `Span::new` accepts exactly the numbers inside `Span::FULL`.
    #[test]
    fn test_span_number_bounds() {
        let id = FileId::from_raw(5);

        // Numbers below the start of the range (including the reserved
        // detached value 1) and at or past its end are rejected.
        assert!(Span::new(id, 0).is_none());
        assert!(Span::new(id, 1).is_none());
        assert!(Span::new(id, Span::FULL.end).is_none());

        // Both ends of the valid range round-trip.
        let lowest = Span::new(id, Span::FULL.start).unwrap();
        assert_eq!(lowest.id(), Some(id));
        assert_eq!(lowest.number(), Span::FULL.start);

        let highest = Span::new(id, Span::FULL.end - 1).unwrap();
        assert_eq!(highest.id(), Some(id));
        assert_eq!(highest.number(), Span::FULL.end - 1);
    }

    /// The detached span has no file id and yields to attached spans.
    #[test]
    fn test_span_detached() {
        let detached = Span::detached();
        let span = Span::new(FileId::from_raw(5), 10).unwrap();

        assert!(detached.is_detached());
        assert_eq!(detached.id(), None);
        assert!(!span.is_detached());

        assert_eq!(detached.or(span), span);
        assert_eq!(span.or(detached), span);

        assert_eq!(Span::find([detached, span, detached]), span);
        assert_eq!(Span::find([detached]), detached);
        assert!(Span::find(std::iter::empty()).is_detached());
    }
}