rune/
source.rs

1//! Module for dealing with sources.
2//!
3//! The primary type in here is the [`Source`] struct, which holds onto all
4//! metadata necessary related to a source in order to build it.
5//!
6//! Sources are stored in the [`Sources`] collection.
7//!
8//! [`Sources`]: crate::sources::Sources
9
10#[cfg(feature = "emit")]
11use core::cmp;
12use core::fmt;
13use core::iter;
14#[cfg(feature = "emit")]
15use core::ops::Range;
16use core::slice;
17
18use crate as rune;
19#[cfg(feature = "std")]
20use crate::alloc::borrow::Cow;
21use crate::alloc::path::Path;
22use crate::alloc::prelude::*;
23use crate::alloc::{self, Box};
24
25#[cfg(feature = "emit")]
26use crate::ast::Span;
27
28/// Error raised when constructing a source.
29#[derive(Debug)]
30pub struct FromPathError {
31    kind: FromPathErrorKind,
32}
33
34impl From<alloc::Error> for FromPathError {
35    fn from(error: alloc::Error) -> Self {
36        Self {
37            kind: FromPathErrorKind::Alloc(error),
38        }
39    }
40}
41
42cfg_std! {
43    impl From<std::io::Error> for FromPathError {
44        fn from(error: std::io::Error) -> Self {
45            Self {
46                kind: FromPathErrorKind::Io(error),
47            }
48        }
49    }
50}
51
52impl fmt::Display for FromPathError {
53    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
54        match &self.kind {
55            FromPathErrorKind::Alloc(error) => error.fmt(f),
56            #[cfg(feature = "std")]
57            FromPathErrorKind::Io(error) => error.fmt(f),
58        }
59    }
60}
61
62#[derive(Debug)]
63enum FromPathErrorKind {
64    Alloc(alloc::Error),
65    #[cfg(feature = "std")]
66    Io(std::io::Error),
67}
68
69impl core::error::Error for FromPathError {
70    fn source(&self) -> Option<&(dyn core::error::Error + 'static)> {
71        match &self.kind {
72            FromPathErrorKind::Alloc(error) => Some(error),
73            #[cfg(feature = "std")]
74            FromPathErrorKind::Io(error) => Some(error),
75        }
76    }
77}
78
79/// A single source file.
80#[derive(Default, TryClone)]
81pub struct Source {
82    /// The name of the source.
83    name: SourceName,
84    /// The source string.
85    source: Box<str>,
86    /// The path the source was loaded from.
87    path: Option<Box<Path>>,
88    /// The starting byte indices in the source code.
89    line_starts: Box<[usize]>,
90}
91
92impl Source {
93    /// Construct a new source with the given name.
94    pub fn new(name: impl AsRef<str>, source: impl AsRef<str>) -> alloc::Result<Self> {
95        let name = Box::try_from(name.as_ref())?;
96        let source = source.as_ref();
97        let line_starts = line_starts(source).try_collect::<Box<[_]>>()?;
98
99        Ok(Self {
100            name: SourceName::Name(name),
101            source: source.try_into()?,
102            path: None,
103            line_starts,
104        })
105    }
106
107    /// Construct a new anonymously named `<memory>` source.
108    ///
109    /// # Examples
110    ///
111    /// ```
112    /// use rune::Source;
113    ///
114    /// let source = Source::memory("pub fn main() { 42 }")?;
115    /// assert_eq!(source.name(), "<memory>");
116    /// # Ok::<_, rune::support::Error>(())
117    /// ```
118    pub fn memory(source: impl AsRef<str>) -> alloc::Result<Self> {
119        let source = source.as_ref();
120        let line_starts = line_starts(source).try_collect::<Box<[_]>>()?;
121
122        Ok(Self {
123            name: SourceName::Memory,
124            source: source.try_into()?,
125            path: None,
126            line_starts,
127        })
128    }
129
130    cfg_std! {
131        /// Read and load a source from the given filesystem path.
132        pub fn from_path(path: impl AsRef<Path>) -> Result<Self, FromPathError> {
133            let name = Box::try_from(Cow::try_from(path.as_ref().to_string_lossy())?)?;
134            let source = Box::try_from(std::fs::read_to_string(path.as_ref())?)?;
135            let path = Some(path.as_ref().try_into()?);
136            let line_starts = line_starts(source.as_ref()).try_collect::<Box<[_]>>()?;
137
138            Ok(Self {
139                name: SourceName::Name(name),
140                source,
141                path,
142                line_starts,
143            })
144        }
145    }
146
147    /// Construct a new source with the given content and path.
148    ///
149    /// # Examples
150    ///
151    /// ```
152    /// use std::path::Path;
153    /// use rune::Source;
154    ///
155    /// let source = Source::with_path("test", "pub fn main() { 42 }", "test.rn")?;
156    /// assert_eq!(source.name(), "test");
157    /// assert_eq!(source.path(), Some(Path::new("test.rn")));
158    /// # Ok::<_, rune::support::Error>(())
159    /// ```
160    pub fn with_path(
161        name: impl AsRef<str>,
162        source: impl AsRef<str>,
163        path: impl AsRef<Path>,
164    ) -> alloc::Result<Self> {
165        let name = Box::try_from(name.as_ref())?;
166        let source = Box::try_from(source.as_ref())?;
167        let path = Some(path.as_ref().try_into()?);
168        let line_starts = line_starts(source.as_ref()).try_collect::<Box<[_]>>()?;
169
170        Ok(Self {
171            name: SourceName::Name(name),
172            source,
173            path,
174            line_starts,
175        })
176    }
177
178    /// Access all line starts in the source.
179    #[cfg(feature = "emit")]
180    pub(crate) fn line_starts(&self) -> &[usize] {
181        &self.line_starts
182    }
183
184    /// Get the name of the source.
185    pub fn name(&self) -> &str {
186        match &self.name {
187            SourceName::Memory => "<memory>",
188            SourceName::Name(name) => name,
189        }
190    }
191
192    ///  et the given range from the source.
193    pub(crate) fn get<I>(&self, i: I) -> Option<&I::Output>
194    where
195        I: slice::SliceIndex<str>,
196    {
197        self.source.get(i)
198    }
199
200    /// Access the underlying string for the source.
201    pub(crate) fn as_str(&self) -> &str {
202        &self.source
203    }
204
205    /// Get the path associated with the source.
206    ///
207    /// # Examples
208    ///
209    /// ```
210    /// use std::path::Path;
211    /// use rune::Source;
212    ///
213    /// let source = Source::with_path("test", "pub fn main() { 42 }", "test.rn")?;
214    /// assert_eq!(source.name(), "test");
215    /// assert_eq!(source.path(), Some(Path::new("test.rn")));
216    /// # Ok::<_, rune::support::Error>(())
217    /// ```
218    pub fn path(&self) -> Option<&Path> {
219        self.path.as_deref()
220    }
221
222    /// Convert the given offset to a utf-16 line and character.
223    #[cfg(feature = "languageserver")]
224    pub(crate) fn pos_to_utf16cu_linecol(&self, offset: usize) -> (usize, usize) {
225        let (line, offset, rest) = self.position(offset);
226
227        let col = rest
228            .char_indices()
229            .flat_map(|(n, c)| (n < offset).then(|| c.encode_utf16(&mut [0u16; 2]).len()))
230            .sum();
231
232        (line, col)
233    }
234
235    /// Convert the given offset to a utf-16 line and character.
236    pub fn pos_to_utf8_linecol(&self, offset: usize) -> (usize, usize) {
237        let (line, offset, rest) = self.position(offset);
238        let col = rest.char_indices().take_while(|&(n, _)| n < offset).count();
239        (line, col)
240    }
241
242    /// Get the line index for the given byte.
243    #[cfg(feature = "emit")]
244    pub(crate) fn line_index(&self, byte_index: usize) -> usize {
245        self.line_starts
246            .binary_search(&byte_index)
247            .unwrap_or_else(|next_line| next_line.saturating_sub(1))
248    }
249
250    /// Get the range corresponding to the given line index.
251    #[cfg(feature = "emit")]
252    pub(crate) fn line_range(&self, line_index: usize) -> Option<Range<usize>> {
253        let line_start = self.line_start(line_index)?;
254        let next_line_start = self.line_start(line_index.saturating_add(1))?;
255        Some(line_start..next_line_start)
256    }
257
258    /// Get the number of lines in the source.
259    #[cfg(feature = "emit")]
260    pub(crate) fn line_count(&self) -> usize {
261        self.line_starts.len()
262    }
263
264    /// Access the line number of content that starts with the given span.
265    #[cfg(feature = "emit")]
266    pub(crate) fn line(&self, span: Span) -> Option<(usize, usize, [&str; 3])> {
267        let from = span.range();
268        let (lin, col) = self.pos_to_utf8_linecol(from.start);
269        let line = self.line_range(lin)?;
270
271        let start = from.start.checked_sub(line.start)?;
272        let end = from.end.checked_sub(line.start)?;
273
274        let text = self.source.get(line)?;
275        let prefix = text.get(..start)?;
276        let mid = text.get(start..end)?;
277        let suffix = text.get(end..)?;
278
279        Some((lin, col, [prefix, mid, suffix]))
280    }
281
282    fn position(&self, offset: usize) -> (usize, usize, &str) {
283        if offset == 0 {
284            return Default::default();
285        }
286
287        let line = match self.line_starts.binary_search(&offset) {
288            Ok(exact) => exact,
289            Err(0) => return Default::default(),
290            Err(n) => n - 1,
291        };
292
293        let line_start = self.line_starts[line];
294
295        let rest = &self.source[line_start..];
296        let offset = offset.saturating_sub(line_start);
297        (line, offset, rest)
298    }
299
300    #[cfg(feature = "emit")]
301    fn line_start(&self, line_index: usize) -> Option<usize> {
302        match line_index.cmp(&self.line_starts.len()) {
303            cmp::Ordering::Less => self.line_starts.get(line_index).copied(),
304            cmp::Ordering::Equal => Some(self.source.as_ref().len()),
305            cmp::Ordering::Greater => None,
306        }
307    }
308
309    pub(crate) fn len(&self) -> usize {
310        self.source.len()
311    }
312}
313
314impl fmt::Debug for Source {
315    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
316        f.debug_struct("Source")
317            .field("name", &self.name)
318            .field("path", &self.path)
319            .finish()
320    }
321}
322
323/// Holder for the name of a source.
324#[derive(Default, Debug, TryClone, PartialEq, Eq)]
325enum SourceName {
326    /// An in-memory source, will use `<memory>` when the source is being
327    /// referred to in diagnostics.
328    #[default]
329    Memory,
330    /// A named source.
331    Name(Box<str>),
332}
333
334fn line_starts(source: &str) -> impl Iterator<Item = usize> + '_ {
335    iter::once(0).chain(source.match_indices('\n').map(|(i, _)| i + 1))
336}