syntect/
easy.rs

1//! API wrappers for common use cases like highlighting strings and
2//! files without caring about intermediate semantic representation
3//! and caching.
4
5use crate::Error;
6use crate::parsing::{ScopeStack, ParseState, SyntaxReference, SyntaxSet, ScopeStackOp};
7use crate::highlighting::{Highlighter, HighlightState, HighlightIterator, Theme, Style};
8use std::io::{self, BufReader};
9use std::fs::File;
10use std::path::Path;
11// use util::debug_print_ops;
12
13/// Simple way to go directly from lines of text to colored tokens.
14///
15/// Depending on how you load the syntaxes (see the [`SyntaxSet`] docs), this can either take
16/// strings with trailing `\n`s or without.
17///
18/// [`SyntaxSet`]: ../parsing/struct.SyntaxSet.html
19///
20/// # Examples
21///
22/// Prints colored lines of a string to the terminal
23///
24/// ```
25/// use syntect::easy::HighlightLines;
26/// use syntect::parsing::SyntaxSet;
27/// use syntect::highlighting::{ThemeSet, Style};
28/// use syntect::util::{as_24_bit_terminal_escaped, LinesWithEndings};
29///
30/// // Load these once at the start of your program
31/// let ps = SyntaxSet::load_defaults_newlines();
32/// let ts = ThemeSet::load_defaults();
33///
34/// let syntax = ps.find_syntax_by_extension("rs").unwrap();
35/// let mut h = HighlightLines::new(syntax, &ts.themes["base16-ocean.dark"]);
36/// let s = "pub struct Wow { hi: u64 }\nfn blah() -> u64 {}";
37/// for line in LinesWithEndings::from(s) { // LinesWithEndings enables use of newlines mode
38///     let ranges: Vec<(Style, &str)> = h.highlight_line(line, &ps).unwrap();
39///     let escaped = as_24_bit_terminal_escaped(&ranges[..], true);
40///     print!("{}", escaped);
41/// }
42/// ```
43pub struct HighlightLines<'a> {
44    highlighter: Highlighter<'a>,
45    parse_state: ParseState,
46    highlight_state: HighlightState,
47}
48
49impl<'a> HighlightLines<'a> {
50    pub fn new(syntax: &SyntaxReference, theme: &'a Theme) -> HighlightLines<'a> {
51        let highlighter = Highlighter::new(theme);
52        let highlight_state = HighlightState::new(&highlighter, ScopeStack::new());
53        HighlightLines {
54            highlighter,
55            parse_state: ParseState::new(syntax),
56            highlight_state,
57        }
58    }
59
60    #[deprecated(since="5.0.0", note="Renamed to `highlight_line` to make it clear it should be passed a single line at a time")]
61    pub fn highlight<'b>(&mut self, line: &'b str, syntax_set: &SyntaxSet) -> Vec<(Style, &'b str)> {
62        self.highlight_line(line, syntax_set).expect("`highlight` is deprecated, use `highlight_line` instead")
63    }
64
65    /// Highlights a line of a file
66    pub fn highlight_line<'b>(&mut self, line: &'b str, syntax_set: &SyntaxSet) -> Result<Vec<(Style, &'b str)>, Error> {
67        // println!("{}", self.highlight_state.path);
68        let ops = self.parse_state.parse_line(line, syntax_set)?;
69        // use util::debug_print_ops;
70        // debug_print_ops(line, &ops);
71        let iter =
72            HighlightIterator::new(&mut self.highlight_state, &ops[..], line, &self.highlighter);
73        Ok(iter.collect())
74    }
75}
76
77/// Convenience struct containing everything you need to highlight a file
78///
79/// Use the `reader` to get the lines of the file and the `highlight_lines` to highlight them. See
80/// the [`new`] method docs for more information.
81///
82/// [`new`]: #method.new
83pub struct HighlightFile<'a> {
84    pub reader: BufReader<File>,
85    pub highlight_lines: HighlightLines<'a>,
86}
87
88impl<'a> HighlightFile<'a> {
89    /// Constructs a file reader and a line highlighter to get you reading files as fast as possible.
90    ///
91    /// This auto-detects the syntax from the extension and constructs a [`HighlightLines`] with the
92    /// correct syntax and theme.
93    ///
94    /// [`HighlightLines`]: struct.HighlightLines.html
95    ///
96    /// # Examples
97    ///
98    /// Using the `newlines` mode is a bit involved but yields more robust and glitch-free highlighting,
99    /// as well as being slightly faster since it can re-use a line buffer.
100    ///
101    /// ```
102    /// use syntect::parsing::SyntaxSet;
103    /// use syntect::highlighting::{ThemeSet, Style};
104    /// use syntect::util::as_24_bit_terminal_escaped;
105    /// use syntect::easy::HighlightFile;
106    /// use std::io::BufRead;
107    ///
108    /// # use std::io;
109    /// # fn foo() -> io::Result<()> {
110    /// let ss = SyntaxSet::load_defaults_newlines();
111    /// let ts = ThemeSet::load_defaults();
112    ///
113    /// let mut highlighter = HighlightFile::new("testdata/highlight_test.erb", &ss, &ts.themes["base16-ocean.dark"]).unwrap();
114    /// let mut line = String::new();
115    /// while highlighter.reader.read_line(&mut line)? > 0 {
116    ///     {
117    ///         let regions: Vec<(Style, &str)> = highlighter.highlight_lines.highlight_line(&line, &ss).unwrap();
118    ///         print!("{}", as_24_bit_terminal_escaped(&regions[..], true));
119    ///     } // until NLL this scope is needed so we can clear the buffer after
120    ///     line.clear(); // read_line appends so we need to clear between lines
121    /// }
122    /// # Ok(())
123    /// # }
124    /// ```
125    ///
126    /// This example uses `reader.lines()` to get lines without a newline character, it's simpler but may break on rare tricky cases.
127    ///
128    /// ```
129    /// use syntect::parsing::SyntaxSet;
130    /// use syntect::highlighting::{ThemeSet, Style};
131    /// use syntect::util::as_24_bit_terminal_escaped;
132    /// use syntect::easy::HighlightFile;
133    /// use std::io::BufRead;
134    ///
135    /// let ss = SyntaxSet::load_defaults_nonewlines();
136    /// let ts = ThemeSet::load_defaults();
137    ///
138    /// let mut highlighter = HighlightFile::new("testdata/highlight_test.erb", &ss, &ts.themes["base16-ocean.dark"]).unwrap();
139    /// for maybe_line in highlighter.reader.lines() {
140    ///     let line = maybe_line.unwrap();
141    ///     let regions: Vec<(Style, &str)> = highlighter.highlight_lines.highlight_line(&line, &ss).unwrap();
142    ///     println!("{}", as_24_bit_terminal_escaped(&regions[..], true));
143    /// }
144    /// ```
145    pub fn new<P: AsRef<Path>>(path_obj: P,
146                               ss: &SyntaxSet,
147                               theme: &'a Theme)
148                               -> io::Result<HighlightFile<'a>> {
149        let path: &Path = path_obj.as_ref();
150        let f = File::open(path)?;
151        let syntax = ss.find_syntax_for_file(path)?
152            .unwrap_or_else(|| ss.find_syntax_plain_text());
153
154        Ok(HighlightFile {
155            reader: BufReader::new(f),
156            highlight_lines: HighlightLines::new(syntax, theme),
157        })
158    }
159}
160
161/// Iterator over the ranges of a line which a given the operation from the parser applies.
162///
163/// Use [`ScopeRegionIterator`] to obtain directly regions (`&str`s) from the line.
164///
165/// To use, just keep your own [`ScopeStack`] and then `ScopeStack.apply(op)` the operation that is
166/// yielded at the top of your `for` loop over this iterator. Now you have a substring of the line
167/// and the scope stack for that token.
168///
169/// See the `synstats.rs` example for an example of using this iterator.
170///
171/// **Note:** This will often return empty ranges, just `continue` after applying the op if you
172/// don't want them.
173///
174/// [`ScopeStack`]: ../parsing/struct.ScopeStack.html
175/// [`ScopeRegionIterator`]: ./struct.ScopeRegionIterator.html
176#[derive(Debug)]
177pub struct ScopeRangeIterator<'a> {
178    ops: &'a [(usize, ScopeStackOp)],
179    line: &'a str,
180    index: usize,
181    last_str_index: usize,
182}
183
184impl<'a> ScopeRangeIterator<'a> {
185    pub fn new(ops: &'a [(usize, ScopeStackOp)], line: &'a str) -> ScopeRangeIterator<'a> {
186        ScopeRangeIterator {
187            ops,
188            line,
189            index: 0,
190            last_str_index: 0,
191        }
192    }
193}
194
195static NOOP_OP: ScopeStackOp = ScopeStackOp::Noop;
196
197impl<'a> Iterator for ScopeRangeIterator<'a> {
198    type Item = (std::ops::Range<usize>, &'a ScopeStackOp);
199    fn next(&mut self) -> Option<Self::Item> {
200        if self.index > self.ops.len() {
201            return None;
202        }
203
204        // region extends up to next operation (ops[index]) or string end if there is none
205        // note the next operation may be at, last_str_index, in which case the region is empty
206        let next_str_i = if self.index == self.ops.len() {
207            self.line.len()
208        } else {
209            self.ops[self.index].0
210        };
211        let range = self.last_str_index..next_str_i;
212        self.last_str_index = next_str_i;
213
214        // the first region covers everything before the first op, which may be empty
215        let op = if self.index == 0 {
216            &NOOP_OP
217        } else {
218            &self.ops[self.index - 1].1
219        };
220
221        self.index += 1;
222        Some((range, op))
223    }
224}
225
226/// A convenience wrapper over [`ScopeRangeIterator`] to return `&str`s directly.
227///
228/// To use, just keep your own [`ScopeStack`] and then `ScopeStack.apply(op)` the operation that is
229/// yielded at the top of your `for` loop over this iterator. Now you have a substring of the line
230/// and the scope stack for that token.
231///
232/// See the `synstats.rs` example for an example of using this iterator.
233///
234/// **Note:** This will often return empty regions, just `continue` after applying the op if you
235/// don't want them.
236///
237/// [`ScopeStack`]: ../parsing/struct.ScopeStack.html
238/// [`ScopeRangeIterator`]: ./struct.ScopeRangeIterator.html
239#[derive(Debug)]
240pub struct ScopeRegionIterator<'a> {
241    range_iter: ScopeRangeIterator<'a>,
242}
243
244impl<'a> ScopeRegionIterator<'a> {
245    pub fn new(ops: &'a [(usize, ScopeStackOp)], line: &'a str) -> ScopeRegionIterator<'a> {
246        ScopeRegionIterator {
247            range_iter: ScopeRangeIterator::new(ops, line),
248        }
249    }
250}
251
252impl<'a> Iterator for ScopeRegionIterator<'a> {
253    type Item = (&'a str, &'a ScopeStackOp);
254    fn next(&mut self) -> Option<Self::Item> {
255        let (range, op) = self.range_iter.next()?;
256        Some((&self.range_iter.line[range], op))
257    }
258}
259
260#[cfg(test)]
261mod tests {
262    use super::*;
263    use crate::parsing::{SyntaxSet, ParseState, ScopeStack};
264    #[cfg(feature = "default-themes")]
265    use crate::highlighting::ThemeSet;
266    use std::str::FromStr;
267
268    #[cfg(all(feature = "default-syntaxes", feature = "default-themes"))]
269    #[test]
270    fn can_highlight_lines() {
271        let ss = SyntaxSet::load_defaults_nonewlines();
272        let ts = ThemeSet::load_defaults();
273        let syntax = ss.find_syntax_by_extension("rs").unwrap();
274        let mut h = HighlightLines::new(syntax, &ts.themes["base16-ocean.dark"]);
275        let ranges = h.highlight_line("pub struct Wow { hi: u64 }", &ss).expect("#[cfg(test)]");
276        assert!(ranges.len() > 4);
277    }
278
279    #[cfg(all(feature = "default-syntaxes", feature = "default-themes"))]
280    #[test]
281    fn can_highlight_file() {
282        let ss = SyntaxSet::load_defaults_nonewlines();
283        let ts = ThemeSet::load_defaults();
284        HighlightFile::new("testdata/highlight_test.erb",
285                           &ss,
286                           &ts.themes["base16-ocean.dark"])
287            .unwrap();
288    }
289
290    #[cfg(feature = "default-syntaxes")]
291    #[test]
292    fn can_find_regions() {
293        let ss = SyntaxSet::load_defaults_nonewlines();
294        let mut state = ParseState::new(ss.find_syntax_by_extension("rb").unwrap());
295        let line = "lol =5+2";
296        let ops = state.parse_line(line, &ss).expect("#[cfg(test)]");
297
298        let mut stack = ScopeStack::new();
299        let mut token_count = 0;
300        for (s, op) in ScopeRegionIterator::new(&ops, line) {
301            stack.apply(op).expect("#[cfg(test)]");
302            if s.is_empty() { // in this case we don't care about blank tokens
303                continue;
304            }
305            if token_count == 1 {
306                assert_eq!(stack, ScopeStack::from_str("source.ruby keyword.operator.assignment.ruby").unwrap());
307                assert_eq!(s, "=");
308            }
309            token_count += 1;
310            println!("{:?} {}", s, stack);
311        }
312        assert_eq!(token_count, 5);
313    }
314
315    #[cfg(feature = "default-syntaxes")]
316    #[test]
317    fn can_find_regions_with_trailing_newline() {
318        let ss = SyntaxSet::load_defaults_newlines();
319        let mut state = ParseState::new(ss.find_syntax_by_extension("rb").unwrap());
320        let lines = ["# hello world\n", "lol=5+2\n"];
321        let mut stack = ScopeStack::new();
322
323        for line in lines.iter() {
324            let ops = state.parse_line(line, &ss).expect("#[cfg(test)]");
325            println!("{:?}", ops);
326
327            let mut iterated_ops: Vec<&ScopeStackOp> = Vec::new();
328            for (_, op) in ScopeRegionIterator::new(&ops, line) {
329                stack.apply(op).expect("#[cfg(test)]");
330                iterated_ops.push(op);
331                println!("{:?}", op);
332            }
333
334            let all_ops = ops.iter().map(|t| &t.1);
335            assert_eq!(all_ops.count(), iterated_ops.len() - 1); // -1 because we want to ignore the NOOP
336        }
337    }
338}