syntect/easy.rs
1//! API wrappers for common use cases like highlighting strings and
2//! files without caring about intermediate semantic representation
3//! and caching.
4
5use crate::Error;
6use crate::parsing::{ScopeStack, ParseState, SyntaxReference, SyntaxSet, ScopeStackOp};
7use crate::highlighting::{Highlighter, HighlightState, HighlightIterator, Theme, Style};
8use std::io::{self, BufReader};
9use std::fs::File;
10use std::path::Path;
11// use util::debug_print_ops;
12
13/// Simple way to go directly from lines of text to colored tokens.
14///
15/// Depending on how you load the syntaxes (see the [`SyntaxSet`] docs), this can either take
16/// strings with trailing `\n`s or without.
17///
18/// [`SyntaxSet`]: ../parsing/struct.SyntaxSet.html
19///
20/// # Examples
21///
22/// Prints colored lines of a string to the terminal
23///
24/// ```
25/// use syntect::easy::HighlightLines;
26/// use syntect::parsing::SyntaxSet;
27/// use syntect::highlighting::{ThemeSet, Style};
28/// use syntect::util::{as_24_bit_terminal_escaped, LinesWithEndings};
29///
30/// // Load these once at the start of your program
31/// let ps = SyntaxSet::load_defaults_newlines();
32/// let ts = ThemeSet::load_defaults();
33///
34/// let syntax = ps.find_syntax_by_extension("rs").unwrap();
35/// let mut h = HighlightLines::new(syntax, &ts.themes["base16-ocean.dark"]);
36/// let s = "pub struct Wow { hi: u64 }\nfn blah() -> u64 {}";
37/// for line in LinesWithEndings::from(s) { // LinesWithEndings enables use of newlines mode
38/// let ranges: Vec<(Style, &str)> = h.highlight_line(line, &ps).unwrap();
39/// let escaped = as_24_bit_terminal_escaped(&ranges[..], true);
40/// print!("{}", escaped);
41/// }
42/// ```
43pub struct HighlightLines<'a> {
44 highlighter: Highlighter<'a>,
45 parse_state: ParseState,
46 highlight_state: HighlightState,
47}
48
49impl<'a> HighlightLines<'a> {
50 pub fn new(syntax: &SyntaxReference, theme: &'a Theme) -> HighlightLines<'a> {
51 let highlighter = Highlighter::new(theme);
52 let highlight_state = HighlightState::new(&highlighter, ScopeStack::new());
53 HighlightLines {
54 highlighter,
55 parse_state: ParseState::new(syntax),
56 highlight_state,
57 }
58 }
59
60 #[deprecated(since="5.0.0", note="Renamed to `highlight_line` to make it clear it should be passed a single line at a time")]
61 pub fn highlight<'b>(&mut self, line: &'b str, syntax_set: &SyntaxSet) -> Vec<(Style, &'b str)> {
62 self.highlight_line(line, syntax_set).expect("`highlight` is deprecated, use `highlight_line` instead")
63 }
64
65 /// Highlights a line of a file
66 pub fn highlight_line<'b>(&mut self, line: &'b str, syntax_set: &SyntaxSet) -> Result<Vec<(Style, &'b str)>, Error> {
67 // println!("{}", self.highlight_state.path);
68 let ops = self.parse_state.parse_line(line, syntax_set)?;
69 // use util::debug_print_ops;
70 // debug_print_ops(line, &ops);
71 let iter =
72 HighlightIterator::new(&mut self.highlight_state, &ops[..], line, &self.highlighter);
73 Ok(iter.collect())
74 }
75}
76
77/// Convenience struct containing everything you need to highlight a file
78///
79/// Use the `reader` to get the lines of the file and the `highlight_lines` to highlight them. See
80/// the [`new`] method docs for more information.
81///
82/// [`new`]: #method.new
83pub struct HighlightFile<'a> {
84 pub reader: BufReader<File>,
85 pub highlight_lines: HighlightLines<'a>,
86}
87
88impl<'a> HighlightFile<'a> {
89 /// Constructs a file reader and a line highlighter to get you reading files as fast as possible.
90 ///
91 /// This auto-detects the syntax from the extension and constructs a [`HighlightLines`] with the
92 /// correct syntax and theme.
93 ///
94 /// [`HighlightLines`]: struct.HighlightLines.html
95 ///
96 /// # Examples
97 ///
98 /// Using the `newlines` mode is a bit involved but yields more robust and glitch-free highlighting,
99 /// as well as being slightly faster since it can re-use a line buffer.
100 ///
101 /// ```
102 /// use syntect::parsing::SyntaxSet;
103 /// use syntect::highlighting::{ThemeSet, Style};
104 /// use syntect::util::as_24_bit_terminal_escaped;
105 /// use syntect::easy::HighlightFile;
106 /// use std::io::BufRead;
107 ///
108 /// # use std::io;
109 /// # fn foo() -> io::Result<()> {
110 /// let ss = SyntaxSet::load_defaults_newlines();
111 /// let ts = ThemeSet::load_defaults();
112 ///
113 /// let mut highlighter = HighlightFile::new("testdata/highlight_test.erb", &ss, &ts.themes["base16-ocean.dark"]).unwrap();
114 /// let mut line = String::new();
115 /// while highlighter.reader.read_line(&mut line)? > 0 {
116 /// {
117 /// let regions: Vec<(Style, &str)> = highlighter.highlight_lines.highlight_line(&line, &ss).unwrap();
118 /// print!("{}", as_24_bit_terminal_escaped(®ions[..], true));
119 /// } // until NLL this scope is needed so we can clear the buffer after
120 /// line.clear(); // read_line appends so we need to clear between lines
121 /// }
122 /// # Ok(())
123 /// # }
124 /// ```
125 ///
126 /// This example uses `reader.lines()` to get lines without a newline character, it's simpler but may break on rare tricky cases.
127 ///
128 /// ```
129 /// use syntect::parsing::SyntaxSet;
130 /// use syntect::highlighting::{ThemeSet, Style};
131 /// use syntect::util::as_24_bit_terminal_escaped;
132 /// use syntect::easy::HighlightFile;
133 /// use std::io::BufRead;
134 ///
135 /// let ss = SyntaxSet::load_defaults_nonewlines();
136 /// let ts = ThemeSet::load_defaults();
137 ///
138 /// let mut highlighter = HighlightFile::new("testdata/highlight_test.erb", &ss, &ts.themes["base16-ocean.dark"]).unwrap();
139 /// for maybe_line in highlighter.reader.lines() {
140 /// let line = maybe_line.unwrap();
141 /// let regions: Vec<(Style, &str)> = highlighter.highlight_lines.highlight_line(&line, &ss).unwrap();
142 /// println!("{}", as_24_bit_terminal_escaped(®ions[..], true));
143 /// }
144 /// ```
145 pub fn new<P: AsRef<Path>>(path_obj: P,
146 ss: &SyntaxSet,
147 theme: &'a Theme)
148 -> io::Result<HighlightFile<'a>> {
149 let path: &Path = path_obj.as_ref();
150 let f = File::open(path)?;
151 let syntax = ss.find_syntax_for_file(path)?
152 .unwrap_or_else(|| ss.find_syntax_plain_text());
153
154 Ok(HighlightFile {
155 reader: BufReader::new(f),
156 highlight_lines: HighlightLines::new(syntax, theme),
157 })
158 }
159}
160
161/// Iterator over the ranges of a line which a given the operation from the parser applies.
162///
163/// Use [`ScopeRegionIterator`] to obtain directly regions (`&str`s) from the line.
164///
165/// To use, just keep your own [`ScopeStack`] and then `ScopeStack.apply(op)` the operation that is
166/// yielded at the top of your `for` loop over this iterator. Now you have a substring of the line
167/// and the scope stack for that token.
168///
169/// See the `synstats.rs` example for an example of using this iterator.
170///
171/// **Note:** This will often return empty ranges, just `continue` after applying the op if you
172/// don't want them.
173///
174/// [`ScopeStack`]: ../parsing/struct.ScopeStack.html
175/// [`ScopeRegionIterator`]: ./struct.ScopeRegionIterator.html
176#[derive(Debug)]
177pub struct ScopeRangeIterator<'a> {
178 ops: &'a [(usize, ScopeStackOp)],
179 line: &'a str,
180 index: usize,
181 last_str_index: usize,
182}
183
184impl<'a> ScopeRangeIterator<'a> {
185 pub fn new(ops: &'a [(usize, ScopeStackOp)], line: &'a str) -> ScopeRangeIterator<'a> {
186 ScopeRangeIterator {
187 ops,
188 line,
189 index: 0,
190 last_str_index: 0,
191 }
192 }
193}
194
195static NOOP_OP: ScopeStackOp = ScopeStackOp::Noop;
196
197impl<'a> Iterator for ScopeRangeIterator<'a> {
198 type Item = (std::ops::Range<usize>, &'a ScopeStackOp);
199 fn next(&mut self) -> Option<Self::Item> {
200 if self.index > self.ops.len() {
201 return None;
202 }
203
204 // region extends up to next operation (ops[index]) or string end if there is none
205 // note the next operation may be at, last_str_index, in which case the region is empty
206 let next_str_i = if self.index == self.ops.len() {
207 self.line.len()
208 } else {
209 self.ops[self.index].0
210 };
211 let range = self.last_str_index..next_str_i;
212 self.last_str_index = next_str_i;
213
214 // the first region covers everything before the first op, which may be empty
215 let op = if self.index == 0 {
216 &NOOP_OP
217 } else {
218 &self.ops[self.index - 1].1
219 };
220
221 self.index += 1;
222 Some((range, op))
223 }
224}
225
226/// A convenience wrapper over [`ScopeRangeIterator`] to return `&str`s directly.
227///
228/// To use, just keep your own [`ScopeStack`] and then `ScopeStack.apply(op)` the operation that is
229/// yielded at the top of your `for` loop over this iterator. Now you have a substring of the line
230/// and the scope stack for that token.
231///
232/// See the `synstats.rs` example for an example of using this iterator.
233///
234/// **Note:** This will often return empty regions, just `continue` after applying the op if you
235/// don't want them.
236///
237/// [`ScopeStack`]: ../parsing/struct.ScopeStack.html
238/// [`ScopeRangeIterator`]: ./struct.ScopeRangeIterator.html
239#[derive(Debug)]
240pub struct ScopeRegionIterator<'a> {
241 range_iter: ScopeRangeIterator<'a>,
242}
243
244impl<'a> ScopeRegionIterator<'a> {
245 pub fn new(ops: &'a [(usize, ScopeStackOp)], line: &'a str) -> ScopeRegionIterator<'a> {
246 ScopeRegionIterator {
247 range_iter: ScopeRangeIterator::new(ops, line),
248 }
249 }
250}
251
252impl<'a> Iterator for ScopeRegionIterator<'a> {
253 type Item = (&'a str, &'a ScopeStackOp);
254 fn next(&mut self) -> Option<Self::Item> {
255 let (range, op) = self.range_iter.next()?;
256 Some((&self.range_iter.line[range], op))
257 }
258}
259
260#[cfg(test)]
261mod tests {
262 use super::*;
263 use crate::parsing::{SyntaxSet, ParseState, ScopeStack};
264 #[cfg(feature = "default-themes")]
265 use crate::highlighting::ThemeSet;
266 use std::str::FromStr;
267
268 #[cfg(all(feature = "default-syntaxes", feature = "default-themes"))]
269 #[test]
270 fn can_highlight_lines() {
271 let ss = SyntaxSet::load_defaults_nonewlines();
272 let ts = ThemeSet::load_defaults();
273 let syntax = ss.find_syntax_by_extension("rs").unwrap();
274 let mut h = HighlightLines::new(syntax, &ts.themes["base16-ocean.dark"]);
275 let ranges = h.highlight_line("pub struct Wow { hi: u64 }", &ss).expect("#[cfg(test)]");
276 assert!(ranges.len() > 4);
277 }
278
279 #[cfg(all(feature = "default-syntaxes", feature = "default-themes"))]
280 #[test]
281 fn can_highlight_file() {
282 let ss = SyntaxSet::load_defaults_nonewlines();
283 let ts = ThemeSet::load_defaults();
284 HighlightFile::new("testdata/highlight_test.erb",
285 &ss,
286 &ts.themes["base16-ocean.dark"])
287 .unwrap();
288 }
289
290 #[cfg(feature = "default-syntaxes")]
291 #[test]
292 fn can_find_regions() {
293 let ss = SyntaxSet::load_defaults_nonewlines();
294 let mut state = ParseState::new(ss.find_syntax_by_extension("rb").unwrap());
295 let line = "lol =5+2";
296 let ops = state.parse_line(line, &ss).expect("#[cfg(test)]");
297
298 let mut stack = ScopeStack::new();
299 let mut token_count = 0;
300 for (s, op) in ScopeRegionIterator::new(&ops, line) {
301 stack.apply(op).expect("#[cfg(test)]");
302 if s.is_empty() { // in this case we don't care about blank tokens
303 continue;
304 }
305 if token_count == 1 {
306 assert_eq!(stack, ScopeStack::from_str("source.ruby keyword.operator.assignment.ruby").unwrap());
307 assert_eq!(s, "=");
308 }
309 token_count += 1;
310 println!("{:?} {}", s, stack);
311 }
312 assert_eq!(token_count, 5);
313 }
314
315 #[cfg(feature = "default-syntaxes")]
316 #[test]
317 fn can_find_regions_with_trailing_newline() {
318 let ss = SyntaxSet::load_defaults_newlines();
319 let mut state = ParseState::new(ss.find_syntax_by_extension("rb").unwrap());
320 let lines = ["# hello world\n", "lol=5+2\n"];
321 let mut stack = ScopeStack::new();
322
323 for line in lines.iter() {
324 let ops = state.parse_line(line, &ss).expect("#[cfg(test)]");
325 println!("{:?}", ops);
326
327 let mut iterated_ops: Vec<&ScopeStackOp> = Vec::new();
328 for (_, op) in ScopeRegionIterator::new(&ops, line) {
329 stack.apply(op).expect("#[cfg(test)]");
330 iterated_ops.push(op);
331 println!("{:?}", op);
332 }
333
334 let all_ops = ops.iter().map(|t| &t.1);
335 assert_eq!(all_ops.count(), iterated_ops.len() - 1); // -1 because we want to ignore the NOOP
336 }
337 }
338}