Coverage Report

Created: 2026-02-14 06:23

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/regex/regex-syntax/src/error.rs
Line
Count
Source
1
use alloc::{
2
    format,
3
    string::{String, ToString},
4
    vec,
5
    vec::Vec,
6
};
7
8
use crate::{ast, hir};
9
10
/// This error type encompasses any error that can be returned by this crate.
11
///
12
/// This error type is marked as `non_exhaustive`. This means that adding a
13
/// new variant is not considered a breaking change.
14
#[non_exhaustive]
15
#[derive(Clone, Debug, Eq, PartialEq)]
16
pub enum Error {
17
    /// An error that occurred while translating concrete syntax into abstract
18
    /// syntax (AST).
19
    Parse(ast::Error),
20
    /// An error that occurred while translating abstract syntax into a high
21
    /// level intermediate representation (HIR).
22
    Translate(hir::Error),
23
}
24
25
impl From<ast::Error> for Error {
26
6.40k
    fn from(err: ast::Error) -> Error {
27
6.40k
        Error::Parse(err)
28
6.40k
    }
29
}
30
31
impl From<hir::Error> for Error {
32
2.63k
    fn from(err: hir::Error) -> Error {
33
2.63k
        Error::Translate(err)
34
2.63k
    }
35
}
36
37
#[cfg(feature = "std")]
38
impl std::error::Error for Error {}
39
40
impl core::fmt::Display for Error {
41
9.03k
    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
42
9.03k
        match *self {
43
6.40k
            Error::Parse(ref x) => x.fmt(f),
44
2.63k
            Error::Translate(ref x) => x.fmt(f),
45
        }
46
9.03k
    }
47
}
48
49
/// A helper type for formatting nice error messages.
50
///
51
/// This type is responsible for reporting regex parse errors in a nice human
52
/// readable format. Most of its complexity is from interspersing notational
53
/// markers pointing out the position where an error occurred.
54
#[derive(Debug)]
55
pub struct Formatter<'e, E> {
56
    /// The original regex pattern in which the error occurred.
57
    pattern: &'e str,
58
    /// The error kind. It must impl fmt::Display.
59
    err: &'e E,
60
    /// The primary span of the error.
61
    span: &'e ast::Span,
62
    /// An auxiliary and optional span, in case the error needs to point to
63
    /// two locations (e.g., when reporting a duplicate capture group name).
64
    aux_span: Option<&'e ast::Span>,
65
}
66
67
impl<'e> From<&'e ast::Error> for Formatter<'e, ast::ErrorKind> {
68
6.40k
    fn from(err: &'e ast::Error) -> Self {
69
6.40k
        Formatter {
70
6.40k
            pattern: err.pattern(),
71
6.40k
            err: err.kind(),
72
6.40k
            span: err.span(),
73
6.40k
            aux_span: err.auxiliary_span(),
74
6.40k
        }
75
6.40k
    }
76
}
77
78
impl<'e> From<&'e hir::Error> for Formatter<'e, hir::ErrorKind> {
79
2.63k
    fn from(err: &'e hir::Error) -> Self {
80
2.63k
        Formatter {
81
2.63k
            pattern: err.pattern(),
82
2.63k
            err: err.kind(),
83
2.63k
            span: err.span(),
84
2.63k
            aux_span: None,
85
2.63k
        }
86
2.63k
    }
87
}
88
89
impl<'e, E: core::fmt::Display> core::fmt::Display for Formatter<'e, E> {
90
9.03k
    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
91
9.03k
        let spans = Spans::from_formatter(self);
92
9.03k
        if self.pattern.contains('\n') {
93
553
            let divider = repeat_char('~', 79);
94
95
553
            writeln!(f, "regex parse error:")?;
96
553
            writeln!(f, "{divider}")?;
97
553
            let notated = spans.notate();
98
553
            write!(f, "{notated}")?;
99
553
            writeln!(f, "{divider}")?;
100
            // If we have error spans that cover multiple lines, then we just
101
            // note the line numbers.
102
553
            if !spans.multi_line.is_empty() {
103
84
                let mut notes = vec![];
104
168
                for span in &spans.multi_line {
105
84
                    notes.push(format!(
106
84
                        "on line {} (column {}) through line {} (column {})",
107
84
                        span.start.line,
108
84
                        span.start.column,
109
84
                        span.end.line,
110
84
                        span.end.column - 1
111
84
                    ));
112
84
                }
113
84
                writeln!(f, "{}", notes.join("\n"))?;
114
469
            }
115
553
            write!(f, "error: {}", self.err)?;
116
        } else {
117
8.48k
            writeln!(f, "regex parse error:")?;
118
8.48k
            let notated = Spans::from_formatter(self).notate();
119
8.48k
            write!(f, "{notated}")?;
120
8.48k
            write!(f, "error: {}", self.err)?;
121
        }
122
9.03k
        Ok(())
123
9.03k
    }
<regex_syntax::error::Formatter<regex_syntax::ast::ErrorKind> as core::fmt::Display>::fmt
Line
Count
Source
90
6.40k
    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
91
6.40k
        let spans = Spans::from_formatter(self);
92
6.40k
        if self.pattern.contains('\n') {
93
399
            let divider = repeat_char('~', 79);
94
95
399
            writeln!(f, "regex parse error:")?;
96
399
            writeln!(f, "{divider}")?;
97
399
            let notated = spans.notate();
98
399
            write!(f, "{notated}")?;
99
399
            writeln!(f, "{divider}")?;
100
            // If we have error spans that cover multiple lines, then we just
101
            // note the line numbers.
102
399
            if !spans.multi_line.is_empty() {
103
74
                let mut notes = vec![];
104
148
                for span in &spans.multi_line {
105
74
                    notes.push(format!(
106
74
                        "on line {} (column {}) through line {} (column {})",
107
74
                        span.start.line,
108
74
                        span.start.column,
109
74
                        span.end.line,
110
74
                        span.end.column - 1
111
74
                    ));
112
74
                }
113
74
                writeln!(f, "{}", notes.join("\n"))?;
114
325
            }
115
399
            write!(f, "error: {}", self.err)?;
116
        } else {
117
6.00k
            writeln!(f, "regex parse error:")?;
118
6.00k
            let notated = Spans::from_formatter(self).notate();
119
6.00k
            write!(f, "{notated}")?;
120
6.00k
            write!(f, "error: {}", self.err)?;
121
        }
122
6.40k
        Ok(())
123
6.40k
    }
<regex_syntax::error::Formatter<regex_syntax::hir::ErrorKind> as core::fmt::Display>::fmt
Line
Count
Source
90
2.63k
    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
91
2.63k
        let spans = Spans::from_formatter(self);
92
2.63k
        if self.pattern.contains('\n') {
93
154
            let divider = repeat_char('~', 79);
94
95
154
            writeln!(f, "regex parse error:")?;
96
154
            writeln!(f, "{divider}")?;
97
154
            let notated = spans.notate();
98
154
            write!(f, "{notated}")?;
99
154
            writeln!(f, "{divider}")?;
100
            // If we have error spans that cover multiple lines, then we just
101
            // note the line numbers.
102
154
            if !spans.multi_line.is_empty() {
103
10
                let mut notes = vec![];
104
20
                for span in &spans.multi_line {
105
10
                    notes.push(format!(
106
10
                        "on line {} (column {}) through line {} (column {})",
107
10
                        span.start.line,
108
10
                        span.start.column,
109
10
                        span.end.line,
110
10
                        span.end.column - 1
111
10
                    ));
112
10
                }
113
10
                writeln!(f, "{}", notes.join("\n"))?;
114
144
            }
115
154
            write!(f, "error: {}", self.err)?;
116
        } else {
117
2.47k
            writeln!(f, "regex parse error:")?;
118
2.47k
            let notated = Spans::from_formatter(self).notate();
119
2.47k
            write!(f, "{notated}")?;
120
2.47k
            write!(f, "error: {}", self.err)?;
121
        }
122
2.63k
        Ok(())
123
2.63k
    }
124
}
125
126
/// This type represents an arbitrary number of error spans in a way that makes
127
/// it convenient to notate the regex pattern. ("Notate" means "point out
128
/// exactly where the error occurred in the regex pattern.")
129
///
130
/// Technically, we can only ever have two spans given our current error
131
/// structure. However, after toiling with a specific algorithm for handling
132
/// two spans, it became obvious that an algorithm to handle an arbitrary
133
/// number of spans was actually much simpler.
134
struct Spans<'p> {
135
    /// The original regex pattern string.
136
    pattern: &'p str,
137
    /// The total width that should be used for line numbers. The width is
138
    /// used for left padding the line numbers for alignment.
139
    ///
140
    /// A value of `0` means line numbers should not be displayed. That is,
141
    /// the pattern is itself only one line.
142
    line_number_width: usize,
143
    /// All error spans that occur on a single line. This sequence always has
144
    /// length equivalent to the number of lines in `pattern`, where the index
145
    /// of the sequence represents a line number, starting at `0`. The spans
146
    /// in each line are sorted in ascending order.
147
    by_line: Vec<Vec<ast::Span>>,
148
    /// All error spans that occur over one or more lines. That is, the start
149
    /// and end position of the span have different line numbers. The spans are
150
    /// sorted in ascending order.
151
    multi_line: Vec<ast::Span>,
152
}
153
154
impl<'p> Spans<'p> {
155
    /// Build a sequence of spans from a formatter.
156
17.5k
    fn from_formatter<'e, E: core::fmt::Display>(
157
17.5k
        fmter: &'p Formatter<'e, E>,
158
17.5k
    ) -> Spans<'p> {
159
17.5k
        let mut line_count = fmter.pattern.lines().count();
160
        // If the pattern ends with a `\n` literal, then our line count is
161
        // off by one, since a span can occur immediately after the last `\n`,
162
        // which is consider to be an additional line.
163
17.5k
        if fmter.pattern.ends_with('\n') {
164
102
            line_count += 1;
165
17.4k
        }
166
17.5k
        let line_number_width =
167
17.5k
            if line_count <= 1 { 0 } else { line_count.to_string().len() };
168
17.5k
        let mut spans = Spans {
169
17.5k
            pattern: &fmter.pattern,
170
17.5k
            line_number_width,
171
17.5k
            by_line: vec![vec![]; line_count],
172
17.5k
            multi_line: vec![],
173
17.5k
        };
174
17.5k
        spans.add(fmter.span.clone());
175
17.5k
        if let Some(span) = fmter.aux_span {
176
1.05k
            spans.add(span.clone());
177
16.4k
        }
178
17.5k
        spans
179
17.5k
    }
<regex_syntax::error::Spans>::from_formatter::<regex_syntax::ast::ErrorKind>
Line
Count
Source
156
12.4k
    fn from_formatter<'e, E: core::fmt::Display>(
157
12.4k
        fmter: &'p Formatter<'e, E>,
158
12.4k
    ) -> Spans<'p> {
159
12.4k
        let mut line_count = fmter.pattern.lines().count();
160
        // If the pattern ends with a `\n` literal, then our line count is
161
        // off by one, since a span can occur immediately after the last `\n`,
162
        // which is consider to be an additional line.
163
12.4k
        if fmter.pattern.ends_with('\n') {
164
71
            line_count += 1;
165
12.3k
        }
166
12.4k
        let line_number_width =
167
12.4k
            if line_count <= 1 { 0 } else { line_count.to_string().len() };
168
12.4k
        let mut spans = Spans {
169
12.4k
            pattern: &fmter.pattern,
170
12.4k
            line_number_width,
171
12.4k
            by_line: vec![vec![]; line_count],
172
12.4k
            multi_line: vec![],
173
12.4k
        };
174
12.4k
        spans.add(fmter.span.clone());
175
12.4k
        if let Some(span) = fmter.aux_span {
176
1.05k
            spans.add(span.clone());
177
11.3k
        }
178
12.4k
        spans
179
12.4k
    }
<regex_syntax::error::Spans>::from_formatter::<regex_syntax::hir::ErrorKind>
Line
Count
Source
156
5.10k
    fn from_formatter<'e, E: core::fmt::Display>(
157
5.10k
        fmter: &'p Formatter<'e, E>,
158
5.10k
    ) -> Spans<'p> {
159
5.10k
        let mut line_count = fmter.pattern.lines().count();
160
        // If the pattern ends with a `\n` literal, then our line count is
161
        // off by one, since a span can occur immediately after the last `\n`,
162
        // which is consider to be an additional line.
163
5.10k
        if fmter.pattern.ends_with('\n') {
164
31
            line_count += 1;
165
5.07k
        }
166
5.10k
        let line_number_width =
167
5.10k
            if line_count <= 1 { 0 } else { line_count.to_string().len() };
168
5.10k
        let mut spans = Spans {
169
5.10k
            pattern: &fmter.pattern,
170
5.10k
            line_number_width,
171
5.10k
            by_line: vec![vec![]; line_count],
172
5.10k
            multi_line: vec![],
173
5.10k
        };
174
5.10k
        spans.add(fmter.span.clone());
175
5.10k
        if let Some(span) = fmter.aux_span {
176
0
            spans.add(span.clone());
177
5.10k
        }
178
5.10k
        spans
179
5.10k
    }
180
181
    /// Add the given span to this sequence, putting it in the right place.
182
18.5k
    fn add(&mut self, span: ast::Span) {
183
        // This is grossly inefficient since we sort after each add, but right
184
        // now, we only ever add two spans at most.
185
18.5k
        if span.is_one_line() {
186
18.4k
            let i = span.start.line - 1; // because lines are 1-indexed
187
18.4k
            self.by_line[i].push(span);
188
18.4k
            self.by_line[i].sort();
189
18.4k
        } else {
190
84
            self.multi_line.push(span);
191
84
            self.multi_line.sort();
192
84
        }
193
18.5k
    }
194
195
    /// Notate the pattern string with carets (`^`) pointing at each span
196
    /// location. This only applies to spans that occur within a single line.
197
9.03k
    fn notate(&self) -> String {
198
9.03k
        let mut notated = String::new();
199
110k
        for (i, line) in self.pattern.lines().enumerate() {
200
110k
            if self.line_number_width > 0 {
201
101k
                notated.push_str(&self.left_pad_line_number(i + 1));
202
101k
                notated.push_str(": ");
203
101k
            } else {
204
8.48k
                notated.push_str("    ");
205
8.48k
            }
206
110k
            notated.push_str(line);
207
110k
            notated.push('\n');
208
110k
            if let Some(notes) = self.notate_line(i) {
209
8.96k
                notated.push_str(&notes);
210
8.96k
                notated.push('\n');
211
101k
            }
212
        }
213
9.03k
        notated
214
9.03k
    }
215
216
    /// Return notes for the line indexed at `i` (zero-based). If there are no
217
    /// spans for the given line, then `None` is returned. Otherwise, an
218
    /// appropriately space padded string with correctly positioned `^` is
219
    /// returned, accounting for line numbers.
220
110k
    fn notate_line(&self, i: usize) -> Option<String> {
221
110k
        let spans = &self.by_line[i];
222
110k
        if spans.is_empty() {
223
101k
            return None;
224
8.96k
        }
225
8.96k
        let mut notes = String::new();
226
35.6k
        for _ in 0..self.line_number_padding() {
227
35.6k
            notes.push(' ');
228
35.6k
        }
229
8.96k
        let mut pos = 0;
230
18.4k
        for span in spans {
231
3.32M
            for _ in pos..(span.start.column - 1) {
232
3.32M
                notes.push(' ');
233
3.32M
                pos += 1;
234
3.32M
            }
235
9.48k
            let note_len = span.end.column.saturating_sub(span.start.column);
236
269k
            for _ in 0..core::cmp::max(1, note_len) {
237
269k
                notes.push('^');
238
269k
                pos += 1;
239
269k
            }
240
        }
241
8.96k
        Some(notes)
242
110k
    }
243
244
    /// Left pad the given line number with spaces such that it is aligned with
245
    /// other line numbers.
246
101k
    fn left_pad_line_number(&self, n: usize) -> String {
247
101k
        let n = n.to_string();
248
101k
        let pad = self.line_number_width.checked_sub(n.len()).unwrap();
249
101k
        let mut result = repeat_char(' ', pad);
250
101k
        result.push_str(&n);
251
101k
        result
252
101k
    }
253
254
    /// Return the line number padding beginning at the start of each line of
255
    /// the pattern.
256
    ///
257
    /// If the pattern is only one line, then this returns a fixed padding
258
    /// for visual indentation.
259
8.96k
    fn line_number_padding(&self) -> usize {
260
8.96k
        if self.line_number_width == 0 {
261
8.48k
            4
262
        } else {
263
480
            2 + self.line_number_width
264
        }
265
8.96k
    }
266
}
267
268
102k
fn repeat_char(c: char, count: usize) -> String {
269
102k
    core::iter::repeat(c).take(count).collect()
270
102k
}
271
272
#[cfg(test)]
273
mod tests {
274
    use alloc::string::ToString;
275
276
    use crate::ast::parse::Parser;
277
278
    fn assert_panic_message(pattern: &str, expected_msg: &str) {
279
        let result = Parser::new().parse(pattern);
280
        match result {
281
            Ok(_) => {
282
                panic!("regex should not have parsed");
283
            }
284
            Err(err) => {
285
                assert_eq!(err.to_string(), expected_msg.trim());
286
            }
287
        }
288
    }
289
290
    // See: https://github.com/rust-lang/regex/issues/464
291
    #[test]
292
    fn regression_464() {
293
        let err = Parser::new().parse("a{\n").unwrap_err();
294
        // This test checks that the error formatter doesn't panic.
295
        assert!(!err.to_string().is_empty());
296
    }
297
298
    // See: https://github.com/rust-lang/regex/issues/545
299
    #[test]
300
    fn repetition_quantifier_expects_a_valid_decimal() {
301
        assert_panic_message(
302
            r"\\u{[^}]*}",
303
            r#"
304
regex parse error:
305
    \\u{[^}]*}
306
        ^
307
error: repetition quantifier expects a valid decimal
308
"#,
309
        );
310
    }
311
}