/src/cpython/Parser/string_parser.c

Source (jump to first uncovered line)
#include <Python.h>
#include "pycore_bytesobject.h"   // _PyBytes_DecodeEscape()
#include "pycore_unicodeobject.h" // _PyUnicode_DecodeUnicodeEscapeInternal()

#include "lexer/state.h"
#include "pegen.h"
#include "string_parser.h"

#include <stdbool.h>

//// STRING HANDLING FUNCTIONS ////

/* Emit a warning for the invalid escape sequence whose character (the one
   following the backslash) is at `first_invalid_escape` inside `buffer`.

   `t` is the token the string came from; its position is the starting point
   for computing where the escape sits.  The warning category is chosen from
   p->feature_version (SyntaxWarning for >= 12, DeprecationWarning otherwise).

   Returns 0 when nothing went wrong (including the cases where no warning is
   emitted on purpose) and -1 with an exception set otherwise.  If issuing the
   warning raised the warning category itself, that exception is replaced by a
   SyntaxError pointing at the escape. */
static int
warn_invalid_escape_sequence(Parser *p, const char* buffer, const char *first_invalid_escape, Token *t)
{
    // The second parser pass would report the very same escape again,
    // so warnings are only produced on the first pass.
    if (p->call_invalid_rules) {
        return 0;
    }

    const unsigned char c = (unsigned char)*first_invalid_escape;
    const int in_fstring_or_tstring =
        (t->type == FSTRING_MIDDLE || t->type == FSTRING_END
         || t->type == TSTRING_MIDDLE || t->type == TSTRING_END);
    if (in_fstring_or_tstring && (c == '{' || c == '}')) {
        // The tokenizer has already warned about this one, see
        // Parser/tokenizer/helpers.c:warn_invalid_escape_sequence
        return 0;
    }

    // Escapes starting with a digit in '4'..'7' get the "octal" wording,
    // which shows up to three characters of the sequence.
    const int octal = (c >= '4' && c <= '7');
    PyObject *msg;
    if (octal) {
        msg = PyUnicode_FromFormat(
                  "\"\\%.3s\" is an invalid octal escape sequence. "
                  "Such sequences will not work in the future. "
                  "Did you mean \"\\\\%.3s\"? A raw string is also an option.",
                  first_invalid_escape, first_invalid_escape);
    }
    else {
        msg = PyUnicode_FromFormat(
                  "\"\\%c\" is an invalid escape sequence. "
                  "Such sequences will not work in the future. "
                  "Did you mean \"\\\\%c\"? A raw string is also an option.",
                  c, c);
    }
    if (msg == NULL) {
        return -1;
    }

    PyObject *category = (p->feature_version >= 12)
                             ? PyExc_SyntaxWarning
                             : PyExc_DeprecationWarning;

    // Walk from the start of the buffer to the escape, tracking the line
    // and column reached; a newline resets the column.
    int lineno = t->lineno;
    int col_offset = t->col_offset;
    for (const char *cur = buffer; cur < first_invalid_escape; cur++) {
        if (*cur != '\n') {
            col_offset++;
            continue;
        }
        lineno++;
        col_offset = 0;
    }

    // While still on the token's first line, shift the column by the number
    // of opening quote characters found at the very start of the token text.
    if (lineno == t->lineno) {
        const char *tok = PyBytes_AsString(t->bytes);
        char first_quote = 0;
        int quote_count = 0;
        for (int i = 0; i < PyBytes_Size(t->bytes); i++) {
            const char ch = tok[i];
            if (ch != '\'' && ch != '\"') {
                break;
            }
            if (quote_count == 0) {
                first_quote = ch;
            }
            if (ch == first_quote) {
                quote_count++;
            }
        }
        col_offset += quote_count;
    }

    if (PyErr_WarnExplicitObject(category, msg, p->tok->filename,
                                 lineno, NULL, NULL) >= 0) {
        Py_DECREF(msg);
        return 0;
    }

    if (PyErr_ExceptionMatches(category)) {
        /* The warning was turned into an exception: swap it for a
           SyntaxError so the report carries an accurate location. */
        PyErr_Clear();

        /* Without this, _PyPegen_raise_error would take the location from
           p->tokens[p->fill - 1] instead of from the token t. */
        p->known_err_token = t;
        if (octal) {
            RAISE_ERROR_KNOWN_LOCATION(p, PyExc_SyntaxError, lineno, col_offset-1, lineno, col_offset+1,
                "\"\\%.3s\" is an invalid octal escape sequence. "
                "Did you mean \"\\\\%.3s\"? A raw string is also an option.",
                first_invalid_escape, first_invalid_escape);
        }
        else {
            RAISE_ERROR_KNOWN_LOCATION(p, PyExc_SyntaxError, lineno, col_offset-1, lineno, col_offset+1,
                "\"\\%c\" is an invalid escape sequence. "
                "Did you mean \"\\\\%c\"? A raw string is also an option.",
                c, c);
        }
    }
    Py_DECREF(msg);
    return -1;
}

/* Decode the run of bytes with the high bit set that starts at *sPtr and
   stops before `end` (or at the first byte without the high bit).
   On return *sPtr points just past the run; the run itself is handed to
   PyUnicode_DecodeUTF8 and that call's result is returned. */
static PyObject *
decode_utf8(const char **sPtr, const char *end)
{
    const char *const run_start = *sPtr;
    const char *cursor = run_start;

    for (; cursor < end && (*cursor & 0x80) != 0; cursor++) {
        /* skip every byte that has the high bit set */
    }

    *sPtr = cursor;
    return PyUnicode_DecodeUTF8(run_start, cursor - run_start, NULL);
}

/* Decode the `len` bytes at `s` (the body of a non-raw string literal) into
   a str object, processing backslash escapes.

   The input is first rewritten into a temporary bytes buffer in which every
   non-ASCII character is spelled as a "\UXXXXXXXX" escape, and a backslash
   that is followed by a non-ASCII byte (or by the end of the input) is
   spelled as "\u005c".  That buffer is then passed to
   _PyUnicode_DecodeUnicodeEscapeInternal2.

   `t` may be NULL, in which case no invalid-escape warning is issued.
   `parser` is only used when a warning has to be issued.

   Returns a new reference, or NULL with an exception set. */
static PyObject *
decode_unicode_with_escapes(Parser *parser, const char *s, size_t len, Token *t)
{
    PyObject *v;
    PyObject *u;
    char *buf;
    char *p;
    const char *end;

    /* check for integer overflow of the len * 6 allocation below */
    if (len > (size_t)PY_SSIZE_T_MAX / 6) {
        /* Returning NULL without an exception set would surface as a
           SystemError in the caller, so report the overflow explicitly. */
        PyErr_SetString(PyExc_OverflowError, "string to parse is too long");
        return NULL;
    }
    /* "ä" (2 bytes) may become "\U000000E4" (10 bytes), or 1:5
       "\ä" (3 bytes) may become "\u005c\U000000E4" (16 bytes), or ~1:6 */
    u = PyBytes_FromStringAndSize((char *)NULL, (Py_ssize_t)len * 6);
    if (u == NULL) {
        return NULL;
    }
    p = buf = PyBytes_AsString(u);
    if (p == NULL) {
        /* Do not leak the scratch buffer on this error path. */
        Py_DECREF(u);
        return NULL;
    }
    end = s + len;
    while (s < end) {
        if (*s == '\\') {
            *p++ = *s++;
            if (s >= end || *s & 0x80) {
                /* Together with the backslash just copied this spells
                   "\u005c", i.e. a literal backslash. */
                strcpy(p, "u005c");
                p += 5;
                if (s >= end) {
                    break;
                }
            }
        }
        if (*s & 0x80) {
            PyObject *w;
            int kind;
            const void *data;
            Py_ssize_t w_len;
            Py_ssize_t i;
            /* Decode the whole run of non-ASCII bytes; s is advanced past it. */
            w = decode_utf8(&s, end);
            if (w == NULL) {
                Py_DECREF(u);
                return NULL;
            }
            kind = PyUnicode_KIND(w);
            data = PyUnicode_DATA(w);
            w_len = PyUnicode_GET_LENGTH(w);
            for (i = 0; i < w_len; i++) {
                Py_UCS4 chr = PyUnicode_READ(kind, data, i);
                /* Each code point takes exactly 10 bytes: "\U" + 8 hex digits. */
                sprintf(p, "\\U%08x", (unsigned int)chr);
                p += 10;
            }
            /* Should be impossible to overflow */
            assert(p - buf <= PyBytes_GET_SIZE(u));
            Py_DECREF(w);
        }
        else {
            *p++ = *s++;
        }
    }
    /* From here on s/len describe the rewritten buffer, not the input. */
    len = (size_t)(p - buf);
    s = buf;

    /* Initialized defensively so the check below never reads an
       indeterminate value, whatever the decoder does with them. */
    int first_invalid_escape_char = -1;
    const char *first_invalid_escape_ptr = NULL;
    v = _PyUnicode_DecodeUnicodeEscapeInternal2(s, (Py_ssize_t)len, NULL, NULL,
                                                &first_invalid_escape_char,
                                                &first_invalid_escape_ptr);

    // HACK: later we can simply pass the line no, since we don't preserve the tokens
    // when we are decoding the string but we preserve the line numbers.
    if (v != NULL && first_invalid_escape_ptr != NULL && t != NULL) {
        if (warn_invalid_escape_sequence(parser, s, first_invalid_escape_ptr, t) < 0) {
            /* We have not decref u before because first_invalid_escape_ptr
               points inside u. */
            Py_XDECREF(u);
            Py_DECREF(v);
            return NULL;
        }
    }
    Py_XDECREF(u);
    return v;
}

/* Decode the `len` bytes at `s` with _PyBytes_DecodeEscape2 and, when that
   call reports a first invalid escape, warn about it using token `t`.
   Returns the decoded object, or NULL if decoding or the warning failed. */
static PyObject *
decode_bytes_with_escapes(Parser *p, const char *s, Py_ssize_t len, Token *t)
{
    int bad_escape_char;
    const char *bad_escape_ptr;
    PyObject *decoded = _PyBytes_DecodeEscape2(s, len, NULL,
                                               &bad_escape_char,
                                               &bad_escape_ptr);

    if (decoded != NULL
        && bad_escape_ptr != NULL
        && warn_invalid_escape_sequence(p, s, bad_escape_ptr, t) < 0)
    {
        /* The warning failed: drop the decoded object and report failure. */
        Py_DECREF(decoded);
        decoded = NULL;
    }
    return decoded;
}

/* Turn the `len` bytes at `s` into a str object.
   With `raw` set the bytes are decoded as UTF-8 only; otherwise they go
   through decode_unicode_with_escapes, which also receives `p` and `t`. */
PyObject *
_PyPegen_decode_string(Parser *p, int raw, const char *s, size_t len, Token *t)
{
    if (!raw) {
        return decode_unicode_with_escapes(p, s, len, t);
    }
    return PyUnicode_DecodeUTF8Stateful(s, (Py_ssize_t)len, NULL, NULL);
}

/* Decode the string literal held in token `t`.

   The token text must still contain its bracketing quote characters, any
   b/u/r prefix letters and its escape sequences in undecoded form
   (f-strings are handled by the parser).  A literal with a b/B prefix is
   turned into a bytes object; every other literal goes through
   _PyPegen_decode_string.  Returns NULL on failure. */
PyObject *
_PyPegen_parse_string(Parser *p, Token *t)
{
    const char *s = PyBytes_AsString(t->bytes);
    if (s == NULL) {
        return NULL;
    }

    int quote = Py_CHARMASK(*s);
    int bytesmode = 0;
    int rawmode = 0;

    /* Consume prefix letters until something else shows up, or until both
       the bytes and the raw flag have been seen. */
    if (Py_ISALPHA(quote)) {
        bool in_prefix = true;
        while (in_prefix && !(bytesmode && rawmode)) {
            switch (quote) {
            case 'b':
            case 'B':
                bytesmode = 1;
                break;
            case 'r':
            case 'R':
                rawmode = 1;
                break;
            case 'u':
            case 'U':
                break;
            default:
                in_prefix = false;
                continue;
            }
            quote = (unsigned char)*++s;
        }
    }

    if (quote != '\'' && quote != '\"') {
        PyErr_BadInternalCall();
        return NULL;
    }

    /* Step over the opening quote. */
    s++;
    size_t len = strlen(s);
    // gh-120155: 's' contains at least the trailing quote,
    // so decrementing 'len' below is safe.
    assert(len >= 1);

    if (len > INT_MAX) {
        PyErr_SetString(PyExc_OverflowError, "string to parse is too long");
        return NULL;
    }

    /* Drop the closing quote, which has to be the same as the opening one. */
    len--;
    if (s[len] != quote) {
        PyErr_BadInternalCall();
        return NULL;
    }

    const int triple_quoted = (len >= 4 && s[0] == quote && s[1] == quote);
    if (triple_quoted) {
        /* One quote has been removed from each end already; remove the
           other two opening quotes here ... */
        s += 2;
        len -= 2;
        /* ... and make sure two more closing quotes are present before
           removing them as well. */
        if (s[len - 1] != quote || s[len - 2] != quote) {
            PyErr_BadInternalCall();
            return NULL;
        }
        len -= 2;
    }

    /* Without any backslash there is nothing for the escape decoders to do. */
    if (!rawmode && strchr(s, '\\') == NULL) {
        rawmode = 1;
    }

    if (!bytesmode) {
        return _PyPegen_decode_string(p, rawmode, s, len, t);
    }

    /* Bytes literals must not contain non-ASCII characters. */
    for (const char *ch = s; *ch != '\0'; ch++) {
        if (Py_CHARMASK(*ch) >= 0x80) {
            RAISE_SYNTAX_ERROR_KNOWN_LOCATION(
                               t,
                               "bytes can only contain ASCII "
                               "literal characters");
            return NULL;
        }
    }
    return rawmode
               ? PyBytes_FromStringAndSize(s, (Py_ssize_t)len)
               : decode_bytes_with_escapes(p, s, (Py_ssize_t)len, t);
}

Coverage Report

Created: 2025-08-26 06:26

Line	Count	Source (jump to first uncovered line)
1		#include <Python.h>
2		#include "pycore_bytesobject.h" // _PyBytes_DecodeEscape()
3		#include "pycore_unicodeobject.h" // _PyUnicode_DecodeUnicodeEscapeInternal()
4
5		#include "lexer/state.h"
6		#include "pegen.h"
7		#include "string_parser.h"
8
9		#include <stdbool.h>
10
11		//// STRING HANDLING FUNCTIONS ////
12
13		static int
14		warn_invalid_escape_sequence(Parser *p, const char* buffer, const char *first_invalid_escape, Token *t)
15	5.61k	{
16	5.61k	if (p->call_invalid_rules) {
17		// Do not report warnings if we are in the second pass of the parser
18		// to avoid showing the warning twice.
19	2.38k	return 0;
20	2.38k	}
21	3.22k	unsigned char c = (unsigned char)*first_invalid_escape;
22	3.22k	if ((t->type == FSTRING_MIDDLE \|\| t->type == FSTRING_END \|\| t->type == TSTRING_MIDDLE \|\| t->type == TSTRING_END)
23	3.22k	&& (c == '{' \|\| c == '}')) {
24		// in this case the tokenizer has already emitted a warning,
25		// see Parser/tokenizer/helpers.c:warn_invalid_escape_sequence
26	516	return 0;
27	516	}
28
29	2.71k	int octal = ('4' <= c && c <= '7');
30	2.71k	PyObject *msg =
31	2.71k	octal
32	2.71k	? PyUnicode_FromFormat(
33	601	"\"\\%.3s\" is an invalid octal escape sequence. "
34	601	"Such sequences will not work in the future. "
35	601	"Did you mean \"\\\\%.3s\"? A raw string is also an option.",
36	601	first_invalid_escape, first_invalid_escape)
37	2.71k	: PyUnicode_FromFormat(
38	2.11k	"\"\\%c\" is an invalid escape sequence. "
39	2.11k	"Such sequences will not work in the future. "
40	2.11k	"Did you mean \"\\\\%c\"? A raw string is also an option.",
41	2.11k	c, c);
42	2.71k	if (msg == NULL) {
43	0	return -1;
44	0	}
45	2.71k	PyObject *category;
46	2.71k	if (p->feature_version >= 12) {
47	2.71k	category = PyExc_SyntaxWarning;
48	2.71k	}
49	0	else {
50	0	category = PyExc_DeprecationWarning;
51	0	}
52
53		// Calculate the lineno and the col_offset of the invalid escape sequence
54	2.71k	const char *start = buffer;
55	2.71k	const char *end = first_invalid_escape;
56	2.71k	int lineno = t->lineno;
57	2.71k	int col_offset = t->col_offset;
58	37.8k	while (start < end) {
59	35.1k	if (*start == '\n') {
60	881	lineno++;
61	881	col_offset = 0;
62	881	}
63	34.2k	else {
64	34.2k	col_offset++;
65	34.2k	}
66	35.1k	start++;
67	35.1k	}
68
69		// Count the number of quotes in the token
70	2.71k	char first_quote = 0;
71	2.71k	if (lineno == t->lineno) {
72	2.46k	int quote_count = 0;
73	2.46k	char* tok = PyBytes_AsString(t->bytes);
74	4.64k	for (int i = 0; i < PyBytes_Size(t->bytes); i++) {
75	3.89k	if (tok[i] == '\'' \|\| tok[i] == '\"') {
76	2.18k	if (quote_count == 0) {
77	1.78k	first_quote = tok[i];
78	1.78k	}
79	2.18k	if (tok[i] == first_quote) {
80	1.93k	quote_count++;
81	1.93k	}
82	2.18k	} else {
83	1.70k	break;
84	1.70k	}
85	3.89k	}
86
87	2.46k	col_offset += quote_count;
88	2.46k	}
89
90	2.71k	if (PyErr_WarnExplicitObject(category, msg, p->tok->filename,
91	2.71k	lineno, NULL, NULL) < 0) {
92	0	if (PyErr_ExceptionMatches(category)) {
93		/* Replace the Syntax/DeprecationWarning exception with a SyntaxError
94		to get a more accurate error report */
95	0	PyErr_Clear();
96
97		/* This is needed, in order for the SyntaxError to point to the token t,
98		since _PyPegen_raise_error uses p->tokens[p->fill - 1] for the
99		error location, if p->known_err_token is not set. */
100	0	p->known_err_token = t;
101	0	if (octal) {
102	0	RAISE_ERROR_KNOWN_LOCATION(p, PyExc_SyntaxError, lineno, col_offset-1, lineno, col_offset+1,
103	0	"\"\\%.3s\" is an invalid octal escape sequence. "
104	0	"Did you mean \"\\\\%.3s\"? A raw string is also an option.",
105	0	first_invalid_escape, first_invalid_escape);
106	0	}
107	0	else {
108	0	RAISE_ERROR_KNOWN_LOCATION(p, PyExc_SyntaxError, lineno, col_offset-1, lineno, col_offset+1,
109	0	"\"\\%c\" is an invalid escape sequence. "
110	0	"Did you mean \"\\\\%c\"? A raw string is also an option.",
111	0	c, c);
112	0	}
113	0	}
114	0	Py_DECREF(msg);
115	0	return -1;
116	0	}
117	2.71k	Py_DECREF(msg);
118	2.71k	return 0;
119	2.71k	}
120
121		static PyObject *
122		decode_utf8(const char **sPtr, const char *end)
123	7.60k	{
124	7.60k	const char *s;
125	7.60k	const char *t;
126	7.60k	t = s = *sPtr;
127	96.3k	while (s < end && (*s & 0x80)) {
128	88.7k	s++;
129	88.7k	}
130	7.60k	*sPtr = s;
131	7.60k	return PyUnicode_DecodeUTF8(t, s - t, NULL);
132	7.60k	}
133
134		static PyObject *
135		decode_unicode_with_escapes(Parser *parser, const char *s, size_t len, Token *t)
136	32.2k	{
137	32.2k	PyObject *v;
138	32.2k	PyObject *u;
139	32.2k	char *buf;
140	32.2k	char *p;
141	32.2k	const char *end;
142
143		/* check for integer overflow */
144	32.2k	if (len > (size_t)PY_SSIZE_T_MAX / 6) {
145	0	return NULL;
146	0	}
147		/* "ä" (2 bytes) may become "\U000000E4" (10 bytes), or 1:5
148		"\ä" (3 bytes) may become "\u005c\U000000E4" (16 bytes), or ~1:6 */
149	32.2k	u = PyBytes_FromStringAndSize((char *)NULL, (Py_ssize_t)len * 6);
150	32.2k	if (u == NULL) {
151	0	return NULL;
152	0	}
153	32.2k	p = buf = PyBytes_AsString(u);
154	32.2k	if (p == NULL) {
155	0	return NULL;
156	0	}
157	32.2k	end = s + len;
158	278k	while (s < end) {
159	247k	if (*s == '\\') {
160	42.4k	*p++ = *s++;
161	42.4k	if (s >= end \|\| *s & 0x80) {
162	2.08k	strcpy(p, "u005c");
163	2.08k	p += 5;
164	2.08k	if (s >= end) {
165	519	break;
166	519	}
167	2.08k	}
168	42.4k	}
169	246k	if (*s & 0x80) {
170	7.60k	PyObject *w;
171	7.60k	int kind;
172	7.60k	const void *data;
173	7.60k	Py_ssize_t w_len;
174	7.60k	Py_ssize_t i;
175	7.60k	w = decode_utf8(&s, end);
176	7.60k	if (w == NULL) {
177	35	Py_DECREF(u);
178	35	return NULL;
179	35	}
180	7.56k	kind = PyUnicode_KIND(w);
181	7.56k	data = PyUnicode_DATA(w);
182	7.56k	w_len = PyUnicode_GET_LENGTH(w);
183	38.7k	for (i = 0; i < w_len; i++) {
184	31.2k	Py_UCS4 chr = PyUnicode_READ(kind, data, i);
185	31.2k	sprintf(p, "\\U%08x", chr);
186	31.2k	p += 10;
187	31.2k	}
188		/* Should be impossible to overflow */
189	7.56k	assert(p - buf <= PyBytes_GET_SIZE(u));
190	7.56k	Py_DECREF(w);
191	7.56k	}
192	238k	else {
193	238k	*p++ = *s++;
194	238k	}
195	246k	}
196	32.1k	len = (size_t)(p - buf);
197	32.1k	s = buf;
198
199	32.1k	int first_invalid_escape_char;
200	32.1k	const char *first_invalid_escape_ptr;
201	32.1k	v = _PyUnicode_DecodeUnicodeEscapeInternal2(s, (Py_ssize_t)len, NULL, NULL,
202	32.1k	&first_invalid_escape_char,
203	32.1k	&first_invalid_escape_ptr);
204
205		// HACK: later we can simply pass the line no, since we don't preserve the tokens
206		// when we are decoding the string but we preserve the line numbers.
207	32.1k	if (v != NULL && first_invalid_escape_ptr != NULL && t != NULL) {
208	4.73k	if (warn_invalid_escape_sequence(parser, s, first_invalid_escape_ptr, t) < 0) {
209		/* We have not decref u before because first_invalid_escape_ptr
210		points inside u. */
211	0	Py_XDECREF(u);
212	0	Py_DECREF(v);
213	0	return NULL;
214	0	}
215	4.73k	}
216	32.1k	Py_XDECREF(u);
217	32.1k	return v;
218	32.1k	}
219
220		static PyObject *
221		decode_bytes_with_escapes(Parser *p, const char *s, Py_ssize_t len, Token *t)
222	3.07k	{
223	3.07k	int first_invalid_escape_char;
224	3.07k	const char *first_invalid_escape_ptr;
225	3.07k	PyObject *result = _PyBytes_DecodeEscape2(s, len, NULL,
226	3.07k	&first_invalid_escape_char,
227	3.07k	&first_invalid_escape_ptr);
228	3.07k	if (result == NULL) {
229	4	return NULL;
230	4	}
231
232	3.07k	if (first_invalid_escape_ptr != NULL) {
233	872	if (warn_invalid_escape_sequence(p, s, first_invalid_escape_ptr, t) < 0) {
234	0	Py_DECREF(result);
235	0	return NULL;
236	0	}
237	872	}
238	3.07k	return result;
239	3.07k	}
240
241		PyObject *
242		_PyPegen_decode_string(Parser *p, int raw, const char *s, size_t len, Token *t)
243	100k	{
244	100k	if (raw) {
245	68.1k	return PyUnicode_DecodeUTF8Stateful(s, (Py_ssize_t)len, NULL, NULL);
246	68.1k	}
247	32.2k	return decode_unicode_with_escapes(p, s, len, t);
248	100k	}
249
250		/* s must include the bracketing quote characters, and r, b &/or f prefixes
251		(if any), and embedded escape sequences (if any). (f-strings are handled by the parser)
252		_PyPegen_parse_string parses it, and returns the decoded Python string object. */
253		PyObject *
254		_PyPegen_parse_string(Parser *p, Token *t)
255	74.7k	{
256	74.7k	const char *s = PyBytes_AsString(t->bytes);
257	74.7k	if (s == NULL) {
258	0	return NULL;
259	0	}
260
261	74.7k	size_t len;
262	74.7k	int quote = Py_CHARMASK(*s);
263	74.7k	int bytesmode = 0;
264	74.7k	int rawmode = 0;
265
266	74.7k	if (Py_ISALPHA(quote)) {
267	19.8k	while (!bytesmode \|\| !rawmode) {
268	19.2k	if (quote == 'b' \|\| quote == 'B') {
269	8.06k	quote =(unsigned char)*++s;
270	8.06k	bytesmode = 1;
271	8.06k	}
272	11.2k	else if (quote == 'u' \|\| quote == 'U') {
273	1.02k	quote = (unsigned char)*++s;
274	1.02k	}
275	10.2k	else if (quote == 'r' \|\| quote == 'R') {
276	1.13k	quote = (unsigned char)*++s;
277	1.13k	rawmode = 1;
278	1.13k	}
279	9.07k	else {
280	9.07k	break;
281	9.07k	}
282	19.2k	}
283	9.64k	}
284
285	74.7k	if (quote != '\'' && quote != '\"') {
286	1	PyErr_BadInternalCall();
287	1	return NULL;
288	1	}
289
290		/* Skip the leading quote char. */
291	74.7k	s++;
292	74.7k	len = strlen(s);
293		// gh-120155: 's' contains at least the trailing quote,
294		// so the code '--len' below is safe.
295	74.7k	assert(len >= 1);
296
297	74.7k	if (len > INT_MAX) {
298	0	PyErr_SetString(PyExc_OverflowError, "string to parse is too long");
299	0	return NULL;
300	0	}
301	74.7k	if (s[--len] != quote) {
302		/* Last quote char must match the first. */
303	0	PyErr_BadInternalCall();
304	0	return NULL;
305	0	}
306	74.7k	if (len >= 4 && s[0] == quote && s[1] == quote) {
307		/* A triple quoted string. We've already skipped one quote at
308		the start and one at the end of the string. Now skip the
309		two at the start. */
310	2.78k	s += 2;
311	2.78k	len -= 2;
312		/* And check that the last two match. */
313	2.78k	if (s[--len] != quote \|\| s[--len] != quote) {
314	0	PyErr_BadInternalCall();
315	0	return NULL;
316	0	}
317	2.78k	}
318
319		/* Avoid invoking escape decoding routines if possible. */
320	74.7k	rawmode = rawmode \|\| strchr(s, '\\') == NULL;
321	74.7k	if (bytesmode) {
322		/* Disallow non-ASCII characters. */
323	8.06k	const char *ch;
324	104k	for (ch = s; *ch; ch++) {
325	96.4k	if (Py_CHARMASK(*ch) >= 0x80) {
326	6	RAISE_SYNTAX_ERROR_KNOWN_LOCATION(
327	6	t,
328	6	"bytes can only contain ASCII "
329	6	"literal characters");
330	6	return NULL;
331	6	}
332	96.4k	}
333	8.05k	if (rawmode) {
334	4.98k	return PyBytes_FromStringAndSize(s, (Py_ssize_t)len);
335	4.98k	}
336	3.07k	return decode_bytes_with_escapes(p, s, (Py_ssize_t)len, t);
337	8.05k	}
338	66.7k	return _PyPegen_decode_string(p, rawmode, s, len, t);
339	74.7k	}