# Copyright 2016 Grist Labs, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import ast
import collections
import io
import sys
import token
import tokenize
from abc import ABCMeta
from ast import Module, expr, AST
from functools import lru_cache
from typing import (
  Callable,
  Dict,
  Iterable,
  Iterator,
  List,
  Optional,
  Tuple,
  Union,
  cast,
  Any,
  TYPE_CHECKING,
  Type,
)

if TYPE_CHECKING:  # pragma: no cover
  from .astroid_compat import NodeNG

  # Type class used to expand out the definition of AST to include fields added by this library
  # It's not actually used for anything other than type checking though!
  class EnhancedAST(AST):
    # Additional attributes set by mark_tokens
    first_token = None  # type: Token
    last_token = None  # type: Token
    lineno = 0  # type: int
    end_lineno = 0  # type: int
    end_col_offset = 0  # type: int

  AstNode = Union[EnhancedAST, NodeNG]

  TokenInfo = tokenize.TokenInfo


def token_repr(tok_type, string):
  # type: (int, Optional[str]) -> str
  """Returns a human-friendly representation of a token with the given type and string."""
  # repr() prefixes unicode with 'u' on Python2 but not Python3; strip it out for consistency.
  return '%s:%s' % (token.tok_name[tok_type], repr(string).lstrip('u'))
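
# Illustrative doctest-style example (added for clarity; not part of the
# original module), showing the formatting produced by token_repr():
#   >>> token_repr(token.OP, '(')
#   "OP:'('"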


class Token(collections.namedtuple('Token', 'type string start end line index startpos endpos')):
  """
  Token is an 8-tuple containing the same 5 fields as the tokens produced by the tokenize
  module, and 3 additional ones useful for this module:

  - [0] .type     Token type (see token.py)
  - [1] .string   Token (a string)
  - [2] .start    Starting (row, column) indices of the token (a 2-tuple of ints)
  - [3] .end      Ending (row, column) indices of the token (a 2-tuple of ints)
  - [4] .line     Original line (string)
  - [5] .index    Index of the token in the list of tokens that it belongs to.
  - [6] .startpos Starting character offset into the input text.
  - [7] .endpos   Ending character offset into the input text.
  """
  def __str__(self):
    # type: () -> str
    return token_repr(self.type, self.string)
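
# Illustrative example (not part of the original module): construct a Token by
# hand and show its str() form, which delegates to token_repr():
#   >>> tok = Token(token.NAME, 'x', (1, 0), (1, 1), 'x = 1\n', 0, 0, 1)
#   >>> str(tok)
#   "NAME:'x'"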


def match_token(token, tok_type, tok_str=None):
  # type: (Token, int, Optional[str]) -> bool
  """Returns true if token is of the given type and, if a string is given, has that string."""
  return token.type == tok_type and (tok_str is None or token.string == tok_str)


def expect_token(token, tok_type, tok_str=None):
  # type: (Token, int, Optional[str]) -> None
  """
  Verifies that the given token is of the expected type. If tok_str is given, the token string
  is verified too. If the token doesn't match, raises an informative ValueError.
  """
  if not match_token(token, tok_type, tok_str):
    raise ValueError("Expected token %s, got %s on line %s col %s" % (
      token_repr(tok_type, tok_str), str(token),
      token.start[0], token.start[1] + 1))
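
# Illustrative example (not part of the original module):
#   >>> tok = Token(token.OP, '(', (1, 3), (1, 4), 'foo(x)\n', 2, 3, 4)
#   >>> match_token(tok, token.OP, '(')
#   True
#   >>> expect_token(tok, token.NAME)  # raises an informative ValueError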


def is_non_coding_token(token_type):
  # type: (int) -> bool
  """
  These are considered non-coding tokens, as they don't affect the syntax tree.
  """
  return token_type in (token.NL, token.COMMENT, token.ENCODING)


def generate_tokens(text):
  # type: (str) -> Iterator[TokenInfo]
  """
  Generates standard library tokens for the given code.
  """
  # tokenize.generate_tokens is technically an undocumented API for Python3, but allows us to use
  # the same API as for Python2. See https://stackoverflow.com/a/4952291/328565.
  # FIXME: Remove cast once https://github.com/python/typeshed/issues/7003 gets fixed
  return tokenize.generate_tokens(cast(Callable[[], str], io.StringIO(text).readline))
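
# Illustrative example (not part of the original module):
#   >>> [tok.string for tok in generate_tokens("x = 1\n")]
#   ['x', '=', '1', '\n', '']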


def iter_children_func(node):
  # type: (AST) -> Callable
  """
  Returns a function which yields all direct children of an AST node,
  skipping children that are singleton nodes.
  The function depends on whether ``node`` is from ``ast`` or from the ``astroid`` module.
  """
  return iter_children_astroid if hasattr(node, 'get_children') else iter_children_ast


def iter_children_astroid(node, include_joined_str=False):
  # type: (NodeNG, bool) -> Union[Iterator, List]
  if not include_joined_str and is_joined_str(node):
    return []

  return node.get_children()


SINGLETONS = {c for n, c in ast.__dict__.items() if isinstance(c, type) and
              issubclass(c, (ast.expr_context, ast.boolop, ast.operator, ast.unaryop, ast.cmpop))}


def iter_children_ast(node, include_joined_str=False):
  # type: (AST, bool) -> Iterator[Union[AST, expr]]
  if not include_joined_str and is_joined_str(node):
    return

  if isinstance(node, ast.Dict):
    # override the iteration order: instead of <all keys>, <all values>,
    # yield keys and values in source order (key1, value1, key2, value2, ...)
    for (key, value) in zip(node.keys, node.values):
      if key is not None:
        yield key
      yield value
    return

  for child in ast.iter_child_nodes(node):
    # Skip singleton children; they don't reflect particular positions in the code and break the
    # assumptions about the tree consisting of distinct nodes. Note that collecting classes
    # beforehand and checking them in a set is faster than using isinstance each time.
    if child.__class__ not in SINGLETONS:
      yield child
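
# Illustrative example (not part of the original module): dict children come out
# in source order, and a None key (from `**` unpacking) is skipped:
#   >>> node = ast.parse("{'a': 1, **rest}").body[0].value
#   >>> [type(c).__name__ for c in iter_children_ast(node)]
#   ['Constant', 'Constant', 'Name']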


stmt_class_names = {n for n, c in ast.__dict__.items()
                    if isinstance(c, type) and issubclass(c, ast.stmt)}
expr_class_names = ({n for n, c in ast.__dict__.items()
                     if isinstance(c, type) and issubclass(c, ast.expr)} |
                    {'AssignName', 'DelName', 'Const', 'AssignAttr', 'DelAttr'})


# These feel hacky compared to isinstance() but allow us to work with both ast and astroid nodes
# in the same way, and without even importing astroid.
def is_expr(node):
  # type: (AstNode) -> bool
  """Returns whether node is an expression node."""
  return node.__class__.__name__ in expr_class_names


def is_stmt(node):
  # type: (AstNode) -> bool
  """Returns whether node is a statement node."""
  return node.__class__.__name__ in stmt_class_names


def is_module(node):
  # type: (AstNode) -> bool
  """Returns whether node is a module node."""
  return node.__class__.__name__ == 'Module'


def is_joined_str(node):
  # type: (AstNode) -> bool
  """Returns whether node is a JoinedStr node, used to represent f-strings."""
  # At the moment, nodes below JoinedStr have wrong line/col info, and trying to process them only
  # leads to errors.
  return node.__class__.__name__ == 'JoinedStr'


def is_expr_stmt(node):
  # type: (AstNode) -> bool
  """Returns whether node is an `Expr` node, which is a statement that is an expression."""
  return node.__class__.__name__ == 'Expr'


CONSTANT_CLASSES: Tuple[Type, ...] = (ast.Constant,)
try:
  from astroid.nodes import Const
  CONSTANT_CLASSES += (Const,)
except ImportError:  # pragma: no cover
  # astroid is not available
  pass


def is_constant(node):
  # type: (AstNode) -> bool
  """Returns whether node is a Constant node."""
  return isinstance(node, CONSTANT_CLASSES)


def is_ellipsis(node):
  # type: (AstNode) -> bool
  """Returns whether node is an Ellipsis node."""
  return is_constant(node) and node.value is Ellipsis  # type: ignore


def is_starred(node):
  # type: (AstNode) -> bool
  """Returns whether node is a starred expression node."""
  return node.__class__.__name__ == 'Starred'


def is_slice(node):
  # type: (AstNode) -> bool
  """Returns whether node represents a slice, e.g. `1:2` in `x[1:2]`"""
  # Before 3.9, a tuple containing a slice is an ExtSlice,
  # but this was removed in https://bugs.python.org/issue34822
  return (
    node.__class__.__name__ in ('Slice', 'ExtSlice')
    or (
      node.__class__.__name__ == 'Tuple'
      and any(map(is_slice, cast(ast.Tuple, node).elts))
    )
  )


def is_empty_astroid_slice(node):
  # type: (AstNode) -> bool
  return (
    node.__class__.__name__ == "Slice"
    and not isinstance(node, ast.AST)
    and node.lower is node.upper is node.step is None
  )


# Sentinel value used by visit_tree().
_PREVISIT = object()


def visit_tree(node, previsit, postvisit):
  # type: (Module, Callable[[AstNode, Optional[Token]], Tuple[Optional[Token], Optional[Token]]], Optional[Callable[[AstNode, Optional[Token], Optional[Token]], None]]) -> None
  """
  Scans the tree under the node depth-first using an explicit stack. It avoids implicit recursion
  via the function call stack to avoid hitting 'maximum recursion depth exceeded' error.

  It calls ``previsit()`` and ``postvisit()`` as follows:

  * ``previsit(node, par_value)`` - should return ``(par_value, value)``
    ``par_value`` is as returned from ``previsit()`` of the parent.

  * ``postvisit(node, par_value, value)`` - should return ``value``
    ``par_value`` is as returned from ``previsit()`` of the parent, and ``value`` is as
    returned from ``previsit()`` of this node itself. The return ``value`` is ignored except
    the one for the root node, which is returned from the overall ``visit_tree()`` call.

  For the initial node, ``par_value`` is None. ``postvisit`` may be None.
  """
  if not postvisit:
    postvisit = lambda node, pvalue, value: None

  iter_children = iter_children_func(node)
  done = set()
  ret = None
  stack = [(node, None, _PREVISIT)]  # type: List[Tuple[AstNode, Optional[Token], Union[Optional[Token], object]]]
  while stack:
    current, par_value, value = stack.pop()
    if value is _PREVISIT:
      assert current not in done  # protect against infinite loop in case of a bad tree.
      done.add(current)

      pvalue, post_value = previsit(current, par_value)
      stack.append((current, par_value, post_value))

      # Insert all children in reverse order (so that first child ends up on top of the stack).
      ins = len(stack)
      for n in iter_children(current):
        stack.insert(ins, (n, pvalue, _PREVISIT))
    else:
      ret = postvisit(current, par_value, cast(Optional[Token], value))
  return ret
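
# Illustrative sketch (not part of the original module): thread a depth value
# from parent to child via par_value; previsit returns (value-for-children,
# value-passed-to-postvisit):
#   depths = []
#   def previsit(node, par_value):
#     depth = 0 if par_value is None else par_value + 1
#     depths.append((type(node).__name__, depth))
#     return (depth, None)
#   visit_tree(ast.parse("x = 1"), previsit, None)
#   # depths == [('Module', 0), ('Assign', 1), ('Name', 2), ('Constant', 2)]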


def walk(node, include_joined_str=False):
  # type: (AST, bool) -> Iterator[Union[Module, AstNode]]
  """
  Recursively yield all descendant nodes in the tree starting at ``node`` (including ``node``
  itself), using depth-first pre-order traversal (yielding parents before their children).

  This is similar to ``ast.walk()``, but with a different order, and it works for both ``ast`` and
  ``astroid`` trees. Also, like ``iter_children()``, it skips singleton nodes generated by ``ast``.

  By default, ``JoinedStr`` (f-string) nodes and their contents are skipped
  because they previously couldn't be handled. Set ``include_joined_str`` to True to include them.
  """
  iter_children = iter_children_func(node)
  done = set()
  stack = [node]
  while stack:
    current = stack.pop()
    assert current not in done  # protect against infinite loop in case of a bad tree.
    done.add(current)

    yield current

    # Insert all children in reverse order (so that first child ends up on top of the stack).
    # This is faster than building a list and reversing it.
    ins = len(stack)
    for c in iter_children(current, include_joined_str):
      stack.insert(ins, c)
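
# Illustrative example (not part of the original module): pre-order traversal,
# with singleton context nodes (e.g. Store) omitted:
#   >>> [type(n).__name__ for n in walk(ast.parse("x = 1"))]
#   ['Module', 'Assign', 'Name', 'Constant']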


def replace(text, replacements):
  # type: (str, List[Tuple[int, int, str]]) -> str
  """
  Replaces multiple slices of text with new values. This is a convenience method for making code
  modifications of ranges e.g. as identified by ``ASTTokens.get_text_range(node)``. Replacements is
  an iterable of ``(start, end, new_text)`` tuples.

  For example, ``replace("this is a test", [(0, 4, "X"), (8, 9, "THE")])`` produces
  ``"X is THE test"``.
  """
  p = 0
  parts = []
  for (start, end, new_text) in sorted(replacements):
    parts.append(text[p:start])
    parts.append(new_text)
    p = end
  parts.append(text[p:])
  return ''.join(parts)


class NodeMethods:
  """
  Helper to get `visit_{node_type}` methods given a node's class and cache the results.
  """
  def __init__(self):
    # type: () -> None
    self._cache = {}  # type: Dict[Union[ABCMeta, type], Callable[[AstNode, Token, Token], Tuple[Token, Token]]]

  def get(self, obj, cls):
    # type: (Any, Union[ABCMeta, type]) -> Callable
    """
    Using the lowercase name of the class as node_type, returns `obj.visit_{node_type}`,
    or `obj.visit_default` if the type-specific method is not found.
    """
    method = self._cache.get(cls)
    if not method:
      name = "visit_" + cls.__name__.lower()
      method = getattr(obj, name, obj.visit_default)
      self._cache[cls] = method
    return method
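
# Illustrative sketch (not part of the original module; MyVisitor is a
# hypothetical class, named only for this example):
#   class MyVisitor:
#     def visit_name(self, node, first, last): ...
#     def visit_default(self, node, first, last): ...
#   methods = NodeMethods()
#   methods.get(MyVisitor(), ast.Name)    # -> bound visit_name method
#   methods.get(MyVisitor(), ast.Assign)  # -> visit_default (no visit_assign defined)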


def patched_generate_tokens(original_tokens):
  # type: (Iterable[TokenInfo]) -> Iterator[TokenInfo]
  """
  Fixes tokens yielded by `tokenize.generate_tokens` to handle more non-ASCII characters in identifiers.
  Workaround for https://github.com/python/cpython/issues/68382.
  Should only be used when tokenizing a string that is known to be valid syntax,
  because it assumes that error tokens are not actually errors.
  Combines groups of consecutive NAME, NUMBER, and/or ERRORTOKEN tokens into a single NAME token.
  """
  group = []  # type: List[tokenize.TokenInfo]
  for tok in original_tokens:
    if (
      tok.type in (tokenize.NAME, tokenize.ERRORTOKEN, tokenize.NUMBER)
      # Only combine tokens if they have no whitespace in between
      and (not group or group[-1].end == tok.start)
    ):
      group.append(tok)
    else:
      for combined_token in combine_tokens(group):
        yield combined_token
      group = []
      yield tok
  for combined_token in combine_tokens(group):
    yield combined_token


def combine_tokens(group):
  # type: (List[tokenize.TokenInfo]) -> List[tokenize.TokenInfo]
  if not any(tok.type == tokenize.ERRORTOKEN for tok in group) or len({tok.line for tok in group}) != 1:
    return group
  return [
    tokenize.TokenInfo(
      type=tokenize.NAME,
      string="".join(t.string for t in group),
      start=group[0].start,
      end=group[-1].end,
      line=group[0].line,
    )
  ]
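
# Illustrative mechanics (not part of the original module; the tokens below are
# synthetic, standing in for an identifier the stdlib tokenizer split incorrectly):
#   line = 'foo\u0300bar = 1\n'
#   group = [
#     tokenize.TokenInfo(tokenize.NAME, 'foo', (1, 0), (1, 3), line),
#     tokenize.TokenInfo(tokenize.ERRORTOKEN, '\u0300', (1, 3), (1, 4), line),
#     tokenize.TokenInfo(tokenize.NAME, 'bar', (1, 4), (1, 7), line),
#   ]
#   combine_tokens(group)  # -> [one NAME token 'foo\u0300bar' spanning (1, 0)-(1, 7)]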


def last_stmt(node):
  # type: (AstNode) -> AstNode
  """
  If the given AST node contains multiple statements, return the last one.
  Otherwise, just return the node.
  """
  child_stmts = [
    child for child in iter_children_func(node)(node)
    if is_stmt(child) or type(child).__name__ in (
      "excepthandler",
      "ExceptHandler",
      "match_case",
      "MatchCase",
      "TryExcept",
      "TryFinally",
    )
  ]
  if child_stmts:
    return last_stmt(child_stmts[-1])
  return node
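
# Illustrative example (not part of the original module):
#   >>> tree = ast.parse("if x:\n  a = 1\n  b = 2")
#   >>> last_stmt(tree).lineno  # the `b = 2` Assign node
#   3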


@lru_cache(maxsize=None)
def fstring_positions_work():
  # type: () -> bool
  """
  The positions attached to nodes inside f-string FormattedValues have some bugs
  that were fixed in Python 3.9.7 in https://github.com/python/cpython/pull/27729.
  This checks for those bugs more concretely without relying on the Python version.
  Specifically this checks:
   - Values with a format spec or conversion
   - Repeated (i.e. identical-looking) expressions
   - f-strings implicitly concatenated over multiple lines
   - Multiline, triple-quoted f-strings
  """
  source = """(
    f"a {b}{b} c {d!r} e {f:g} h {i:{j}} k {l:{m:n}}"
    f"a {b}{b} c {d!r} e {f:g} h {i:{j}} k {l:{m:n}}"
    f"{x + y + z} {x} {y} {z} {z} {z!a} {z:z}"
    f'''
    {s} {t}
    {u} {v}
    '''
  )"""
  tree = ast.parse(source)
  name_nodes = [node for node in ast.walk(tree) if isinstance(node, ast.Name)]
  name_positions = [(node.lineno, node.col_offset) for node in name_nodes]
  positions_are_unique = len(set(name_positions)) == len(name_positions)
  correct_source_segments = all(
    ast.get_source_segment(source, node) == node.id
    for node in name_nodes
  )
  return positions_are_unique and correct_source_segments


def annotate_fstring_nodes(tree):
  # type: (ast.AST) -> None
  """
  Add a special attribute `_broken_positions` to nodes inside f-strings
  if the lineno/col_offset cannot be trusted.
  """
  if sys.version_info >= (3, 12):
    # f-strings were weirdly implemented until https://peps.python.org/pep-0701/
    # In Python 3.12, inner nodes have sensible positions.
    return
  for joinedstr in walk(tree, include_joined_str=True):
    if not isinstance(joinedstr, ast.JoinedStr):
      continue
    for part in joinedstr.values:
      # The ast positions of the FormattedValues/Constant nodes span the full f-string, which is weird.
      setattr(part, '_broken_positions', True)  # use setattr for mypy

      if isinstance(part, ast.FormattedValue):
        if not fstring_positions_work():
          for child in walk(part.value):
            setattr(child, '_broken_positions', True)

        if part.format_spec:  # this is another JoinedStr
          # Again, the standard positions span the full f-string.
          setattr(part.format_spec, '_broken_positions', True)
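
# Illustrative usage (not part of the original module; a no-op on Python >= 3.12):
#   tree = ast.parse('f"{x:{y}}"')
#   annotate_fstring_nodes(tree)
#   # On older versions, nodes inside the f-string now carry `_broken_positions`.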