1"""Input transformer machinery to support IPython special syntax.
2
3This includes the machinery to recognise and transform ``%magic`` commands,
4``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
5
Added: IPython 7.0. Replaces inputsplitter and inputtransformer, which were
deprecated in 7.0 and removed in 9.0.
8"""
9
10# Copyright (c) IPython Development Team.
11# Distributed under the terms of the Modified BSD License.
12
13import ast
14from codeop import CommandCompiler, Compile
15import re
16import sys
17import tokenize
18from typing import List, Tuple, Optional, Any
19import warnings
20from textwrap import dedent
21
22from IPython.utils import tokenutil
23
24_indent_re = re.compile(r'^[ \t]+')
25
26def leading_empty_lines(lines):
27 """Remove leading empty lines
28
29 If the leading lines are empty or contain only whitespace, they will be
30 removed.
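
    For example (an illustrative sketch)::

        leading_empty_lines(["\\n", "  \\n", "x = 1\\n"])
        # -> ["x = 1\\n"]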
31 """
32 if not lines:
33 return lines
34 for i, line in enumerate(lines):
35 if line and not line.isspace():
36 return lines[i:]
37 return lines
38
39def leading_indent(lines):
40 """Remove leading indentation.
41
42 Removes the minimum common leading indentation from all lines.
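
    For example (an illustrative sketch)::

        leading_indent(["    if x:\\n", "        y\\n"])
        # -> ["if x:\\n", "    y\\n"]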
43 """
44 if not lines:
45 return lines
46 return dedent("".join(lines)).splitlines(keepends=True)
47
48class PromptStripper:
49 """Remove matching input prompts from a block of input.
50
51 Parameters
52 ----------
53 prompt_re : regular expression
54 A regular expression matching any input prompt (including continuation,
55 e.g. ``...``)
56 initial_re : regular expression, optional
57 A regular expression matching only the initial prompt, but not continuation.
58 If no initial expression is given, prompt_re will be used everywhere.
59 Used mainly for plain Python prompts (``>>>``), where the continuation prompt
60 ``...`` is a valid Python expression in Python 3, so shouldn't be stripped.
61
62 Notes
63 -----
64
65 If initial_re and prompt_re differ,
66 only initial_re will be tested against the first line.
67 If any prompt is found on the first two lines,
68 prompts will be stripped from the rest of the block.
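
    Examples
    --------
    An illustrative sketch, using the ``classic_prompt`` instance defined
    just below this class::

        classic_prompt([">>> x = 1\\n", "... x += 1\\n"])
        # -> ["x = 1\\n", "x += 1\\n"]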
69 """
70 def __init__(self, prompt_re, initial_re=None):
71 self.prompt_re = prompt_re
72 self.initial_re = initial_re or prompt_re
73
74 def _strip(self, lines):
75 return [self.prompt_re.sub('', l, count=1) for l in lines]
76
77 def __call__(self, lines):
78 if not lines:
79 return lines
80 if self.initial_re.match(lines[0]) or \
81 (len(lines) > 1 and self.prompt_re.match(lines[1])):
82 return self._strip(lines)
83 return lines
84
85classic_prompt = PromptStripper(
86 prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
87 initial_re=re.compile(r'^>>>( |$)')
88)
89
90ipython_prompt = PromptStripper(
91 re.compile(
92 r"""
93 ^( # Match from the beginning of a line, either:
94
95 # 1. First-line prompt:
96 ((\[nav\]|\[ins\])?\ )? # Vi editing mode prompt, if it's there
97 In\ # The 'In' of the prompt, with a space
98 \[\d+\]: # Command index, as displayed in the prompt
99 \ # With a mandatory trailing space
100
101 | # ... or ...
102
103 # 2. The three dots of the multiline prompt
104 \s* # All leading whitespace characters
105 \.{3,}: # The three (or more) dots
106 \ ? # With an optional trailing space
107
108 )
109 """,
110 re.VERBOSE,
111 )
112)
113
114
115def cell_magic(lines):
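    """Rewrite a ``%%magic`` cell into a call to ``run_cell_magic``.

    An illustrative sketch: a cell starting with ``%%timeit -n1`` followed by
    ``x = 1`` is rewritten to roughly::

        get_ipython().run_cell_magic('timeit', '-n1', 'x = 1\\n')
    """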
116 if not lines or not lines[0].startswith('%%'):
117 return lines
118 if re.match(r'%%\w+\?', lines[0]):
119 # This case will be handled by help_end
120 return lines
121 magic_name, _, first_line = lines[0][2:].rstrip().partition(' ')
122 body = ''.join(lines[1:])
123 return ['get_ipython().run_cell_magic(%r, %r, %r)\n'
124 % (magic_name, first_line, body)]
125
126
127def _find_assign_op(token_line) -> Optional[int]:
128 """Get the index of the first assignment in the line ('=' not inside brackets)
129
    Note: We don't try to support multiple special assignments (a = b = %foo).
131 """
132 paren_level = 0
133 for i, ti in enumerate(token_line):
134 s = ti.string
135 if s == '=' and paren_level == 0:
136 return i
137 if s in {'(','[','{'}:
138 paren_level += 1
139 elif s in {')', ']', '}'}:
140 if paren_level > 0:
141 paren_level -= 1
142 return None
143
144def find_end_of_continued_line(lines, start_line: int):
145 """Find the last line of a line explicitly extended using backslashes.
146
147 Uses 0-indexed line numbers.
148 """
149 end_line = start_line
150 while lines[end_line].endswith('\\\n'):
151 end_line += 1
152 if end_line >= len(lines):
153 break
154 return end_line
155
156def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
157 r"""Assemble a single line from multiple continued line pieces
158
159 Continued lines are lines ending in ``\``, and the line following the last
160 ``\`` in the block.
161
162 For example, this code continues over multiple lines::
163
164 if (assign_ix is not None) \
165 and (len(line) >= assign_ix + 2) \
166 and (line[assign_ix+1].string == '%') \
167 and (line[assign_ix+2].type == tokenize.NAME):
168
169 This statement contains four continued line pieces.
170 Assembling these pieces into a single line would give::
171
172 if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...
173
174 This uses 0-indexed line numbers. *start* is (lineno, colno).
175
176 Used to allow ``%magic`` and ``!system`` commands to be continued over
177 multiple lines.
178 """
179 parts = [lines[start[0]][start[1]:]] + lines[start[0]+1:end_line+1]
180 return ' '.join([p.rstrip()[:-1] for p in parts[:-1]] # Strip backslash+newline
181 + [parts[-1].rstrip()]) # Strip newline from last line
182
183class TokenTransformBase:
184 """Base class for transformations which examine tokens.
185
186 Special syntax should not be transformed when it occurs inside strings or
187 comments. This is hard to reliably avoid with regexes. The solution is to
188 tokenise the code as Python, and recognise the special syntax in the tokens.
189
190 IPython's special syntax is not valid Python syntax, so tokenising may go
191 wrong after the special syntax starts. These classes therefore find and
192 transform *one* instance of special syntax at a time into regular Python
193 syntax. After each transformation, tokens are regenerated to find the next
194 piece of special syntax.
195
196 Subclasses need to implement one class method (find)
197 and one regular method (transform).
198
199 The priority attribute can select which transformation to apply if multiple
200 transformers match in the same place. Lower numbers have higher priority.
201 This allows "%magic?" to be turned into a help call rather than a magic call.
202 """
203 # Lower numbers -> higher priority (for matches in the same location)
204 priority = 10
205
206 def sortby(self):
207 return self.start_line, self.start_col, self.priority
208
209 def __init__(self, start):
210 self.start_line = start[0] - 1 # Shift from 1-index to 0-index
211 self.start_col = start[1]
212
213 @classmethod
214 def find(cls, tokens_by_line):
215 """Find one instance of special syntax in the provided tokens.
216
217 Tokens are grouped into logical lines for convenience,
218 so it is easy to e.g. look at the first token of each line.
219 *tokens_by_line* is a list of lists of tokenize.TokenInfo objects.
220
221 This should return an instance of its class, pointing to the start
222 position it has found, or None if it found no match.
223 """
224 raise NotImplementedError
225
226 def transform(self, lines: List[str]):
227 """Transform one instance of special syntax found by ``find()``
228
229 Takes a list of strings representing physical lines,
230 returns a similar list of transformed lines.
231 """
232 raise NotImplementedError
233
234class MagicAssign(TokenTransformBase):
235 """Transformer for assignments from magics (a = %foo)"""
236 @classmethod
237 def find(cls, tokens_by_line):
238 """Find the first magic assignment (a = %foo) in the cell.
239 """
240 for line in tokens_by_line:
241 assign_ix = _find_assign_op(line)
242 if (assign_ix is not None) \
243 and (len(line) >= assign_ix + 2) \
244 and (line[assign_ix+1].string == '%') \
245 and (line[assign_ix+2].type == tokenize.NAME):
246 return cls(line[assign_ix+1].start)
247
248 def transform(self, lines: List[str]):
249 """Transform a magic assignment found by the ``find()`` classmethod.
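
        A rough, illustrative sketch of the rewriting::

            a = %timeit -n1 f()
            # becomes
            a = get_ipython().run_line_magic('timeit', '-n1 f()')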
250 """
251 start_line, start_col = self.start_line, self.start_col
252 lhs = lines[start_line][:start_col]
253 end_line = find_end_of_continued_line(lines, start_line)
254 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
255 assert rhs.startswith('%'), rhs
256 magic_name, _, args = rhs[1:].partition(' ')
257
258 lines_before = lines[:start_line]
259 call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
260 new_line = lhs + call + '\n'
261 lines_after = lines[end_line+1:]
262
263 return lines_before + [new_line] + lines_after
264
265
266class SystemAssign(TokenTransformBase):
267 """Transformer for assignments from system commands (a = !foo)"""
268 @classmethod
269 def find_pre_312(cls, tokens_by_line):
270 for line in tokens_by_line:
271 assign_ix = _find_assign_op(line)
272 if (assign_ix is not None) \
273 and not line[assign_ix].line.strip().startswith('=') \
274 and (len(line) >= assign_ix + 2) \
275 and (line[assign_ix + 1].type == tokenize.ERRORTOKEN):
276 ix = assign_ix + 1
277
278 while ix < len(line) and line[ix].type == tokenize.ERRORTOKEN:
279 if line[ix].string == '!':
280 return cls(line[ix].start)
281 elif not line[ix].string.isspace():
282 break
283 ix += 1
284
285 @classmethod
286 def find_post_312(cls, tokens_by_line):
287 for line in tokens_by_line:
288 assign_ix = _find_assign_op(line)
289 if (
290 (assign_ix is not None)
291 and not line[assign_ix].line.strip().startswith("=")
292 and (len(line) >= assign_ix + 2)
293 and (line[assign_ix + 1].type == tokenize.OP)
294 and (line[assign_ix + 1].string == "!")
295 ):
296 return cls(line[assign_ix + 1].start)
297
298 @classmethod
299 def find(cls, tokens_by_line):
300 """Find the first system assignment (a = !foo) in the cell."""
301 if sys.version_info < (3, 12):
302 return cls.find_pre_312(tokens_by_line)
303 return cls.find_post_312(tokens_by_line)
304
305 def transform(self, lines: List[str]):
306 """Transform a system assignment found by the ``find()`` classmethod.
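
        A rough, illustrative sketch of the rewriting::

            files = !ls
            # becomes
            files = get_ipython().getoutput('ls')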
307 """
308 start_line, start_col = self.start_line, self.start_col
309
310 lhs = lines[start_line][:start_col]
311 end_line = find_end_of_continued_line(lines, start_line)
312 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
313 assert rhs.startswith('!'), rhs
314 cmd = rhs[1:]
315
316 lines_before = lines[:start_line]
317 call = "get_ipython().getoutput({!r})".format(cmd)
318 new_line = lhs + call + '\n'
319 lines_after = lines[end_line + 1:]
320
321 return lines_before + [new_line] + lines_after
322
323# The escape sequences that define the syntax transformations IPython will
324# apply to user input. These can NOT be just changed here: many regular
325# expressions and other parts of the code may use their hardcoded values, and
326# for all intents and purposes they constitute the 'IPython syntax', so they
327# should be considered fixed.
328
329ESC_SHELL = '!' # Send line to underlying system shell
330ESC_SH_CAP = '!!' # Send line to system shell and capture output
331ESC_HELP = '?' # Find information about object
332ESC_HELP2 = '??' # Find extra-detailed information about object
333ESC_MAGIC = '%' # Call magic function
334ESC_MAGIC2 = '%%' # Call cell-magic function
335ESC_QUOTE = ',' # Split args on whitespace, quote each as string and call
336ESC_QUOTE2 = ';' # Quote all args as a single string, call
337ESC_PAREN = '/' # Call first argument with rest of line as arguments
338
339ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
340ESCAPE_DOUBLES = {'!!', '??'} # %% (cell magic) is handled separately
341
342def _make_help_call(target, esc):
343 """Prepares a pinfo(2)/psearch call from a target name and the escape
344 (i.e. ? or ??)"""
345 method = 'pinfo2' if esc == '??' \
346 else 'psearch' if '*' in target \
347 else 'pinfo'
348 arg = " ".join([method, target])
    # Prepare arguments for get_ipython().run_line_magic(magic_name, magic_args)
350 t_magic_name, _, t_magic_arg_s = arg.partition(' ')
351 t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
352 return "get_ipython().run_line_magic(%r, %r)" % (t_magic_name, t_magic_arg_s)
353
354
355def _tr_help(content):
356 """Translate lines escaped with: ?
357
358 A naked help line should fire the intro help screen (shell.show_usage())
359 """
360 if not content:
361 return 'get_ipython().show_usage()'
362
363 return _make_help_call(content, '?')
364
365def _tr_help2(content):
366 """Translate lines escaped with: ??
367
368 A naked help line should fire the intro help screen (shell.show_usage())
369 """
370 if not content:
371 return 'get_ipython().show_usage()'
372
373 return _make_help_call(content, '??')
374
375def _tr_magic(content):
376 "Translate lines escaped with a percent sign: %"
377 name, _, args = content.partition(' ')
378 return 'get_ipython().run_line_magic(%r, %r)' % (name, args)
379
380def _tr_quote(content):
381 "Translate lines escaped with a comma: ,"
382 name, _, args = content.partition(' ')
383 return '%s("%s")' % (name, '", "'.join(args.split()) )
384
385def _tr_quote2(content):
386 "Translate lines escaped with a semicolon: ;"
387 name, _, args = content.partition(' ')
388 return '%s("%s")' % (name, args)
389
390def _tr_paren(content):
391 "Translate lines escaped with a slash: /"
392 name, _, args = content.partition(" ")
393 if name == "":
        raise SyntaxError(f'"{ESC_PAREN}" must be followed by a callable name')
395
396 return '%s(%s)' % (name, ", ".join(args.split()))
397
398tr = { ESC_SHELL : 'get_ipython().system({!r})'.format,
399 ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
400 ESC_HELP : _tr_help,
401 ESC_HELP2 : _tr_help2,
402 ESC_MAGIC : _tr_magic,
403 ESC_QUOTE : _tr_quote,
404 ESC_QUOTE2 : _tr_quote2,
405 ESC_PAREN : _tr_paren }
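
# For orientation, a rough illustrative sketch of how these escapes end up
# being rewritten (not exhaustive):
#
#   !ls         ->  get_ipython().system('ls')
#   !!ls        ->  get_ipython().getoutput('ls')
#   %time f()   ->  get_ipython().run_line_magic('time', 'f()')
#   ,f a b      ->  f("a", "b")
#   ;f a b      ->  f("a b")
#   /f a b      ->  f(a, b)
#   ?obj        ->  get_ipython().run_line_magic('pinfo', 'obj')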
406
407class EscapedCommand(TokenTransformBase):
408 """Transformer for escaped commands like %foo, !foo, or /foo"""
409 @classmethod
410 def find(cls, tokens_by_line):
411 """Find the first escaped command (%foo, !foo, etc.) in the cell.
412 """
413 for line in tokens_by_line:
414 if not line:
415 continue
416 ix = 0
417 ll = len(line)
418 while ll > ix and line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
419 ix += 1
420 if ix >= ll:
421 continue
422 if line[ix].string in ESCAPE_SINGLES:
423 return cls(line[ix].start)
424
425 def transform(self, lines):
426 """Transform an escaped line found by the ``find()`` classmethod.
427 """
428 start_line, start_col = self.start_line, self.start_col
429
430 indent = lines[start_line][:start_col]
431 end_line = find_end_of_continued_line(lines, start_line)
432 line = assemble_continued_line(lines, (start_line, start_col), end_line)
433
434 if len(line) > 1 and line[:2] in ESCAPE_DOUBLES:
435 escape, content = line[:2], line[2:]
436 else:
437 escape, content = line[:1], line[1:]
438
439 if escape in tr:
440 call = tr[escape](content)
441 else:
442 call = ''
443
444 lines_before = lines[:start_line]
445 new_line = indent + call + '\n'
446 lines_after = lines[end_line + 1:]
447
448 return lines_before + [new_line] + lines_after
449
450
451_help_end_re = re.compile(
452 r"""(%{0,2}
453 (?!\d)[\w*]+ # Variable name
454 (\.(?!\d)[\w*]+|\[-?[0-9]+\])* # .etc.etc or [0], we only support literal integers.
455 )
456 (\?\??)$ # ? or ??
457 """,
458 re.VERBOSE,
459)
460
461
462class HelpEnd(TokenTransformBase):
463 """Transformer for help syntax: obj? and obj??"""
464 # This needs to be higher priority (lower number) than EscapedCommand so
465 # that inspecting magics (%foo?) works.
466 priority = 5
467
468 def __init__(self, start, q_locn):
469 super().__init__(start)
470 self.q_line = q_locn[0] - 1 # Shift from 1-indexed to 0-indexed
471 self.q_col = q_locn[1]
472
473 @classmethod
474 def find(cls, tokens_by_line):
475 """Find the first help command (foo?) in the cell.
476 """
477 for line in tokens_by_line:
478 # Last token is NEWLINE; look at last but one
479 if len(line) > 2 and line[-2].string == '?':
480 # Find the first token that's not INDENT/DEDENT
481 ix = 0
482 while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
483 ix += 1
484 return cls(line[ix].start, line[-2].start)
485
486 def transform(self, lines):
487 """Transform a help command found by the ``find()`` classmethod.
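
        A rough, illustrative sketch of the rewriting::

            np.argsort??
            # becomes
            get_ipython().run_line_magic('pinfo2', 'np.argsort')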
488 """
489
490 piece = "".join(lines[self.start_line : self.q_line + 1])
491 indent, content = piece[: self.start_col], piece[self.start_col :]
492 lines_before = lines[: self.start_line]
493 lines_after = lines[self.q_line + 1 :]
494
495 m = _help_end_re.search(content)
496 if not m:
497 raise SyntaxError(content)
498 assert m is not None, content
499 target = m.group(1)
500 esc = m.group(3)
503 call = _make_help_call(target, esc)
504 new_line = indent + call + '\n'
505
506 return lines_before + [new_line] + lines_after
507
def make_tokens_by_line(lines: List[str]):
509 """Tokenize a series of lines and group tokens by line.
510
511 The tokens for a multiline Python string or expression are grouped as one
    line. All lines except the last line should keep their line ending ('\\n',
    '\\r\\n') for this to work properly. Use `.splitlines(keepends=True)`, for
    example, when passing a block of text to this function.
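
    For example (an illustrative sketch)::

        make_tokens_by_line(["a = (1 +\\n", "2)\\n", "b = 3\\n"])

    groups the tokens of the first two physical lines into one logical line
    (because of the open parenthesis), separate from the tokens of ``b = 3``.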
515
516 """
517 # NL tokens are used inside multiline expressions, but also after blank
518 # lines or comments. This is intentional - see https://bugs.python.org/issue17061
519 # We want to group the former case together but split the latter, so we
520 # track parentheses level, similar to the internals of tokenize.
521
522 # reexported from token on 3.7+
523 NEWLINE, NL = tokenize.NEWLINE, tokenize.NL # type: ignore
524 tokens_by_line: List[List[Any]] = [[]]
525 if len(lines) > 1 and not lines[0].endswith(("\n", "\r", "\r\n", "\x0b", "\x0c")):
526 warnings.warn(
527 "`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified",
528 stacklevel=2,
529 )
530 parenlev = 0
531 try:
532 for token in tokenutil.generate_tokens_catch_errors(
533 iter(lines).__next__, extra_errors_to_catch=["expected EOF"]
534 ):
535 tokens_by_line[-1].append(token)
536 if (token.type == NEWLINE) \
537 or ((token.type == NL) and (parenlev <= 0)):
538 tokens_by_line.append([])
539 elif token.string in {'(', '[', '{'}:
540 parenlev += 1
541 elif token.string in {')', ']', '}'}:
542 if parenlev > 0:
543 parenlev -= 1
544 except tokenize.TokenError:
545 # Input ended in a multiline string or expression. That's OK for us.
546 pass
547
549 if not tokens_by_line[-1]:
550 tokens_by_line.pop()
551
553 return tokens_by_line
554
555
556def has_sunken_brackets(tokens: List[tokenize.TokenInfo]):
557 """Check if the depth of brackets in the list of tokens drops below 0"""
558 parenlev = 0
559 for token in tokens:
560 if token.string in {"(", "[", "{"}:
561 parenlev += 1
562 elif token.string in {")", "]", "}"}:
563 parenlev -= 1
564 if parenlev < 0:
565 return True
566 return False
567
568# Arbitrary limit to prevent getting stuck in infinite loops
569TRANSFORM_LOOP_LIMIT = 500
570
571class TransformerManager:
572 """Applies various transformations to a cell or code block.
573
574 The key methods for external use are ``transform_cell()``
575 and ``check_complete()``.
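
    For example, an illustrative sketch of a whole-cell rewrite::

        TransformerManager().transform_cell("%time x = 1\\n")
        # -> "get_ipython().run_line_magic('time', 'x = 1')\\n"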
576 """
577 def __init__(self):
578 self.cleanup_transforms = [
579 leading_empty_lines,
580 leading_indent,
581 classic_prompt,
582 ipython_prompt,
583 ]
584 self.line_transforms = [
585 cell_magic,
586 ]
587 self.token_transformers = [
588 MagicAssign,
589 SystemAssign,
590 EscapedCommand,
591 HelpEnd,
592 ]
593
594 def do_one_token_transform(self, lines):
595 """Find and run the transform earliest in the code.
596
597 Returns (changed, lines).
598
599 This method is called repeatedly until changed is False, indicating
600 that all available transformations are complete.
601
602 The tokens following IPython special syntax might not be valid, so
603 the transformed code is retokenised every time to identify the next
604 piece of special syntax. Hopefully long code cells are mostly valid
605 Python, not using lots of IPython special syntax, so this shouldn't be
606 a performance issue.
607 """
608 tokens_by_line = make_tokens_by_line(lines)
609 candidates = []
610 for transformer_cls in self.token_transformers:
611 transformer = transformer_cls.find(tokens_by_line)
612 if transformer:
613 candidates.append(transformer)
614
615 if not candidates:
616 # Nothing to transform
617 return False, lines
618 ordered_transformers = sorted(candidates, key=TokenTransformBase.sortby)
619 for transformer in ordered_transformers:
620 try:
621 return True, transformer.transform(lines)
622 except SyntaxError:
623 pass
624 return False, lines
625
626 def do_token_transforms(self, lines):
627 for _ in range(TRANSFORM_LOOP_LIMIT):
628 changed, lines = self.do_one_token_transform(lines)
629 if not changed:
630 return lines
631
632 raise RuntimeError("Input transformation still changing after "
633 "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)
634
635 def transform_cell(self, cell: str) -> str:
636 """Transforms a cell of input code"""
637 if not cell.endswith('\n'):
638 cell += '\n' # Ensure the cell has a trailing newline
639 lines = cell.splitlines(keepends=True)
640 for transform in self.cleanup_transforms + self.line_transforms:
641 lines = transform(lines)
642
643 lines = self.do_token_transforms(lines)
644 return ''.join(lines)
645
646 def check_complete(self, cell: str):
647 """Return whether a block of code is ready to execute, or should be continued
648
649 Parameters
650 ----------
651 cell : string
652 Python input code, which can be multiline.
653
654 Returns
655 -------
656 status : str
            One of 'complete', 'incomplete', or 'invalid'; 'invalid' means the
            source is not a prefix of valid code.
659 indent_spaces : int or None
660 The number of spaces by which to indent the next line of code. If
661 status is not 'incomplete', this is None.
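
        Examples
        --------
        An illustrative sketch (indicative results, not meant as doctests)::

            TransformerManager().check_complete("x = 1")
            # -> ('complete', None)
            TransformerManager().check_complete("for a in range(5):")
            # -> ('incomplete', 4)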
662 """
        # Remember whether the cell ends in a newline.
664 ends_with_newline = False
665 for character in reversed(cell):
666 if character == '\n':
667 ends_with_newline = True
668 break
669 elif character.strip():
670 break
671 else:
672 continue
673
674 if not ends_with_newline:
            # Append a newline for consistent tokenization
676 # See https://bugs.python.org/issue33899
677 cell += '\n'
678
679 lines = cell.splitlines(keepends=True)
680
681 if not lines:
682 return 'complete', None
683
684 for line in reversed(lines):
685 if not line.strip():
686 continue
687 elif line.strip("\n").endswith("\\"):
688 return "incomplete", find_last_indent(lines)
689 else:
690 break
691
692 try:
693 for transform in self.cleanup_transforms:
694 if not getattr(transform, 'has_side_effects', False):
695 lines = transform(lines)
696 except SyntaxError:
697 return 'invalid', None
698
699 if lines[0].startswith('%%'):
700 # Special case for cell magics - completion marked by blank line
701 if lines[-1].strip():
702 return 'incomplete', find_last_indent(lines)
703 else:
704 return 'complete', None
705
706 try:
707 for transform in self.line_transforms:
708 if not getattr(transform, 'has_side_effects', False):
709 lines = transform(lines)
710 lines = self.do_token_transforms(lines)
711 except SyntaxError:
712 return 'invalid', None
713
714 tokens_by_line = make_tokens_by_line(lines)
715
        # Bail if we got one line and there are more closing brackets than
        # opening ones
718 if (
719 len(lines) == 1
720 and tokens_by_line
721 and has_sunken_brackets(tokens_by_line[0])
722 ):
723 return "invalid", None
724
725 if not tokens_by_line:
726 return 'incomplete', find_last_indent(lines)
727
728 if (
729 tokens_by_line[-1][-1].type != tokenize.ENDMARKER
730 and tokens_by_line[-1][-1].type != tokenize.ERRORTOKEN
731 ):
732 # We're in a multiline string or expression
733 return 'incomplete', find_last_indent(lines)
734
735 newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER} # type: ignore
736
737 # Pop the last line which only contains DEDENTs and ENDMARKER
738 last_token_line = None
739 if {t.type for t in tokens_by_line[-1]} in [
740 {tokenize.DEDENT, tokenize.ENDMARKER},
741 {tokenize.ENDMARKER}
742 ] and len(tokens_by_line) > 1:
743 last_token_line = tokens_by_line.pop()
744
745 while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
746 tokens_by_line[-1].pop()
747
748 if not tokens_by_line[-1]:
749 return 'incomplete', find_last_indent(lines)
750
751 if tokens_by_line[-1][-1].string == ':':
752 # The last line starts a block (e.g. 'if foo:')
753 ix = 0
754 while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
755 ix += 1
756
757 indent = tokens_by_line[-1][ix].start[1]
758 return 'incomplete', indent + 4
759
760 if tokens_by_line[-1][0].line.endswith('\\'):
761 return 'incomplete', None
762
763 # At this point, our checks think the code is complete (or invalid).
764 # We'll use codeop.compile_command to check this with the real parser
765 try:
766 with warnings.catch_warnings():
767 warnings.simplefilter('error', SyntaxWarning)
768 res = compile_command(''.join(lines), symbol='exec')
769 except (SyntaxError, OverflowError, ValueError, TypeError,
770 MemoryError, SyntaxWarning):
771 return 'invalid', None
772 else:
773 if res is None:
774 return 'incomplete', find_last_indent(lines)
775
776 if last_token_line and last_token_line[0].type == tokenize.DEDENT:
777 if ends_with_newline:
778 return 'complete', None
779 return 'incomplete', find_last_indent(lines)
780
        # If we get this far the code looks complete; a trailing blank line
        # also means we're ready to execute.
        return 'complete', None
786
787
788def find_last_indent(lines):
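    """Return the indentation of the last line, counting a tab as 4 spaces."""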
789 m = _indent_re.match(lines[-1])
790 if not m:
791 return 0
792 return len(m.group(0).replace('\t', ' '*4))
793
794
795class MaybeAsyncCompile(Compile):
796 def __init__(self, extra_flags=0):
797 super().__init__()
798 self.flags |= extra_flags
799
800
801class MaybeAsyncCommandCompiler(CommandCompiler):
802 def __init__(self, extra_flags=0):
803 self.compiler = MaybeAsyncCompile(extra_flags=extra_flags)
804
805
806_extra_flags = ast.PyCF_ALLOW_TOP_LEVEL_AWAIT
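# PyCF_ALLOW_TOP_LEVEL_AWAIT lets compile_command accept top-level ``await``,
# so check_complete() reports such input as complete rather than invalid.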
807
808compile_command = MaybeAsyncCommandCompiler(extra_flags=_extra_flags)