1"""Input transformer machinery to support IPython special syntax.
2
3This includes the machinery to recognise and transform ``%magic`` commands,
4``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
5
Added: IPython 7.0. Replaces ``inputsplitter`` and ``inputtransformer``, which
were deprecated in 7.0 and removed in 9.0.
8"""
9
10# Copyright (c) IPython Development Team.
11# Distributed under the terms of the Modified BSD License.
12
13import ast
14from codeop import CommandCompiler, Compile
15import re
16import sys
17import tokenize
18from typing import List, Tuple, Optional, Any
19import warnings
20from textwrap import dedent
21
22from IPython.utils import tokenutil
23
24_indent_re = re.compile(r'^[ \t]+')
25
26def leading_empty_lines(lines):
27 """Remove leading empty lines
28
29 If the leading lines are empty or contain only whitespace, they will be
30 removed.
31 """
32 if not lines:
33 return lines
34 for i, line in enumerate(lines):
35 if line and not line.isspace():
36 return lines[i:]
37 return lines
38
39def leading_indent(lines):
40 """Remove leading indentation.
41
42 Removes the minimum common leading indentation from all lines.
43 """
44 if not lines:
45 return lines
46 return dedent("".join(lines)).splitlines(keepends=True)
47
48class PromptStripper:
49 """Remove matching input prompts from a block of input.
50
51 Parameters
52 ----------
53 prompt_re : regular expression
54 A regular expression matching any input prompt (including continuation,
55 e.g. ``...``)
56 initial_re : regular expression, optional
57 A regular expression matching only the initial prompt, but not continuation.
58 If no initial expression is given, prompt_re will be used everywhere.
59 Used mainly for plain Python prompts (``>>>``), where the continuation prompt
        ``...`` is a valid Python expression in Python 3, so it shouldn't be stripped.
61
62 Notes
63 -----
64
65 If initial_re and prompt_re differ,
66 only initial_re will be tested against the first line.
67 If any prompt is found on the first two lines,
68 prompts will be stripped from the rest of the block.
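
    Examples
    --------
    A minimal sketch of the intended behaviour: with ``ipython_prompt``
    (defined later in this module), the pasted block::

        In [1]: a = 1
           ...: b = 2

    is stripped to::

        a = 1
        b = 2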
69 """
70 def __init__(self, prompt_re, initial_re=None, *, doctest=False):
71 self.prompt_re = prompt_re
72 self.initial_re = initial_re or prompt_re
73 self.doctest = doctest
74 if doctest:
75 # Doctest/xdoctest prompts may be indented (e.g. " >>>").
76 # We only treat "..." as a continuation prompt when the same pasted
77 # block contains at least one ">>>" line, to avoid ambiguity with the
78 # Python Ellipsis literal.
79 self._doctest_initial_re = re.compile(r'^\s*>>>')
80 self._doctest_ps1_re = re.compile(r'^\s*>>>\s?')
81 self._doctest_ps2_re = re.compile(r'^\s*\.\.\.\s?')
82
83 # Very small state machine to detect triple-quoted strings in the
84 # *same* input block (e.g. user typed """ then pasted doctest).
85 # We preserve literal >>> / ... inside triple-quoted strings.
86 self._triple_quote_re = re.compile(r"(?<!\\)(\"\"\"|''')")
87
88
89 def _triple_quote_mask(self, lines: List[str]) -> List[bool]:
90 """
91 Return a boolean mask: True if the corresponding line is considered
92 inside a triple-quoted string literal.
93
94 This is intentionally heuristic (fast + good enough for paste handling).
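
        For instance (a hedged sketch), for the lines of::

            a = 1
            s = '''
            pasted text that looks like a prompt
            '''
            b = 2

        the expected mask is ``[False, True, True, True, False]``, so prompt
        stripping leaves the string literal untouched.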
95 """
96 mask: List[bool] = []
        in_triple: Optional[str] = None  # either ''' or """
98 for line in lines:
99 mask.append(in_triple is not None)
100 # Toggle state for each occurrence of """ or ''' in the line.
101 for m in self._triple_quote_re.finditer(line):
102 q = m.group(1)
103 if in_triple is None:
104 in_triple = q
105 mask[-1] = True # current line is inside triple quotes
106 elif in_triple == q:
107 in_triple = None
108 # else: ignore mismatched triple quote while inside
109 return mask
110
111
112 def _strip(self, lines):
113 return [self.prompt_re.sub('', l, count=1) for l in lines]
114
115 def __call__(self, lines):
116 if not lines:
117 return lines
118
119 if self.doctest:
120 triple_mask = self._triple_quote_mask(lines)
121
122 # Detect doctest prompts only outside triple-quoted strings.
123 has_doctest_outside = any(
124 (not in_triple) and self._doctest_initial_re.match(l)
125 for l, in_triple in zip(lines, triple_mask)
126 )
127 if not has_doctest_outside:
128 return lines
129
130 out_lines: List[str] = []
131 stripped_mask: List[bool] = []
132
133 for l, in_triple in zip(lines, triple_mask):
134 if in_triple:
135 out_lines.append(l)
136 stripped_mask.append(False)
137 continue
138
139 if self._doctest_ps1_re.match(l):
140 new_l = self._doctest_ps1_re.sub('', l, count=1)
141 elif self._doctest_ps2_re.match(l):
142 new_l = self._doctest_ps2_re.sub('', l, count=1)
143 else:
144 new_l = l
145 out_lines.append(new_l)
146 stripped_mask.append(new_l != l)
147
148 # Dedent only the non-triple-quoted segments where stripping occurred.
149 dedented: List[str] = []
150 i = 0
151 while i < len(out_lines):
152 j = i
153 in_triple = triple_mask[i]
154 while j < len(out_lines) and triple_mask[j] == in_triple:
155 j += 1
156
157 segment = out_lines[i:j]
158 seg_stripped = any(stripped_mask[i:j])
159
160 if (not in_triple) and seg_stripped:
161 dedented.extend(dedent(''.join(segment)).splitlines(keepends=True))
162 else:
163 dedented.extend(segment)
164
165 i = j
166
167 return dedented
168
169 if self.initial_re.match(lines[0]) or \
170 (len(lines) > 1 and self.prompt_re.match(lines[1])):
171 return self._strip(lines)
172 return lines
173
174classic_prompt = PromptStripper(
175 prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
176 initial_re=re.compile(r'^>>>( |$)'),
177 doctest=True,
178)
179
180ipython_prompt = PromptStripper(
181 re.compile(
182 r"""
183 ^( # Match from the beginning of a line, either:
184
185 # 1. First-line prompt:
186 ((\[nav\]|\[ins\])?\ )? # Vi editing mode prompt, if it's there
187 In\ # The 'In' of the prompt, with a space
188 \[\d+\]: # Command index, as displayed in the prompt
189 \ # With a mandatory trailing space
190
191 | # ... or ...
192
193 # 2. The three dots of the multiline prompt
194 \s* # All leading whitespace characters
195 \.{3,}: # The three (or more) dots
196 \ ? # With an optional trailing space
197
198 )
199 """,
200 re.VERBOSE,
201 )
202)
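# A hedged illustration of what ``ipython_prompt`` is expected to strip: the
# pasted block
#
#     In [2]: a = 1
#        ...: b = 2
#
# becomes
#
#     a = 1
#     b = 2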
203
204
205def cell_magic(lines):
206 if not lines or not lines[0].startswith('%%'):
207 return lines
208 if re.match(r'%%\w+\?', lines[0]):
209 # This case will be handled by help_end
210 return lines
211 magic_name, _, first_line = lines[0][2:].rstrip().partition(' ')
212 body = ''.join(lines[1:])
213 return ['get_ipython().run_cell_magic(%r, %r, %r)\n'
214 % (magic_name, first_line, body)]
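# A hedged sketch of the rewrite performed by cell_magic:
#
#     ["%%timeit -n1\n", "pass\n"]
#     -> ["get_ipython().run_cell_magic('timeit', '-n1', 'pass\n')\n"]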
215
216
217def _find_assign_op(token_line) -> Optional[int]:
218 """Get the index of the first assignment in the line ('=' not inside brackets)
219
    Note: we don't try to support multiple special assignments (a = b = %foo)
221 """
222 paren_level = 0
223 for i, ti in enumerate(token_line):
224 s = ti.string
225 if s == '=' and paren_level == 0:
226 return i
227 if s in {'(','[','{'}:
228 paren_level += 1
229 elif s in {')', ']', '}'}:
230 if paren_level > 0:
231 paren_level -= 1
232 return None
233
234def find_end_of_continued_line(lines, start_line: int):
235 """Find the last line of a line explicitly extended using backslashes.
236
237 Uses 0-indexed line numbers.
238 """
239 end_line = start_line
240 while lines[end_line].endswith('\\\n'):
241 end_line += 1
242 if end_line >= len(lines):
243 break
244 return end_line
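# A hedged sketch: for lines ["x = 1 + \\\n", "    2\n", "y = 3\n"],
# find_end_of_continued_line(lines, 0) is expected to return 1, the index of
# the line that ends the backslash-continued statement.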
245
246def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
247 r"""Assemble a single line from multiple continued line pieces
248
249 Continued lines are lines ending in ``\``, and the line following the last
250 ``\`` in the block.
251
252 For example, this code continues over multiple lines::
253
254 if (assign_ix is not None) \
255 and (len(line) >= assign_ix + 2) \
256 and (line[assign_ix+1].string == '%') \
257 and (line[assign_ix+2].type == tokenize.NAME):
258
259 This statement contains four continued line pieces.
260 Assembling these pieces into a single line would give::
261
262 if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...
263
264 This uses 0-indexed line numbers. *start* is (lineno, colno).
265
266 Used to allow ``%magic`` and ``!system`` commands to be continued over
267 multiple lines.
268 """
269 parts = [lines[start[0]][start[1]:]] + lines[start[0]+1:end_line+1]
270 return ' '.join([p.rstrip()[:-1] for p in parts[:-1]] # Strip backslash+newline
271 + [parts[-1].rstrip()]) # Strip newline from last line
272
273class TokenTransformBase:
274 """Base class for transformations which examine tokens.
275
276 Special syntax should not be transformed when it occurs inside strings or
277 comments. This is hard to reliably avoid with regexes. The solution is to
278 tokenise the code as Python, and recognise the special syntax in the tokens.
279
280 IPython's special syntax is not valid Python syntax, so tokenising may go
281 wrong after the special syntax starts. These classes therefore find and
282 transform *one* instance of special syntax at a time into regular Python
283 syntax. After each transformation, tokens are regenerated to find the next
284 piece of special syntax.
285
286 Subclasses need to implement one class method (find)
287 and one regular method (transform).
288
289 The priority attribute can select which transformation to apply if multiple
290 transformers match in the same place. Lower numbers have higher priority.
291 This allows "%magic?" to be turned into a help call rather than a magic call.
292 """
293 # Lower numbers -> higher priority (for matches in the same location)
294 priority = 10
295
296 def sortby(self):
297 return self.start_line, self.start_col, self.priority
298
299 def __init__(self, start):
300 self.start_line = start[0] - 1 # Shift from 1-index to 0-index
301 self.start_col = start[1]
302
303 @classmethod
304 def find(cls, tokens_by_line):
305 """Find one instance of special syntax in the provided tokens.
306
307 Tokens are grouped into logical lines for convenience,
308 so it is easy to e.g. look at the first token of each line.
309 *tokens_by_line* is a list of lists of tokenize.TokenInfo objects.
310
311 This should return an instance of its class, pointing to the start
312 position it has found, or None if it found no match.
313 """
314 raise NotImplementedError
315
316 def transform(self, lines: List[str]):
317 """Transform one instance of special syntax found by ``find()``
318
319 Takes a list of strings representing physical lines,
320 returns a similar list of transformed lines.
321 """
322 raise NotImplementedError
323
324class MagicAssign(TokenTransformBase):
325 """Transformer for assignments from magics (a = %foo)"""
326 @classmethod
327 def find(cls, tokens_by_line):
328 """Find the first magic assignment (a = %foo) in the cell.
329 """
330 for line in tokens_by_line:
331 assign_ix = _find_assign_op(line)
332 if (assign_ix is not None) \
333 and (len(line) >= assign_ix + 2) \
334 and (line[assign_ix+1].string == '%') \
335 and (line[assign_ix+2].type == tokenize.NAME):
336 return cls(line[assign_ix+1].start)
337
338 def transform(self, lines: List[str]):
339 """Transform a magic assignment found by the ``find()`` classmethod.
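
        For example (a sketch of the expected rewrite), ``a = %foo bar``
        becomes::

            a = get_ipython().run_line_magic('foo', 'bar')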
340 """
341 start_line, start_col = self.start_line, self.start_col
342 lhs = lines[start_line][:start_col]
343 end_line = find_end_of_continued_line(lines, start_line)
344 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
345 assert rhs.startswith('%'), rhs
346 magic_name, _, args = rhs[1:].partition(' ')
347
348 lines_before = lines[:start_line]
349 call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
350 new_line = lhs + call + '\n'
351 lines_after = lines[end_line+1:]
352
353 return lines_before + [new_line] + lines_after
354
355
356class SystemAssign(TokenTransformBase):
357 """Transformer for assignments from system commands (a = !foo)"""
358 @classmethod
359 def find_pre_312(cls, tokens_by_line):
360 for line in tokens_by_line:
361 assign_ix = _find_assign_op(line)
362 if (assign_ix is not None) \
363 and not line[assign_ix].line.strip().startswith('=') \
364 and (len(line) >= assign_ix + 2) \
365 and (line[assign_ix + 1].type == tokenize.ERRORTOKEN):
366 ix = assign_ix + 1
367
368 while ix < len(line) and line[ix].type == tokenize.ERRORTOKEN:
369 if line[ix].string == '!':
370 return cls(line[ix].start)
371 elif not line[ix].string.isspace():
372 break
373 ix += 1
374
375 @classmethod
376 def find_post_312(cls, tokens_by_line):
377 for line in tokens_by_line:
378 assign_ix = _find_assign_op(line)
379 if (
380 (assign_ix is not None)
381 and not line[assign_ix].line.strip().startswith("=")
382 and (len(line) >= assign_ix + 2)
383 and (line[assign_ix + 1].type == tokenize.OP)
384 and (line[assign_ix + 1].string == "!")
385 ):
386 return cls(line[assign_ix + 1].start)
387
388 @classmethod
389 def find(cls, tokens_by_line):
390 """Find the first system assignment (a = !foo) in the cell."""
391 if sys.version_info < (3, 12):
392 return cls.find_pre_312(tokens_by_line)
393 return cls.find_post_312(tokens_by_line)
394
395 def transform(self, lines: List[str]):
396 """Transform a system assignment found by the ``find()`` classmethod.
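
        For example (a sketch of the expected rewrite), ``a = !ls`` becomes::

            a = get_ipython().getoutput('ls')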
397 """
398 start_line, start_col = self.start_line, self.start_col
399
400 lhs = lines[start_line][:start_col]
401 end_line = find_end_of_continued_line(lines, start_line)
402 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
403 assert rhs.startswith('!'), rhs
404 cmd = rhs[1:]
405
406 lines_before = lines[:start_line]
407 call = "get_ipython().getoutput({!r})".format(cmd)
408 new_line = lhs + call + '\n'
409 lines_after = lines[end_line + 1:]
410
411 return lines_before + [new_line] + lines_after
412
# The escape sequences that define the syntax transformations IPython will
# apply to user input. These can NOT simply be changed here: many regular
# expressions and other parts of the code hardcode their values, and for all
# intents and purposes they constitute the 'IPython syntax', so they should be
# considered fixed.
418
419ESC_SHELL = '!' # Send line to underlying system shell
420ESC_SH_CAP = '!!' # Send line to system shell and capture output
421ESC_HELP = '?' # Find information about object
422ESC_HELP2 = '??' # Find extra-detailed information about object
423ESC_MAGIC = '%' # Call magic function
424ESC_MAGIC2 = '%%' # Call cell-magic function
425ESC_QUOTE = ',' # Split args on whitespace, quote each as string and call
426ESC_QUOTE2 = ';' # Quote all args as a single string, call
427ESC_PAREN = '/' # Call first argument with rest of line as arguments
428
429ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
430ESCAPE_DOUBLES = {'!!', '??'} # %% (cell magic) is handled separately
431
432def _make_help_call(target, esc):
433 """Prepares a pinfo(2)/psearch call from a target name and the escape
434 (i.e. ? or ??)"""
435 method = 'pinfo2' if esc == '??' \
436 else 'psearch' if '*' in target \
437 else 'pinfo'
438 arg = " ".join([method, target])
    # Prepare arguments for get_ipython().run_line_magic(magic_name, magic_args)
440 t_magic_name, _, t_magic_arg_s = arg.partition(' ')
441 t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
442 return "get_ipython().run_line_magic(%r, %r)" % (t_magic_name, t_magic_arg_s)
443
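# Hedged examples of the calls _make_help_call is expected to build:
#
#     _make_help_call("os.path", "?")    -> "get_ipython().run_line_magic('pinfo', 'os.path')"
#     _make_help_call("os.path", "??")   -> "get_ipython().run_line_magic('pinfo2', 'os.path')"
#     _make_help_call("np.*load*", "?")  -> "get_ipython().run_line_magic('psearch', 'np.*load*')"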
444
445def _tr_help(content):
446 """Translate lines escaped with: ?
447
448 A naked help line should fire the intro help screen (shell.show_usage())
449 """
450 if not content:
451 return 'get_ipython().show_usage()'
452
453 return _make_help_call(content, '?')
454
455def _tr_help2(content):
456 """Translate lines escaped with: ??
457
458 A naked help line should fire the intro help screen (shell.show_usage())
459 """
460 if not content:
461 return 'get_ipython().show_usage()'
462
463 return _make_help_call(content, '??')
464
465def _tr_magic(content):
466 "Translate lines escaped with a percent sign: %"
467 name, _, args = content.partition(' ')
468 return 'get_ipython().run_line_magic(%r, %r)' % (name, args)
469
470def _tr_quote(content):
471 "Translate lines escaped with a comma: ,"
472 name, _, args = content.partition(' ')
473 return '%s("%s")' % (name, '", "'.join(args.split()) )
474
475def _tr_quote2(content):
476 "Translate lines escaped with a semicolon: ;"
477 name, _, args = content.partition(' ')
478 return '%s("%s")' % (name, args)
479
480def _tr_paren(content):
481 "Translate lines escaped with a slash: /"
482 name, _, args = content.partition(" ")
483 if name == "":
        raise SyntaxError(f'"{ESC_PAREN}" must be followed by a callable name')
485
486 return '%s(%s)' % (name, ", ".join(args.split()))
487
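# Hedged sketches of the quote/paren escapes (``my_func`` is purely
# illustrative; EscapedCommand strips the escape character before these
# helpers receive the content):
#
#     ,my_func a b c   ->  my_func("a", "b", "c")
#     ;my_func a b c   ->  my_func("a b c")
#     /my_func a b c   ->  my_func(a, b, c)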
488tr = { ESC_SHELL : 'get_ipython().system({!r})'.format,
489 ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
490 ESC_HELP : _tr_help,
491 ESC_HELP2 : _tr_help2,
492 ESC_MAGIC : _tr_magic,
493 ESC_QUOTE : _tr_quote,
494 ESC_QUOTE2 : _tr_quote2,
495 ESC_PAREN : _tr_paren }
496
497class EscapedCommand(TokenTransformBase):
498 """Transformer for escaped commands like %foo, !foo, or /foo"""
499 @classmethod
500 def find(cls, tokens_by_line):
501 """Find the first escaped command (%foo, !foo, etc.) in the cell.
502 """
503 for line in tokens_by_line:
504 if not line:
505 continue
506 ix = 0
507 ll = len(line)
508 while ll > ix and line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
509 ix += 1
510 if ix >= ll:
511 continue
512 if line[ix].string in ESCAPE_SINGLES:
513 return cls(line[ix].start)
514
515 def transform(self, lines):
516 """Transform an escaped line found by the ``find()`` classmethod.
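
        For example (a hedged sketch)::

            !ls -l   ->  get_ipython().system('ls -l')
            %time x  ->  get_ipython().run_line_magic('time', 'x')
            ??foo    ->  get_ipython().run_line_magic('pinfo2', 'foo')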
517 """
518 start_line, start_col = self.start_line, self.start_col
519
520 indent = lines[start_line][:start_col]
521 end_line = find_end_of_continued_line(lines, start_line)
522 line = assemble_continued_line(lines, (start_line, start_col), end_line)
523
524 if len(line) > 1 and line[:2] in ESCAPE_DOUBLES:
525 escape, content = line[:2], line[2:]
526 else:
527 escape, content = line[:1], line[1:]
528
529 if escape in tr:
530 call = tr[escape](content)
531 else:
532 call = ''
533
534 lines_before = lines[:start_line]
535 new_line = indent + call + '\n'
536 lines_after = lines[end_line + 1:]
537
538 return lines_before + [new_line] + lines_after
539
540
541_help_end_re = re.compile(
542 r"""(%{0,2}
543 (?!\d)[\w*]+ # Variable name
    (\.(?!\d)[\w*]+|\[-?[0-9]+\])*    # Attribute access (.attr) or indexing; only literal integers are supported
545 )
546 (\?\??)$ # ? or ??
547 """,
548 re.VERBOSE,
549)
550
551
552class HelpEnd(TokenTransformBase):
553 """Transformer for help syntax: obj? and obj??"""
554 # This needs to be higher priority (lower number) than EscapedCommand so
555 # that inspecting magics (%foo?) works.
556 priority = 5
557
558 def __init__(self, start, q_locn):
559 super().__init__(start)
560 self.q_line = q_locn[0] - 1 # Shift from 1-indexed to 0-indexed
561 self.q_col = q_locn[1]
562
563 @classmethod
564 def find(cls, tokens_by_line):
565 """Find the first help command (foo?) in the cell.
566 """
567 for line in tokens_by_line:
568 # Last token is NEWLINE; look at last but one
569 if len(line) > 2 and line[-2].string == '?':
570 # Find the first token that's not INDENT/DEDENT
571 ix = 0
572 while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
573 ix += 1
574 return cls(line[ix].start, line[-2].start)
575
576 def transform(self, lines):
577 """Transform a help command found by the ``find()`` classmethod.
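
        For example (a hedged sketch), ``os.path?`` becomes::

            get_ipython().run_line_magic('pinfo', 'os.path')

        and ``%timeit??`` becomes::

            get_ipython().run_line_magic('pinfo2', '%timeit')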
578 """
579
580 piece = "".join(lines[self.start_line : self.q_line + 1])
581 indent, content = piece[: self.start_col], piece[self.start_col :]
582 lines_before = lines[: self.start_line]
583 lines_after = lines[self.q_line + 1 :]
584
585 m = _help_end_re.search(content)
586 if not m:
587 raise SyntaxError(content)
588 assert m is not None, content
589 target = m.group(1)
590 esc = m.group(3)
591
592
593 call = _make_help_call(target, esc)
594 new_line = indent + call + '\n'
595
596 return lines_before + [new_line] + lines_after
597
598def make_tokens_by_line(lines:List[str]):
599 """Tokenize a series of lines and group tokens by line.
600
    The tokens for a multiline Python string or expression are grouped as one
    line. All lines except the last should keep their line ending ('\\n',
    '\\r\\n') for this to work properly. Use ``.splitlines(keepends=True)``,
    for example, when passing a block of text to this function.
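
    For example (a sketch; exact token attributes depend on the Python
    version), the two physical lines of::

        a = (1 +
             2)

    are grouped into one logical line of tokens, with the final ENDMARKER
    token in a trailing group of its own.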
605
606 """
607 # NL tokens are used inside multiline expressions, but also after blank
608 # lines or comments. This is intentional - see https://bugs.python.org/issue17061
609 # We want to group the former case together but split the latter, so we
610 # track parentheses level, similar to the internals of tokenize.
611
612 # reexported from token on 3.7+
613 NEWLINE, NL = tokenize.NEWLINE, tokenize.NL # type: ignore
614 tokens_by_line: List[List[Any]] = [[]]
615 if len(lines) > 1 and not lines[0].endswith(("\n", "\r", "\r\n", "\x0b", "\x0c")):
616 warnings.warn(
617 "`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified",
618 stacklevel=2,
619 )
620 parenlev = 0
621 try:
622 for token in tokenutil.generate_tokens_catch_errors(
623 iter(lines).__next__, extra_errors_to_catch=["expected EOF"]
624 ):
625 tokens_by_line[-1].append(token)
626 if (token.type == NEWLINE) \
627 or ((token.type == NL) and (parenlev <= 0)):
628 tokens_by_line.append([])
629 elif token.string in {'(', '[', '{'}:
630 parenlev += 1
631 elif token.string in {')', ']', '}'}:
632 if parenlev > 0:
633 parenlev -= 1
634 except tokenize.TokenError:
635 # Input ended in a multiline string or expression. That's OK for us.
636 pass
637
638
639 if not tokens_by_line[-1]:
640 tokens_by_line.pop()
641
642
643 return tokens_by_line
644
645
646def has_sunken_brackets(tokens: List[tokenize.TokenInfo]):
647 """Check if the depth of brackets in the list of tokens drops below 0"""
648 parenlev = 0
649 for token in tokens:
650 if token.string in {"(", "[", "{"}:
651 parenlev += 1
652 elif token.string in {")", "]", "}"}:
653 parenlev -= 1
654 if parenlev < 0:
655 return True
656 return False
657
658# Arbitrary limit to prevent getting stuck in infinite loops
659TRANSFORM_LOOP_LIMIT = 500
660
661class TransformerManager:
662 """Applies various transformations to a cell or code block.
663
664 The key methods for external use are ``transform_cell()``
665 and ``check_complete()``.
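
    For example (a hedged sketch of the expected behaviour)::

        mgr = TransformerManager()
        mgr.transform_cell("%time x = 1")
        # expected: "get_ipython().run_line_magic('time', 'x = 1')" plus a newline
        mgr.check_complete("if x:")
        # expected: ('incomplete', 4)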
666 """
667 def __init__(self):
668 self.cleanup_transforms = [
669 leading_empty_lines,
670 leading_indent,
671 classic_prompt,
672 ipython_prompt,
673 ]
674 self.line_transforms = [
675 cell_magic,
676 ]
677 self.token_transformers = [
678 MagicAssign,
679 SystemAssign,
680 EscapedCommand,
681 HelpEnd,
682 ]
683
684 def do_one_token_transform(self, lines):
685 """Find and run the transform earliest in the code.
686
687 Returns (changed, lines).
688
689 This method is called repeatedly until changed is False, indicating
690 that all available transformations are complete.
691
692 The tokens following IPython special syntax might not be valid, so
693 the transformed code is retokenised every time to identify the next
694 piece of special syntax. Hopefully long code cells are mostly valid
695 Python, not using lots of IPython special syntax, so this shouldn't be
696 a performance issue.
697 """
698 tokens_by_line = make_tokens_by_line(lines)
699 candidates = []
700 for transformer_cls in self.token_transformers:
701 transformer = transformer_cls.find(tokens_by_line)
702 if transformer:
703 candidates.append(transformer)
704
705 if not candidates:
706 # Nothing to transform
707 return False, lines
708 ordered_transformers = sorted(candidates, key=TokenTransformBase.sortby)
709 for transformer in ordered_transformers:
710 try:
711 return True, transformer.transform(lines)
712 except SyntaxError:
713 pass
714 return False, lines
715
716 def do_token_transforms(self, lines):
717 for _ in range(TRANSFORM_LOOP_LIMIT):
718 changed, lines = self.do_one_token_transform(lines)
719 if not changed:
720 return lines
721
722 raise RuntimeError("Input transformation still changing after "
723 "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)
724
725 def transform_cell(self, cell: str) -> str:
726 """Transforms a cell of input code"""
727 if not cell.endswith('\n'):
728 cell += '\n' # Ensure the cell has a trailing newline
729 lines = cell.splitlines(keepends=True)
730 for transform in self.cleanup_transforms + self.line_transforms:
731 lines = transform(lines)
732
733 lines = self.do_token_transforms(lines)
734 return ''.join(lines)
735
736 def check_complete(self, cell: str):
737 """Return whether a block of code is ready to execute, or should be continued
738
739 Parameters
740 ----------
741 cell : string
742 Python input code, which can be multiline.
743
744 Returns
745 -------
746 status : str
            One of 'complete', 'incomplete', or 'invalid'. 'invalid' means the
            source is not a prefix of valid code.
749 indent_spaces : int or None
750 The number of spaces by which to indent the next line of code. If
751 status is not 'incomplete', this is None.
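
        Examples
        --------
        A hedged sketch::

            check_complete("a = 1")      # expected: ('complete', None)
            check_complete("def f(x):")  # expected: ('incomplete', 4)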
752 """
        # Remember whether the cell ends in a newline.
754 ends_with_newline = False
755 for character in reversed(cell):
756 if character == '\n':
757 ends_with_newline = True
758 break
759 elif character.strip():
760 break
761 else:
762 continue
763
764 if not ends_with_newline:
            # Append a newline for consistent tokenization
766 # See https://bugs.python.org/issue33899
767 cell += '\n'
768
769 lines = cell.splitlines(keepends=True)
770
771 if not lines:
772 return 'complete', None
773
774 for line in reversed(lines):
775 if not line.strip():
776 continue
777 elif line.strip("\n").endswith("\\"):
778 return "incomplete", find_last_indent(lines)
779 else:
780 break
781
782 try:
783 for transform in self.cleanup_transforms:
784 if not getattr(transform, 'has_side_effects', False):
785 lines = transform(lines)
786 except SyntaxError:
787 return 'invalid', None
788
789 if lines[0].startswith('%%'):
790 # Special case for cell magics - completion marked by blank line
791 if lines[-1].strip():
792 return 'incomplete', find_last_indent(lines)
793 else:
794 return 'complete', None
795
796 try:
797 for transform in self.line_transforms:
798 if not getattr(transform, 'has_side_effects', False):
799 lines = transform(lines)
800 lines = self.do_token_transforms(lines)
801 except SyntaxError:
802 return 'invalid', None
803
804 tokens_by_line = make_tokens_by_line(lines)
805
        # Bail if we got a single line and there are more closing brackets than
        # opening ones
808 if (
809 len(lines) == 1
810 and tokens_by_line
811 and has_sunken_brackets(tokens_by_line[0])
812 ):
813 return "invalid", None
814
815 if not tokens_by_line:
816 return 'incomplete', find_last_indent(lines)
817
818 if (
819 tokens_by_line[-1][-1].type != tokenize.ENDMARKER
820 and tokens_by_line[-1][-1].type != tokenize.ERRORTOKEN
821 ):
822 # We're in a multiline string or expression
823 return 'incomplete', find_last_indent(lines)
824
825 newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER} # type: ignore
826
827 # Pop the last line which only contains DEDENTs and ENDMARKER
828 last_token_line = None
829 if {t.type for t in tokens_by_line[-1]} in [
830 {tokenize.DEDENT, tokenize.ENDMARKER},
831 {tokenize.ENDMARKER}
832 ] and len(tokens_by_line) > 1:
833 last_token_line = tokens_by_line.pop()
834
835 while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
836 tokens_by_line[-1].pop()
837
838 if not tokens_by_line[-1]:
839 return 'incomplete', find_last_indent(lines)
840
841 if tokens_by_line[-1][-1].string == ':':
842 # The last line starts a block (e.g. 'if foo:')
843 ix = 0
844 while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
845 ix += 1
846
847 indent = tokens_by_line[-1][ix].start[1]
848 return 'incomplete', indent + 4
849
850 if tokens_by_line[-1][0].line.endswith('\\'):
851 return 'incomplete', None
852
853 # At this point, our checks think the code is complete (or invalid).
854 # We'll use codeop.compile_command to check this with the real parser
855 try:
856 with warnings.catch_warnings():
857 warnings.simplefilter('error', SyntaxWarning)
858 res = compile_command(''.join(lines), symbol='exec')
859 except (SyntaxError, OverflowError, ValueError, TypeError,
860 MemoryError, SyntaxWarning):
861 return 'invalid', None
862 else:
863 if res is None:
864 return 'incomplete', find_last_indent(lines)
865
866 if last_token_line and last_token_line[0].type == tokenize.DEDENT:
867 if ends_with_newline:
868 return 'complete', None
869 return 'incomplete', find_last_indent(lines)
870
871 # If there's a blank line at the end, assume we're ready to execute
872 if not lines[-1].strip():
873 return 'complete', None
874
875 return 'complete', None
876
877
878def find_last_indent(lines):
879 m = _indent_re.match(lines[-1])
880 if not m:
881 return 0
882 return len(m.group(0).replace('\t', ' '*4))
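# Hedged example: find_last_indent(["if x:", "    pass"]) is expected to
# return 4; tabs in the final line count as four spaces each.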
883
884
885class MaybeAsyncCompile(Compile):
886 def __init__(self, extra_flags=0):
887 super().__init__()
888 self.flags |= extra_flags
889
890
891class MaybeAsyncCommandCompiler(CommandCompiler):
892 def __init__(self, extra_flags=0):
893 self.compiler = MaybeAsyncCompile(extra_flags=extra_flags)
894
895
896_extra_flags = ast.PyCF_ALLOW_TOP_LEVEL_AWAIT
897
898compile_command = MaybeAsyncCommandCompiler(extra_flags=_extra_flags)