harvesting_the_net/pics/lib/python3.10/site-packages/parso/python/prefix.py

import re
from codecs import BOM_UTF8
from typing import Tuple

from parso.python.tokenize import group

# The UTF-8 byte order mark as a ``str`` (the ``BOM_UTF8`` bytes constant
# decoded as UTF-8), so it can be compared against text.
unicode_bom = BOM_UTF8.decode('utf-8')


class PrefixPart:
    """One piece of a leaf's prefix together with its position.

    Attributes set by the constructor:
        parent:    the leaf this part belongs to.
        type:      name of the kind of part (a plain string).
        value:     the text of the part itself.
        spacing:   whitespace that directly precedes ``value``.
        start_pos: ``(line, column)`` at which ``value`` starts.
    """

    def __init__(self, leaf, typ, value, spacing='', start_pos=None):
        # ``start_pos`` only has a default so that it can follow ``spacing``
        # in the signature; it is effectively mandatory.
        assert start_pos is not None
        self.parent = leaf
        self.type = typ
        self.value = value
        self.spacing = spacing
        self.start_pos: Tuple[int, int] = start_pos

    @property
    def end_pos(self) -> Tuple[int, int]:
        """Return the ``(line, column)`` position right after this part."""
        # A value that ends in a line break finishes at column 0 of the
        # following line.
        if self.value.endswith(('\n', '\r')):
            return self.start_pos[0] + 1, 0
        # The bom doesn't have a length at the start of a Python file, so
        # it ends where it starts.
        if self.value == unicode_bom:
            return self.start_pos
        line, column = self.start_pos[0], self.start_pos[1]
        return line, column + len(self.value)

    def create_spacing_part(self):
        """Return a new ``'spacing'`` part for the whitespace before this one.

        The new part shares this part's parent and line; its column is this
        part's column moved left by the length of ``self.spacing``.
        """
        position = (self.start_pos[0], self.start_pos[1] - len(self.spacing))
        return PrefixPart(
            self.parent, 'spacing', self.spacing, start_pos=position
        )

    def __repr__(self):
        fields = (
            self.__class__.__name__,
            self.type,
            repr(self.value),
            self.start_pos,
        )
        return '%s(%s, %s, %s)' % fields

    def search_ancestor(self, *node_types):
        """Return the closest ancestor whose ``type`` is in ``node_types``.

        The walk starts at ``self.parent`` and follows ``.parent`` links.
        ``None`` is returned when the chain ends without a match.
        """
        candidate = self.parent
        while candidate is not None and candidate.type not in node_types:
            candidate = candidate.parent
        return candidate


# Pieces of the prefix regex.  ``_spacing`` is matched first; the remaining
# patterns are the alternatives for what may follow that spacing.
_spacing = r'[ \t]*'
# A '#' and everything after it up to (not including) \n, \r or \f.
_comment = r'#[^\n\r\f]*'
# A backslash immediately followed by a line break (\r\n, \n or \r).
_backslash = r'\\\r?\n|\\\r'
# A line break on its own: \r\n, \n or \r.
_newline = r'\r?\n|\r'
_form_feed = r'\f'
# Zero-width end-of-string match; produces an empty value when nothing but
# spacing is left.
_only_spacing = '$'
_bom = unicode_bom

# split_prefix reads group 1 of a match as the spacing and group 2 as the
# value that follows it.
_regex = re.compile(
    group(_spacing, capture=True)
    + group(
        _comment, _backslash, _newline, _form_feed, _only_spacing, _bom,
        capture=True
    )
)


# Maps the first character of a matched value to the name of its part type.
_types = {
    '#': 'comment',
    '\\': 'backslash',
    '\f': 'formfeed',
    '\n': 'newline',
    '\r': 'newline',
    unicode_bom: 'bom',
}


def split_prefix(leaf, start_pos):
    """Yield the ``PrefixPart`` objects that make up ``leaf.prefix``.

    ``start_pos`` is the ``(line, column)`` at which the prefix begins.
    Every non-empty match of ``_regex`` becomes one part whose type is looked
    up in ``_types`` by the first character of the matched value.  A final
    ``'spacing'`` part is always yielded last; it carries the trailing
    whitespace, or an empty string when the prefix ended with a real part.
    """
    row, col_base = start_pos
    offset = 0                # index into leaf.prefix of the next match
    token = indent = ''
    bom_shift = 0             # becomes 1 once a bom part has been yielded

    while offset != len(leaf.prefix):
        found = _regex.match(leaf.prefix, offset)
        indent, token = found.group(1, 2)
        if not token:
            # Only spacing is left; it is emitted by the final yield below.
            break

        kind = _types[token[0]]
        yield PrefixPart(
            leaf, kind, token, indent,
            start_pos=(row, col_base + offset - bom_shift + len(indent))
        )
        if kind == 'bom':
            # The bom takes up one character of the prefix but no column.
            bom_shift = 1

        offset = found.end(0)
        if token.endswith(('\n', '\r')):
            # After a line break, columns restart at 0: col_base + offset
            # is 0 right at the new line's first character.
            row += 1
            col_base = -offset

    # If the last thing seen was a real part there is no trailing spacing.
    yield PrefixPart(
        leaf, 'spacing', '' if token else indent,
        start_pos=(row, col_base + offset)
    )
end 2 years ago			`import re`
			`from codecs import BOM_UTF8`
			`from typing import Tuple`

			`from parso.python.tokenize import group`

			`unicode_bom = BOM_UTF8.decode('utf-8')`


			`class PrefixPart:`
			`def __init__(self, leaf, typ, value, spacing='', start_pos=None):`
			`assert start_pos is not None`
			`self.parent = leaf`
			`self.type = typ`
			`self.value = value`
			`self.spacing = spacing`
			`self.start_pos: Tuple[int, int] = start_pos`

			`@property`
			`def end_pos(self) -> Tuple[int, int]:`
			`if self.value.endswith('\n') or self.value.endswith('\r'):`
			`return self.start_pos[0] + 1, 0`
			`if self.value == unicode_bom:`
			`# The bom doesn't have a length at the start of a Python file.`
			`return self.start_pos`
			`return self.start_pos[0], self.start_pos[1] + len(self.value)`

			`def create_spacing_part(self):`
			`column = self.start_pos[1] - len(self.spacing)`
			`return PrefixPart(`
			`self.parent, 'spacing', self.spacing,`
			`start_pos=(self.start_pos[0], column)`
			`)`

			`def __repr__(self):`
			`return '%s(%s, %s, %s)' % (`
			`self.__class__.__name__,`
			`self.type,`
			`repr(self.value),`
			`self.start_pos`
			`)`

			`def search_ancestor(self, *node_types):`
			`node = self.parent`
			`while node is not None:`
			`if node.type in node_types:`
			`return node`
			`node = node.parent`
			`return None`


			`_comment = r'#[^\n\r\f]*'`
			`_backslash = r'\\\r?\n\|\\\r'`
			`_newline = r'\r?\n\|\r'`
			`_form_feed = r'\f'`
			`_only_spacing = '$'`
			`_spacing = r'[ \t]*'`
			`_bom = unicode_bom`

			`_regex = group(`
			`_comment, _backslash, _newline, _form_feed, _only_spacing, _bom,`
			`capture=True`
			`)`
			`_regex = re.compile(group(_spacing, capture=True) + _regex)`


			`_types = {`
			`'#': 'comment',`
			`'\\': 'backslash',`
			`'\f': 'formfeed',`
			`'\n': 'newline',`
			`'\r': 'newline',`
			`unicode_bom: 'bom'`
			`}`


			`def split_prefix(leaf, start_pos):`
			`line, column = start_pos`
			`start = 0`
			`value = spacing = ''`
			`bom = False`
			`while start != len(leaf.prefix):`
			`match = _regex.match(leaf.prefix, start)`
			`spacing = match.group(1)`
			`value = match.group(2)`
			`if not value:`
			`break`
			`type_ = _types[value[0]]`
			`yield PrefixPart(`
			`leaf, type_, value, spacing,`
			`start_pos=(line, column + start - int(bom) + len(spacing))`
			`)`
			`if type_ == 'bom':`
			`bom = True`

			`start = match.end(0)`
			`if value.endswith('\n') or value.endswith('\r'):`
			`line += 1`
			`column = -start`

			`if value:`
			`spacing = ''`
			`yield PrefixPart(`
			`leaf, 'spacing', spacing,`
			`start_pos=(line, column + start)`
			`)`