1"""Module containing our file processor that tokenizes a file for checks."""
2from __future__ import annotations
3
4import argparse
5import ast
6import logging
7import tokenize
8from typing import Any
9from typing import Generator
10from typing import List
11from typing import Tuple
12
13from flake8 import defaults
14from flake8 import utils
15from flake8._compat import FSTRING_END
16from flake8._compat import FSTRING_MIDDLE
17from flake8.plugins.finder import LoadedPlugin
18
19LOG = logging.getLogger(__name__)
20NEWLINE = frozenset([tokenize.NL, tokenize.NEWLINE])
21
22SKIP_TOKENS = frozenset(
23 [tokenize.NL, tokenize.NEWLINE, tokenize.INDENT, tokenize.DEDENT]
24)
25
26_LogicalMapping = List[Tuple[int, Tuple[int, int]]]
27_Logical = Tuple[List[str], List[str], _LogicalMapping]
28
29
class FileProcessor:
    """Processes a file and holds state.

    This processes a file by generating tokens, logical and physical lines,
    and AST trees. This also provides a way of passing state about the file
    to checks expecting that state. Any public attribute on this object can
    be requested by a plugin. The known public attributes are:

    - :attr:`blank_before`
    - :attr:`blank_lines`
    - :attr:`checker_state`
    - :attr:`indent_char`
    - :attr:`indent_level`
    - :attr:`line_number`
    - :attr:`logical_line`
    - :attr:`max_line_length`
    - :attr:`max_doc_length`
    - :attr:`multiline`
    - :attr:`noqa`
    - :attr:`previous_indent_level`
    - :attr:`previous_logical`
    - :attr:`previous_unindented_logical_line`
    - :attr:`tokens`
    - :attr:`file_tokens`
    - :attr:`total_lines`
    - :attr:`verbose`
    """

    #: always ``False``, included for compatibility
    noqa = False
    def __init__(
        self,
        filename: str,
        options: argparse.Namespace,
        lines: list[str] | None = None,
    ) -> None:
        """Initialize our file processor.

        :param filename: Name of the file to process
        """
        self.options = options
        self.filename = filename
        self.lines = lines if lines is not None else self.read_lines()
        self.strip_utf_bom()

        # Defaults for public attributes
        #: Number of preceding blank lines
        self.blank_before = 0
        #: Number of blank lines
        self.blank_lines = 0
        #: Checker states for each plugin?
        self._checker_states: dict[str, dict[Any, Any]] = {}
        #: Current checker state
        self.checker_state: dict[Any, Any] = {}
        #: User provided option for hang closing
        self.hang_closing = options.hang_closing
        #: Character used for indentation
        self.indent_char: str | None = None
        #: Current level of indentation
        self.indent_level = 0
        #: Number of spaces used for indentation
        self.indent_size = options.indent_size
        #: Line number in the file
        self.line_number = 0
        #: Current logical line
        self.logical_line = ""
        #: Maximum line length as configured by the user
        self.max_line_length = options.max_line_length
        #: Maximum docstring / comment line length as configured by the user
        self.max_doc_length = options.max_doc_length
        #: Whether the current physical line is multiline
        self.multiline = False
        #: Previous level of indentation
        self.previous_indent_level = 0
        #: Previous logical line
        self.previous_logical = ""
        #: Previous unindented (i.e. top-level) logical line
        self.previous_unindented_logical_line = ""
        #: Current set of tokens
        self.tokens: list[tokenize.TokenInfo] = []
        #: Total number of lines in the file
        self.total_lines = len(self.lines)
        #: Verbosity level of Flake8
        self.verbose = options.verbose
        #: Statistics dictionary
        self.statistics = {"logical lines": 0}
        self._file_tokens: list[tokenize.TokenInfo] | None = None
        # map from line number to the line we'll search for `noqa` in
        self._noqa_line_mapping: dict[int, str] | None = None
        self._fstring_start = -1
    @property
    def file_tokens(self) -> list[tokenize.TokenInfo]:
        """Return the complete set of tokens for a file."""
        if self._file_tokens is None:
            line_iter = iter(self.lines)
            self._file_tokens = list(
                tokenize.generate_tokens(lambda: next(line_iter))
            )

        return self._file_tokens

    def fstring_start(self, lineno: int) -> None:
        """Signal the beginning of an fstring."""
        self._fstring_start = lineno

    def multiline_string(
        self, token: tokenize.TokenInfo
    ) -> Generator[str, None, None]:
        """Iterate through the lines of a multiline string."""
        if token.type == FSTRING_END:
            start = self._fstring_start
        else:
            start = token.start[0]

        self.multiline = True
        self.line_number = start
        # intentionally don't include the last line, that line will be
        # terminated later by a future end-of-line
        for _ in range(start, token.end[0]):
            yield self.lines[self.line_number - 1]
            self.line_number += 1
        self.multiline = False
    def reset_blank_before(self) -> None:
        """Reset the blank_before attribute to zero."""
        self.blank_before = 0

    def delete_first_token(self) -> None:
        """Delete the first token in the list of tokens."""
        del self.tokens[0]

    def visited_new_blank_line(self) -> None:
        """Note that we visited a new blank line."""
        self.blank_lines += 1

    def update_state(self, mapping: _LogicalMapping) -> None:
        """Update the indent level based on the logical line mapping."""
        (start_row, start_col) = mapping[0][1]
        start_line = self.lines[start_row - 1]
        self.indent_level = expand_indent(start_line[:start_col])
        if self.blank_before < self.blank_lines:
            self.blank_before = self.blank_lines

    def update_checker_state_for(self, plugin: LoadedPlugin) -> None:
        """Update the checker_state attribute for the plugin."""
        if "checker_state" in plugin.parameters:
            self.checker_state = self._checker_states.setdefault(
                plugin.entry_name, {}
            )

    def next_logical_line(self) -> None:
        """Record the previous logical line.

        This also resets the tokens list and the blank_lines count.
        """
        if self.logical_line:
            self.previous_indent_level = self.indent_level
            self.previous_logical = self.logical_line
            if not self.indent_level:
                self.previous_unindented_logical_line = self.logical_line
        self.blank_lines = 0
        self.tokens = []

    def build_logical_line_tokens(self) -> _Logical:  # noqa: C901
        """Build the mapping, comments, and logical line lists."""
        logical = []
        comments = []
        mapping: _LogicalMapping = []
        length = 0
        previous_row = previous_column = None
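        # ``mapping`` pairs an offset into the logical line with the (row,
        # column) position in the physical file, so errors found on the
        # logical line can be reported at the correct physical location.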
        for token_type, text, start, end, line in self.tokens:
            if token_type in SKIP_TOKENS:
                continue
            if not mapping:
                mapping = [(0, start)]
            if token_type == tokenize.COMMENT:
                comments.append(text)
                continue
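            # String contents are masked (see ``mutate_string``) so code-like
            # text inside literals is not mistaken for syntax by checks that
            # scan the logical line.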
            if token_type == tokenize.STRING:
                text = mutate_string(text)
            elif token_type == FSTRING_MIDDLE:
                text = "x" * len(text)
            if previous_row:
                (start_row, start_column) = start
                if previous_row != start_row:
                    row_index = previous_row - 1
                    column_index = previous_column - 1
                    previous_text = self.lines[row_index][column_index]
                    if previous_text == "," or (
                        previous_text not in "{[(" and text not in "}])"
                    ):
                        text = f" {text}"
                elif previous_column != start_column:
                    text = line[previous_column:start_column] + text
            logical.append(text)
            length += len(text)
            mapping.append((length, end))
            (previous_row, previous_column) = end
        return comments, logical, mapping
    def build_ast(self) -> ast.AST:
        """Build an abstract syntax tree from the list of lines."""
        return ast.parse("".join(self.lines))

    def build_logical_line(self) -> tuple[str, str, _LogicalMapping]:
        """Build a logical line from the current tokens list."""
        comments, logical, mapping_list = self.build_logical_line_tokens()
        joined_comments = "".join(comments)
        self.logical_line = "".join(logical)
        self.statistics["logical lines"] += 1
        return joined_comments, self.logical_line, mapping_list

    def keyword_arguments_for(
        self,
        parameters: dict[str, bool],
        arguments: dict[str, Any],
    ) -> dict[str, Any]:
        """Generate the keyword arguments for a list of parameters."""
        ret = {}
        for param, required in parameters.items():
            if param in arguments:
                continue
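            # Each remaining parameter name is looked up as an attribute on
            # this processor; a missing required parameter re-raises, while a
            # missing optional one is only logged.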
            try:
                ret[param] = getattr(self, param)
            except AttributeError:
                if required:
                    raise
                else:
                    LOG.warning(
                        'Plugin requested optional parameter "%s" '
                        "but this is not an available parameter.",
                        param,
                    )
        return ret

    def generate_tokens(self) -> Generator[tokenize.TokenInfo, None, None]:
        """Tokenize the file and yield the tokens."""
        for token in tokenize.generate_tokens(self.next_line):
            if token[2][0] > self.total_lines:
                break
            self.tokens.append(token)
            yield token

    def _noqa_line_range(self, min_line: int, max_line: int) -> dict[int, str]:
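        # Map every physical line of a multi-line construct to the joined
        # text of those lines, so a ``noqa`` comment anywhere in the
        # construct applies to the whole range.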
        line_range = range(min_line, max_line + 1)
        joined = "".join(self.lines[min_line - 1 : max_line])
        return dict.fromkeys(line_range, joined)

    def noqa_line_for(self, line_number: int) -> str | None:
        """Retrieve the line which will be used to determine noqa."""
        if self._noqa_line_mapping is None:
            try:
                file_tokens = self.file_tokens
            except (tokenize.TokenError, SyntaxError):
                # if we failed to parse the file tokens, we'll always fail in
                # the future, so set this so the code does not try again
                self._noqa_line_mapping = {}
            else:
                ret = {}

                min_line = len(self.lines) + 2
                max_line = -1
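                # Walk the tokens, grouping physical lines between NEWLINE/NL
                # boundaries; every line in the accumulated [min_line,
                # max_line] span is mapped to the same joined text for later
                # ``noqa`` lookups.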
                for tp, _, (s_line, _), (e_line, _), _ in file_tokens:
                    if tp == tokenize.ENDMARKER:
                        break

                    min_line = min(min_line, s_line)
                    max_line = max(max_line, e_line)

                    if tp in (tokenize.NL, tokenize.NEWLINE):
                        ret.update(self._noqa_line_range(min_line, max_line))

                        min_line = len(self.lines) + 2
                        max_line = -1

                # in newer versions of python, a `NEWLINE` token is inserted
                # at the end of the file even if it doesn't have one.
                # on old pythons, they will not have hit a `NEWLINE`
                if max_line != -1:
                    ret.update(self._noqa_line_range(min_line, max_line))

                self._noqa_line_mapping = ret

        # NOTE(sigmavirus24): Some plugins choose to report errors for empty
        # files on Line 1. In those cases, we shouldn't bother trying to
        # retrieve a physical line (since none exist).
        return self._noqa_line_mapping.get(line_number)

    def next_line(self) -> str:
        """Get the next line from the list."""
        if self.line_number >= self.total_lines:
            return ""
        line = self.lines[self.line_number]
        self.line_number += 1
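        # Remember the first indentation character seen in the file; checks
        # (e.g. pycodestyle's tab/space consistency checks) compare later
        # lines against it.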
        if self.indent_char is None and line[:1] in defaults.WHITESPACE:
            self.indent_char = line[0]
        return line

    def read_lines(self) -> list[str]:
        """Read the lines for this file checker."""
        if self.filename == "-":
            self.filename = self.options.stdin_display_name or "stdin"
            lines = self.read_lines_from_stdin()
        else:
            lines = self.read_lines_from_filename()
        return lines

    def read_lines_from_filename(self) -> list[str]:
        """Read the lines for a file."""
        try:
            with tokenize.open(self.filename) as fd:
                return fd.readlines()
        except (SyntaxError, UnicodeError):
            # If we can't detect the codec with tokenize.detect_encoding, or
            # the detected encoding is incorrect, just fallback to latin-1.
            with open(self.filename, encoding="latin-1") as fd:
                return fd.readlines()

    def read_lines_from_stdin(self) -> list[str]:
        """Read the lines from standard in."""
        return utils.stdin_get_lines()

    def should_ignore_file(self) -> bool:
        """Check if ``flake8: noqa`` is in the file to be ignored.

        :returns:
            True if a line matches :attr:`defaults.NOQA_FILE`,
            otherwise False
        """
        if not self.options.disable_noqa and any(
            defaults.NOQA_FILE.match(line) for line in self.lines
        ):
            return True
        elif any(defaults.NOQA_FILE.search(line) for line in self.lines):
            LOG.warning(
                "Detected `flake8: noqa` on line with code. To ignore an "
                "error on a line use `noqa` instead."
            )
            return False
        else:
            return False

    def strip_utf_bom(self) -> None:
        """Strip the UTF bom from the lines of the file."""
        if not self.lines:
            # If we have nothing to analyze quit early
            return

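        # 0xFEFF is the BOM decoded into a single character (e.g. a UTF-8
        # read that kept the BOM), while a leading 0xEF byte indicates the
        # raw UTF-8 BOM bytes survived the latin-1 fallback and span three
        # characters.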
        first_byte = ord(self.lines[0][0])
        if first_byte not in (0xEF, 0xFEFF):
            return

        # If the first byte of the file is a UTF-8 BOM, strip it
        if first_byte == 0xFEFF:
            self.lines[0] = self.lines[0][1:]
        elif self.lines[0][:3] == "\xEF\xBB\xBF":
            self.lines[0] = self.lines[0][3:]


def is_eol_token(token: tokenize.TokenInfo) -> bool:
    """Check if the token is an end-of-line token."""
    return token[0] in NEWLINE or token[4][token[3][1] :].lstrip() == "\\\n"


def is_multiline_string(token: tokenize.TokenInfo) -> bool:
    """Check if this is a multiline string."""
    return token.type == FSTRING_END or (
        token.type == tokenize.STRING and "\n" in token.string
    )


def token_is_newline(token: tokenize.TokenInfo) -> bool:
    """Check if the token type is a newline token type."""
    return token[0] in NEWLINE


def count_parentheses(current_parentheses_count: int, token_text: str) -> int:
    """Count the number of parentheses."""
    if token_text in "([{":  # nosec
        return current_parentheses_count + 1
    elif token_text in "}])":  # nosec
        return current_parentheses_count - 1
    return current_parentheses_count

def expand_indent(line: str) -> int:
    r"""Return the amount of indentation.

    Tabs are expanded to the next multiple of 8.

    >>> expand_indent('    ')
    4
    >>> expand_indent('\t')
    8
    >>> expand_indent('    \t')
    8
    >>> expand_indent('        \t')
    16
    """
    return len(line.expandtabs(8))

# NOTE(sigmavirus24): This was taken wholesale from
# https://github.com/PyCQA/pycodestyle. The in-line comments were edited to be
# more descriptive.
def mutate_string(text: str) -> str:
    """Replace contents with 'xxx' to prevent syntax matching.

    >>> mutate_string('"abc"')
    '"xxx"'
    >>> mutate_string("'''abc'''")
    "'''xxx'''"
    >>> mutate_string("r'abc'")
    "r'xxx'"
    """
    # NOTE(sigmavirus24): If there are string modifiers (e.g., b, u, r)
    # use the last "character" to determine if we're using single or double
    # quotes and then find the first instance of it
    start = text.index(text[-1]) + 1
    end = len(text) - 1
    # Check for triple-quoted strings
    if text[-3:] in ('"""', "'''"):
        start += 2
        end -= 2
    return text[:start] + "x" * (end - start) + text[end:]