[config.git] / djavu-asus / elpy / rpc-venv / lib / python3.11 / site-packages / parso / grammar.py

import hashlib
import os
from typing import Generic, TypeVar, Union, Dict, Optional, Any
from pathlib import Path

from parso._compatibility import is_pypy
from parso.pgen2 import generate_grammar
from parso.utils import split_lines, python_bytes_to_unicode, \
    PythonVersionInfo, parse_version_string
from parso.python.diff import DiffParser
from parso.python.tokenize import tokenize_lines, tokenize
from parso.python.token import PythonTokenTypes
from parso.cache import parser_cache, load_module, try_to_save_module
from parso.parser import BaseParser
from parso.python.parser import Parser as PythonParser
from parso.python.errors import ErrorFinderConfig
from parso.python import pep8
from parso.file_io import FileIO, KnownContentFileIO
from parso.normalizer import RefactoringNormalizer, NormalizerConfig

_loaded_grammars: Dict[str, 'Grammar'] = {}

_NodeT = TypeVar("_NodeT")


class Grammar(Generic[_NodeT]):
    """
    :py:func:`parso.load_grammar` returns instances of this class.

    Creating custom non-Python grammars by calling this is not supported, yet.

    :param text: A BNF representation of your grammar.
    :param tokenizer: Callable that receives the list of source lines and
        returns the tokens that are handed to the parser.
    :param parser: Parser class. It is instantiated with the generated
        grammar plus ``error_recovery`` and ``start_nonterminal``.
    :param diff_parser: Optional diff parser class. Required if
        :py:meth:`parse` is called with ``diff_cache=True``.
    """
    # Nonterminal that ``parse`` starts from when no ``start_symbol`` is given.
    # Only declared here; subclasses have to assign it.
    _start_nonterminal: str
    # Normalizer config used by ``iter_errors``; ``None`` disables it.
    _error_normalizer_config: Optional[ErrorFinderConfig] = None
    # Passed to ``generate_grammar``; must be set before ``__init__`` runs.
    _token_namespace: Any = None
    # Fallback for ``_normalize``/``_get_normalizer_issues`` without a config.
    _default_normalizer_config: NormalizerConfig = pep8.PEP8NormalizerConfig()

    def __init__(self, text: str, *, tokenizer, parser=BaseParser, diff_parser=None):
        self._pgen_grammar = generate_grammar(
            text,
            token_namespace=self._get_token_namespace()
        )
        self._parser = parser
        self._tokenizer = tokenizer
        self._diff_parser = diff_parser
        # Hash of the grammar text; used as the first-level key of the
        # parser cache so trees of different grammars are kept apart.
        self._hashed = hashlib.sha256(text.encode("utf-8")).hexdigest()

    def parse(self,
              code: Optional[Union[str, bytes]] = None,
              *,
              error_recovery=True,
              path: Optional[Union[os.PathLike, str]] = None,
              start_symbol: Optional[str] = None,
              cache=False,
              diff_cache=False,
              cache_path: Optional[Union[os.PathLike, str]] = None,
              file_io: Optional[FileIO] = None) -> _NodeT:
        """
        If you want to parse a Python file you want to start here, most likely.

        If you need finer grained control over the parsed instance, there will be
        other ways to access it.

        :param str code: A unicode or bytes string. When it's not possible to
            decode bytes to a string, a :py:class:`UnicodeDecodeError` is
            raised.
        :param bool error_recovery: If enabled, any code will be returned. If
            it is invalid, it will be returned as an error node. If disabled,
            you will get a ParseError when encountering syntax errors in your
            code.
        :param str start_symbol: The grammar rule (nonterminal) that you want
            to parse. Only allowed to be used when error_recovery is False.
        :param str path: The path to the file you want to open. Only needed for caching.
        :param bool cache: Keeps a copy of the parser tree in RAM and on disk
            if a path is given. Returns the cached trees if the corresponding
            files on disk have not changed. Note that this stores pickle files
            on your file system (e.g. for Linux in ``~/.cache/parso/``).
        :param bool diff_cache: Diffs the cached python module against the new
            code and tries to parse only the parts that have changed. Returns
            the same (changed) module that is found in cache. Using this option
            requires you to not do anything anymore with the cached modules
            under that path, because the contents of it might change. This
            option is still somewhat experimental. If you want stability,
            please don't use it.
        :param cache_path: A ``str`` or path-like object. If given saves the
            parso cache in this directory. If not given, defaults to the
            default cache places on each platform.
        :param file_io: Used instead of building one from ``code``/``path``.
            Its ``path`` is the cache key and its ``read()`` supplies the
            source when ``code`` is not given.

        :raises TypeError: If none of ``code``, ``path`` and ``file_io`` is
            given, or if ``diff_cache`` is requested without a diff parser.
        :raises NotImplementedError: If ``error_recovery`` is enabled while
            the start symbol is not ``file_input``.

        :return: A subclass of :py:class:`parso.tree.NodeOrLeaf`. Typically a
            :py:class:`parso.python.tree.Module`.
        """
        if code is None and path is None and file_io is None:
            raise TypeError("Please provide either code or a path.")

        if isinstance(path, str):
            path = Path(path)
        if isinstance(cache_path, str):
            cache_path = Path(cache_path)

        if start_symbol is None:
            start_symbol = self._start_nonterminal

        if error_recovery and start_symbol != 'file_input':
            raise NotImplementedError("This is currently not implemented.")

        if file_io is None:
            if code is None:
                file_io = FileIO(path)  # type: ignore
            else:
                file_io = KnownContentFileIO(path, code)

        # A cache hit returns before the source is read or decoded at all.
        if cache and file_io.path is not None:
            module_node = load_module(self._hashed, file_io, cache_path=cache_path)
            if module_node is not None:
                return module_node  # type: ignore

        if code is None:
            code = file_io.read()
        code = python_bytes_to_unicode(code)

        lines = split_lines(code, keepends=True)
        if diff_cache:
            if self._diff_parser is None:
                raise TypeError("You have to define a diff parser to be able "
                                "to use this option.")
            try:
                module_cache_item = parser_cache[self._hashed][file_io.path]
            except KeyError:
                # Nothing cached for this grammar/path: do a full parse below.
                pass
            else:
                module_node = module_cache_item.node
                old_lines = module_cache_item.lines
                if old_lines == lines:
                    return module_node  # type: ignore

                new_node = self._diff_parser(
                    self._pgen_grammar, self._tokenizer, module_node
                ).update(
                    old_lines=old_lines,
                    new_lines=lines
                )
                self._save_to_cache(file_io, new_node, lines,
                                    cache=cache, cache_path=cache_path)
                return new_node  # type: ignore

        tokens = self._tokenizer(lines)

        p = self._parser(
            self._pgen_grammar,
            error_recovery=error_recovery,
            start_nonterminal=start_symbol
        )
        root_node = p.parse(tokens=tokens)

        if cache or diff_cache:
            self._save_to_cache(file_io, root_node, lines,
                                cache=cache, cache_path=cache_path)
        return root_node  # type: ignore

    def _save_to_cache(self, file_io, node, lines, *, cache, cache_path):
        """
        Hands ``node`` and its ``lines`` to ``try_to_save_module`` under this
        grammar's hash. Pickling is only requested when ``cache`` is set.
        """
        try_to_save_module(self._hashed, file_io, node, lines,
                           # Never pickle in pypy, it's slow as hell.
                           pickling=cache and not is_pypy,
                           cache_path=cache_path)

    def _get_token_namespace(self):
        """
        Returns ``_token_namespace``.

        :raises ValueError: If the class did not set a token namespace.
        """
        ns = self._token_namespace
        if ns is None:
            raise ValueError("The token namespace should be set.")
        return ns

    def iter_errors(self, node):
        """
        Given a :py:class:`parso.tree.NodeOrLeaf` returns the
        :py:class:`parso.normalizer.Issue` objects that the error normalizer
        collected while walking it. For Python these are syntax/indentation
        errors.

        :raises ValueError: If this grammar has no error normalizer config.
        """
        if self._error_normalizer_config is None:
            raise ValueError("No error normalizer specified for this grammar.")

        return self._get_normalizer_issues(node, self._error_normalizer_config)

    def refactor(self, base_node, node_to_str_map):
        """
        Walks ``base_node`` with a ``RefactoringNormalizer`` built from
        ``node_to_str_map`` and returns the result of that walk.
        """
        # NOTE(review): presumably the map goes from nodes to their
        # replacement code and the result is the rewritten source -- confirm
        # against RefactoringNormalizer.
        return RefactoringNormalizer(node_to_str_map).walk(base_node)

    def _get_normalizer(self, normalizer_config):
        """
        Creates a normalizer for this grammar from ``normalizer_config``,
        falling back to ``_default_normalizer_config`` when it is ``None``.

        :raises ValueError: If neither a config nor a default is available.
        """
        if normalizer_config is None:
            normalizer_config = self._default_normalizer_config
            if normalizer_config is None:
                raise ValueError("You need to specify a normalizer, because "
                                 "there's no default normalizer for this tree.")
        return normalizer_config.create_normalizer(self)

    def _normalize(self, node, normalizer_config=None):
        """
        TODO this is not public, yet.
        The returned code will be normalized, e.g. PEP8 for Python.
        """
        normalizer = self._get_normalizer(normalizer_config)
        return normalizer.walk(node)

    def _get_normalizer_issues(self, node, normalizer_config=None):
        """
        Walks ``node`` with a freshly created normalizer and returns the
        issues it recorded; the result of the walk itself is discarded.
        """
        normalizer = self._get_normalizer(normalizer_config)
        normalizer.walk(node)
        return normalizer.issues

    def __repr__(self):
        # Only the first three nonterminals are shown to keep the repr short.
        nonterminals = self._pgen_grammar.nonterminal_to_dfas.keys()
        txt = ' '.join(list(nonterminals)[:3]) + ' ...'
        return '<%s:%s>' % (self.__class__.__name__, txt)

class PythonGrammar(Grammar):
    """
    Grammar for Python source code.

    Configures the base :py:class:`Grammar` with the Python token types, the
    Python tokenizer for ``version_info``, ``PythonParser`` as parser and
    ``DiffParser`` as diff parser.

    :param version_info: Python version that is forwarded to the tokenizer.
    :param bnf_text: A BNF representation of the Python grammar.
    """
    _start_nonterminal = 'file_input'
    _token_namespace = PythonTokenTypes
    _error_normalizer_config = ErrorFinderConfig()

    def __init__(self, version_info: PythonVersionInfo, bnf_text: str):
        # The bound tokenizer only reads ``self.version_info`` once it is
        # called, so it can be handed over before the attribute is assigned.
        python_components = {
            'tokenizer': self._tokenize_lines,
            'parser': PythonParser,
            'diff_parser': DiffParser,
        }
        super().__init__(bnf_text, **python_components)
        self.version_info = version_info

    def _tokenize(self, code):
        # Used by Jedi.
        version = self.version_info
        return tokenize(code, version_info=version)

    def _tokenize_lines(self, lines, **kwargs):
        """Tokenizes ``lines`` for this grammar's Python version."""
        version = self.version_info
        return tokenize_lines(lines, version_info=version, **kwargs)


def load_grammar(*, version: Optional[str] = None,
                 path: Optional[str] = None) -> Grammar:
    """
    Loads a :py:class:`parso.Grammar`. The default version is the current Python
    version.

    Grammars are memoized per grammar file, so repeated calls for the same
    file return the same instance.

    :param str version: A python version string, e.g. ``version='3.8'``.
    :param str path: A path to a grammar file. It is joined onto the
        directory of this module, so relative paths are resolved from there.
    :raises NotImplementedError: If the grammar file does not exist, i.e. the
        requested Python version is not supported or ``path`` is wrong.
    """
    version_info = parse_version_string(version)

    file = path or os.path.join(
        'python',
        'grammar%s%s.txt' % (version_info.major, version_info.minor)
    )
    grammar_path = os.path.join(os.path.dirname(__file__), file)

    try:
        return _loaded_grammars[grammar_path]
    except KeyError:
        pass

    # Only the file access is guarded, so that a FileNotFoundError raised
    # while building the grammar is not misreported as a missing grammar.
    try:
        with open(grammar_path) as f:
            bnf_text = f.read()
    except FileNotFoundError as err:
        if path:
            # An explicit grammar file was requested; blaming the Python
            # version here would point the caller in the wrong direction.
            message = "The grammar file %r could not be found." % grammar_path
        else:
            message = "Python version %s.%s is currently not supported." % (
                version_info.major, version_info.minor
            )
        raise NotImplementedError(message) from err

    grammar = PythonGrammar(version_info, bnf_text)
    # setdefault keeps the instance that is already stored, if there is one.
    return _loaded_grammars.setdefault(grammar_path, grammar)
Commit	Line	Data
53e6db90 DC	1	import hashlib
	2	import os
	3	from typing import Generic, TypeVar, Union, Dict, Optional, Any
	4	from pathlib import Path
	5
	6	from parso._compatibility import is_pypy
	7	from parso.pgen2 import generate_grammar
	8	from parso.utils import split_lines, python_bytes_to_unicode, \
	9	PythonVersionInfo, parse_version_string
	10	from parso.python.diff import DiffParser
	11	from parso.python.tokenize import tokenize_lines, tokenize
	12	from parso.python.token import PythonTokenTypes
	13	from parso.cache import parser_cache, load_module, try_to_save_module
	14	from parso.parser import BaseParser
	15	from parso.python.parser import Parser as PythonParser
	16	from parso.python.errors import ErrorFinderConfig
	17	from parso.python import pep8
	18	from parso.file_io import FileIO, KnownContentFileIO
	19	from parso.normalizer import RefactoringNormalizer, NormalizerConfig
	20
	21	_loaded_grammars: Dict[str, 'Grammar'] = {}
	22
	23	_NodeT = TypeVar("_NodeT")
	24
	25
	26	class Grammar(Generic[_NodeT]):
	27	"""
	28	:py:func:`parso.load_grammar` returns instances of this class.
	29
	30	Creating custom none-python grammars by calling this is not supported, yet.
	31
	32	:param text: A BNF representation of your grammar.
	33	"""
	34	_start_nonterminal: str
	35	_error_normalizer_config: Optional[ErrorFinderConfig] = None
	36	_token_namespace: Any = None
	37	_default_normalizer_config: NormalizerConfig = pep8.PEP8NormalizerConfig()
	38
	39	def __init__(self, text: str, *, tokenizer, parser=BaseParser, diff_parser=None):
	40	self._pgen_grammar = generate_grammar(
	41	text,
	42	token_namespace=self._get_token_namespace()
	43	)
	44	self._parser = parser
	45	self._tokenizer = tokenizer
	46	self._diff_parser = diff_parser
	47	self._hashed = hashlib.sha256(text.encode("utf-8")).hexdigest()
	48
	49	def parse(self,
	50	code: Union[str, bytes] = None,
	51	*,
	52	error_recovery=True,
	53	path: Union[os.PathLike, str] = None,
	54	start_symbol: str = None,
	55	cache=False,
	56	diff_cache=False,
	57	cache_path: Union[os.PathLike, str] = None,
	58	file_io: FileIO = None) -> _NodeT:
	59	"""
	60	If you want to parse a Python file you want to start here, most likely.
	61
	62	If you need finer grained control over the parsed instance, there will be
	63	other ways to access it.
	64
65	:param str code: A unicode or bytes string. When it's not possible to
66	decode bytes to a string, returns a
67	:py:class:`UnicodeDecodeError`.
68	:param bool error_recovery: If enabled, any code will be returned. If
69	it is invalid, it will be returned as an error node. If disabled,
70	you will get a ParseError when encountering syntax errors in your
71	code.
72	:param str start_symbol: The grammar rule (nonterminal) that you want
73	to parse. Only allowed to be used when error_recovery is False.
74	:param str path: The path to the file you want to open. Only needed for caching.
75	:param bool cache: Keeps a copy of the parser tree in RAM and on disk
76	if a path is given. Returns the cached trees if the corresponding
77	files on disk have not changed. Note that this stores pickle files
78	on your file system (e.g. for Linux in ``~/.cache/parso/``).
79	:param bool diff_cache: Diffs the cached python module against the new
80	code and tries to parse only the parts that have changed. Returns
81	the same (changed) module that is found in cache. Using this option
82	requires you to not do anything anymore with the cached modules
83	under that path, because the contents of it might change. This
84	option is still somewhat experimental. If you want stability,
85	please don't use it.
86	:param bool cache_path: If given saves the parso cache in this
87	directory. If not given, defaults to the default cache places on
88	each platform.
89
90	:return: A subclass of :py:class:`parso.tree.NodeOrLeaf`. Typically a
91	:py:class:`parso.python.tree.Module`.
92	"""
93	if code is None and path is None and file_io is None:
94	raise TypeError("Please provide either code or a path.")
95
96	if isinstance(path, str):
97	path = Path(path)
98	if isinstance(cache_path, str):
99	cache_path = Path(cache_path)
100
101	if start_symbol is None:
102	start_symbol = self._start_nonterminal
103
104	if error_recovery and start_symbol != 'file_input':
105	raise NotImplementedError("This is currently not implemented.")
106
107	if file_io is None:
108	if code is None:
109	file_io = FileIO(path) # type: ignore
110	else:
111	file_io = KnownContentFileIO(path, code)
112
113	if cache and file_io.path is not None:
114	module_node = load_module(self._hashed, file_io, cache_path=cache_path)
115	if module_node is not None:
116	return module_node # type: ignore
117
118	if code is None:
119	code = file_io.read()
120	code = python_bytes_to_unicode(code)
121
122	lines = split_lines(code, keepends=True)
123	if diff_cache:
124	if self._diff_parser is None:
125	raise TypeError("You have to define a diff parser to be able "
126	"to use this option.")
127	try:
128	module_cache_item = parser_cache[self._hashed][file_io.path]
129	except KeyError:
130	pass
131	else:
132	module_node = module_cache_item.node
133	old_lines = module_cache_item.lines
134	if old_lines == lines:
135	return module_node # type: ignore
136
137	new_node = self._diff_parser(
138	self._pgen_grammar, self._tokenizer, module_node
139	).update(
140	old_lines=old_lines,
141	new_lines=lines
142	)
143	try_to_save_module(self._hashed, file_io, new_node, lines,
144	# Never pickle in pypy, it's slow as hell.
145	pickling=cache and not is_pypy,
146	cache_path=cache_path)
147	return new_node # type: ignore
148
149	tokens = self._tokenizer(lines)
150
151	p = self._parser(
152	self._pgen_grammar,
153	error_recovery=error_recovery,
154	start_nonterminal=start_symbol
155	)
156	root_node = p.parse(tokens=tokens)
157
158	if cache or diff_cache:
159	try_to_save_module(self._hashed, file_io, root_node, lines,
160	# Never pickle in pypy, it's slow as hell.
161	pickling=cache and not is_pypy,
162	cache_path=cache_path)
163	return root_node # type: ignore
164
165	def _get_token_namespace(self):
166	ns = self._token_namespace
167	if ns is None:
168	raise ValueError("The token namespace should be set.")
169	return ns
170
171	def iter_errors(self, node):
172	"""
173	Given a :py:class:`parso.tree.NodeOrLeaf` returns a generator of
174	:py:class:`parso.normalizer.Issue` objects. For Python this is
175	a list of syntax/indentation errors.
176	"""
177	if self._error_normalizer_config is None:
178	raise ValueError("No error normalizer specified for this grammar.")
179
180	return self._get_normalizer_issues(node, self._error_normalizer_config)
181
182	def refactor(self, base_node, node_to_str_map):
183	return RefactoringNormalizer(node_to_str_map).walk(base_node)
184
185	def _get_normalizer(self, normalizer_config):
186	if normalizer_config is None:
187	normalizer_config = self._default_normalizer_config
188	if normalizer_config is None:
189	raise ValueError("You need to specify a normalizer, because "
190	"there's no default normalizer for this tree.")
191	return normalizer_config.create_normalizer(self)
192
193	def _normalize(self, node, normalizer_config=None):
194	"""
195	TODO this is not public, yet.
196	The returned code will be normalized, e.g. PEP8 for Python.
197	"""
198	normalizer = self._get_normalizer(normalizer_config)
199	return normalizer.walk(node)
200
201	def _get_normalizer_issues(self, node, normalizer_config=None):
202	normalizer = self._get_normalizer(normalizer_config)
203	normalizer.walk(node)
204	return normalizer.issues
205
206	def __repr__(self):
207	nonterminals = self._pgen_grammar.nonterminal_to_dfas.keys()
208	txt = ' '.join(list(nonterminals)[:3]) + ' ...'
209	return '<%s:%s>' % (self.__class__.__name__, txt)
210
211
212	class PythonGrammar(Grammar):
213	_error_normalizer_config = ErrorFinderConfig()
214	_token_namespace = PythonTokenTypes
215	_start_nonterminal = 'file_input'
216
217	def __init__(self, version_info: PythonVersionInfo, bnf_text: str):
218	super().__init__(
219	bnf_text,
220	tokenizer=self._tokenize_lines,
221	parser=PythonParser,
222	diff_parser=DiffParser
223	)
224	self.version_info = version_info
225
226	def _tokenize_lines(self, lines, **kwargs):
227	return tokenize_lines(lines, version_info=self.version_info, **kwargs)
228
229	def _tokenize(self, code):
230	# Used by Jedi.
231	return tokenize(code, version_info=self.version_info)
232
233
234	def load_grammar(*, version: str = None, path: str = None):
235	"""
236	Loads a :py:class:`parso.Grammar`. The default version is the current Python
237	version.
238
239	:param str version: A python version string, e.g. ``version='3.8'``.
240	:param str path: A path to a grammar file
241	"""
242	version_info = parse_version_string(version)
243
244	file = path or os.path.join(
245	'python',
246	'grammar%s%s.txt' % (version_info.major, version_info.minor)
247	)
248
249	global _loaded_grammars
250	path = os.path.join(os.path.dirname(__file__), file)
251	try:
252	return _loaded_grammars[path]
253	except KeyError:
254	try:
255	with open(path) as f:
256	bnf_text = f.read()
257
258	grammar = PythonGrammar(version_info, bnf_text)
259	return _loaded_grammars.setdefault(path, grammar)
260	except FileNotFoundError:
261	message = "Python version %s.%s is currently not supported." % (
262	version_info.major, version_info.minor
263	)
264	raise NotImplementedError(message)