| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286 |
- """
- Docstrings are another source of information for functions and classes.
- :mod:`jedi.inference.dynamic_params` tries to find all executions of functions,
- while the docstring parsing is much easier. There are three different types of
- docstrings that |jedi| understands:
- - `Sphinx <http://sphinx-doc.org/markup/desc.html#info-field-lists>`_
- - `Epydoc <http://epydoc.sourceforge.net/manual-fields.html>`_
- - `Numpydoc <https://github.com/numpy/numpy/blob/master/doc/HOWTO_DOCUMENT.rst.txt>`_
- For example, the sphinx annotation ``:type foo: str`` clearly states that the
- type of ``foo`` is ``str``.
- As an addition to parameter searching, this module also provides return
- annotations.
- """
- import re
- import warnings
- from parso import parse, ParserSyntaxError
- from jedi import debug
- from jedi.inference.cache import inference_state_method_cache
- from jedi.inference.base_value import iterator_to_value_set, ValueSet, \
- NO_VALUES
- from jedi.inference.lazy_value import LazyKnownValues
- DOCSTRING_PARAM_PATTERNS = [
- r'\s*:type\s+%s:\s*([^\n]+)', # Sphinx
- r'\s*:param\s+(\w+)\s+%s:[^\n]*', # Sphinx param with type
- r'\s*@type\s+%s:\s*([^\n]+)', # Epydoc
- ]
- DOCSTRING_RETURN_PATTERNS = [
- re.compile(r'\s*:rtype:\s*([^\n]+)', re.M), # Sphinx
- re.compile(r'\s*@rtype:\s*([^\n]+)', re.M), # Epydoc
- ]
- REST_ROLE_PATTERN = re.compile(r':[^`]+:`([^`]+)`')
- _numpy_doc_string_cache = None
- def _get_numpy_doc_string_cls():
- global _numpy_doc_string_cache
- if isinstance(_numpy_doc_string_cache, (ImportError, SyntaxError)):
- raise _numpy_doc_string_cache
- from numpydoc.docscrape import NumpyDocString # type: ignore[import]
- _numpy_doc_string_cache = NumpyDocString
- return _numpy_doc_string_cache
- def _search_param_in_numpydocstr(docstr, param_str):
- """Search `docstr` (in numpydoc format) for type(-s) of `param_str`."""
- with warnings.catch_warnings():
- warnings.simplefilter("ignore")
- try:
- # This is a non-public API. If it ever changes we should be
- # prepared and return gracefully.
- params = _get_numpy_doc_string_cls()(docstr)._parsed_data['Parameters']
- except Exception:
- return []
- for p_name, p_type, p_descr in params:
- if p_name == param_str:
- m = re.match(r'([^,]+(,[^,]+)*?)(,[ ]*optional)?$', p_type)
- if m:
- p_type = m.group(1)
- return list(_expand_typestr(p_type))
- return []
- def _search_return_in_numpydocstr(docstr):
- """
- Search `docstr` (in numpydoc format) for type(-s) of function returns.
- """
- with warnings.catch_warnings():
- warnings.simplefilter("ignore")
- try:
- doc = _get_numpy_doc_string_cls()(docstr)
- except Exception:
- return
- try:
- # This is a non-public API. If it ever changes we should be
- # prepared and return gracefully.
- returns = doc._parsed_data['Returns']
- returns += doc._parsed_data['Yields']
- except Exception:
- return
- for r_name, r_type, r_descr in returns:
- # Return names are optional and if so the type is in the name
- if not r_type:
- r_type = r_name
- yield from _expand_typestr(r_type)
- def _expand_typestr(type_str):
- """
- Attempts to interpret the possible types in `type_str`
- """
- # Check if alternative types are specified with 'or'
- if re.search(r'\bor\b', type_str):
- for t in type_str.split('or'):
- yield t.split('of')[0].strip()
- # Check if like "list of `type`" and set type to list
- elif re.search(r'\bof\b', type_str):
- yield type_str.split('of')[0]
- # Check if type has is a set of valid literal values eg: {'C', 'F', 'A'}
- elif type_str.startswith('{'):
- node = parse(type_str, version='3.7').children[0]
- if node.type == 'atom':
- for leaf in getattr(node.children[1], "children", []):
- if leaf.type == 'number':
- if '.' in leaf.value:
- yield 'float'
- else:
- yield 'int'
- elif leaf.type == 'string':
- if 'b' in leaf.string_prefix.lower():
- yield 'bytes'
- else:
- yield 'str'
- # Ignore everything else.
- # Otherwise just work with what we have.
- else:
- yield type_str
- def _search_param_in_docstr(docstr, param_str):
- """
- Search `docstr` for type(-s) of `param_str`.
- >>> _search_param_in_docstr(':type param: int', 'param')
- ['int']
- >>> _search_param_in_docstr('@type param: int', 'param')
- ['int']
- >>> _search_param_in_docstr(
- ... ':type param: :class:`threading.Thread`', 'param')
- ['threading.Thread']
- >>> bool(_search_param_in_docstr('no document', 'param'))
- False
- >>> _search_param_in_docstr(':param int param: some description', 'param')
- ['int']
- """
- # look at #40 to see definitions of those params
- patterns = [re.compile(p % re.escape(param_str))
- for p in DOCSTRING_PARAM_PATTERNS]
- for pattern in patterns:
- match = pattern.search(docstr)
- if match:
- return [_strip_rst_role(match.group(1))]
- return _search_param_in_numpydocstr(docstr, param_str)
- def _strip_rst_role(type_str):
- """
- Strip off the part looks like a ReST role in `type_str`.
- >>> _strip_rst_role(':class:`ClassName`') # strip off :class:
- 'ClassName'
- >>> _strip_rst_role(':py:obj:`module.Object`') # works with domain
- 'module.Object'
- >>> _strip_rst_role('ClassName') # do nothing when not ReST role
- 'ClassName'
- See also:
- http://sphinx-doc.org/domains.html#cross-referencing-python-objects
- """
- match = REST_ROLE_PATTERN.match(type_str)
- if match:
- return match.group(1)
- else:
- return type_str
- def _infer_for_statement_string(module_context, string):
- if string is None:
- return []
- potential_imports = re.findall(r'((?:\w+\.)*\w+)\.', string)
- # Try to import module part in dotted name.
- # (e.g., 'threading' in 'threading.Thread').
- imports = "\n".join(f"import {p}" for p in potential_imports)
- string = f'{imports}\n{string}'
- debug.dbg('Parse docstring code %s', string, color='BLUE')
- grammar = module_context.inference_state.grammar
- try:
- module = grammar.parse(string, error_recovery=False)
- except ParserSyntaxError:
- return []
- try:
- # It's not the last item, because that's an end marker.
- stmt = module.children[-2]
- except (AttributeError, IndexError):
- return []
- if stmt.type not in ('name', 'atom', 'atom_expr'):
- return []
- # Here we basically use a fake module that also uses the filters in
- # the actual module.
- from jedi.inference.docstring_utils import DocstringModule
- m = DocstringModule(
- in_module_context=module_context,
- inference_state=module_context.inference_state,
- module_node=module,
- code_lines=[],
- )
- return list(_execute_types_in_stmt(m.as_context(), stmt))
- def _execute_types_in_stmt(module_context, stmt):
- """
- Executing all types or general elements that we find in a statement. This
- doesn't include tuple, list and dict literals, because the stuff they
- contain is executed. (Used as type information).
- """
- definitions = module_context.infer_node(stmt)
- return ValueSet.from_sets(
- _execute_array_values(module_context.inference_state, d)
- for d in definitions
- )
- def _execute_array_values(inference_state, array):
- """
- Tuples indicate that there's not just one return value, but the listed
- ones. `(str, int)` means that it returns a tuple with both types.
- """
- from jedi.inference.value.iterable import SequenceLiteralValue, FakeTuple, FakeList
- if isinstance(array, SequenceLiteralValue) and array.array_type in ('tuple', 'list'):
- values = []
- for lazy_value in array.py__iter__():
- objects = ValueSet.from_sets(
- _execute_array_values(inference_state, typ)
- for typ in lazy_value.infer()
- )
- values.append(LazyKnownValues(objects))
- cls = FakeTuple if array.array_type == 'tuple' else FakeList
- return {cls(inference_state, values)}
- else:
- return array.execute_annotation()
- @inference_state_method_cache()
- def infer_param(function_value, param):
- def infer_docstring(docstring):
- return ValueSet(
- p
- for param_str in _search_param_in_docstr(docstring, param.name.value)
- for p in _infer_for_statement_string(module_context, param_str)
- )
- module_context = function_value.get_root_context()
- func = param.get_parent_function()
- if func.type == 'lambdef':
- return NO_VALUES
- types = infer_docstring(function_value.py__doc__())
- if function_value.is_bound_method() \
- and function_value.py__name__() == '__init__':
- types |= infer_docstring(function_value.class_context.py__doc__())
- debug.dbg('Found param types for docstring: %s', types, color='BLUE')
- return types
- @inference_state_method_cache()
- @iterator_to_value_set
- def infer_return_types(function_value):
- def search_return_in_docstr(code):
- for p in DOCSTRING_RETURN_PATTERNS:
- match = p.search(code)
- if match:
- yield _strip_rst_role(match.group(1))
- # Check for numpy style return hint
- yield from _search_return_in_numpydocstr(code)
- for type_str in search_return_in_docstr(function_value.py__doc__()):
- yield from _infer_for_statement_string(function_value.get_root_context(), type_str)
|