-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathfilter.py
240 lines (198 loc) · 7.56 KB
/
filter.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
"""This module defines functions for filtering mypy type checking errors."""
# remove when dropping Python 3.7-3.9 support
from __future__ import annotations
import importlib.abc
import pathlib
import sys
import tokenize
from collections.abc import Iterable, Sequence
from importlib import util
from typing import NamedTuple
from mypy_upgrade.parsing import MypyError
def _get_module_paths(*, modules: list[str]) -> list[pathlib.Path | None]:
"""Determine file system paths of given modules/packages.
Args:
modules: a list of strings representing (importable) modules.
Returns:
A list (of the same length as the input list) of pathlib.Path objects
corresponding to the given modules. If a path is not found for a
module, the corresponding entry in the output is ``None``.
Raises:
NotImplementedError: Uncountered an unsupported module type.
"""
paths: list[pathlib.Path | None] = []
for module in modules:
spec = util.find_spec(module)
if spec is None:
paths.append(None)
else:
loader = spec.loader
if isinstance(loader, importlib.abc.ExecutionLoader):
module_path = pathlib.Path(loader.get_filename(module))
if loader.is_package(module):
module_path = module_path.parent
elif spec.origin == "frozen":
module_path = pathlib.Path(spec.loader_state.filename)
else:
msg = "Uncountered an unsupported module type."
raise NotImplementedError(msg)
paths.append(module_path)
return paths
def filter_by_source(
*,
errors: list[MypyError],
packages: list[str],
modules: list[str],
files: list[str],
) -> list[MypyError]:
"""Filter `MypyError`s by source (e.g., packages, modules, files).
Args:
errors: a list of `MypyError`s.
packages: a list of strings specifying packages to be included.
modules: a list of strings specifying modules to be included.
files: a list of strings specifying files to be included.
Returns:
A list of `MypyError`s including only those in either ``packages``,
``modules``, or ``files``.
"""
if len(packages + modules + files) == 0:
return errors
package_paths = [
p for p in _get_module_paths(modules=packages) if p is not None
]
module_paths = [
m for m in _get_module_paths(modules=modules) if m is not None
]
file_paths = [pathlib.Path(f).resolve() for f in files]
paths = package_paths + module_paths + file_paths
selected = []
for error in errors:
module_path = pathlib.Path(error.filename).resolve()
# ! Use Path.is_relative_to when dropping Python 3.7-3.8 support
should_include = any(
path in module_path.parents or path == module_path
for path in paths
)
if should_include:
selected.append(error)
return selected
def filter_by_code(
*,
errors: Iterable[MypyError],
codes_to_silence: Iterable[str] | None = None,
) -> list[MypyError]:
"""Filter `MypyError`s by error code.
Args:
errors: a list of `MypyError`s.
codes_to_silence: an optional list of strings indicating the only mypy
error codes to silence. If not supplied, all errors will be
suppressed. Defaults to None.
Returns:
A list of `MypyError`s including only those with error codes in
`codes_to_silence`.
"""
code_filtered_errors = list(errors)
if codes_to_silence is not None:
code_filtered_errors = [
error
for error in code_filtered_errors
if error.error_code in codes_to_silence
]
return code_filtered_errors
class UnsilenceableRegion(NamedTuple):
"""A region within a source code that cannot be silenced by an inline
comment.
Attributes:
start: an integer representing the start line of the unsilenceable
region (1-indexed).
end: an integer representing the end line of the unsilenceable
region (1-indexed).
When start = end, it is interpreted that the Unsilenceable
region is an explicitly continued line.
"""
start: int
end: int
def _find_unsilenceable_regions(
*,
tokens: Iterable[tokenize.TokenInfo],
comments: Sequence[str],
) -> list[UnsilenceableRegion]:
"""Find the regions encapsulated by line continuation characters or
by multiline strings.
Args:
tokens: an iterable containing `TokenInfo` objects.
comments: a sequence of strings representing code comments-one for
each line in the source from which `tokens` is generated.
Returns:
A list of `UnsilenceableRegion` objects.
Multiline strings are represented by `UnsilenceableRegion` objects
whose first entries in their `start` and `end` attributes differ.
Explicitly continued lines are represented by `UnsilenceableRegion`
objects whose first entries in their `start` and `end` attributes are
the same.
"""
unsilenceable_regions: set[UnsilenceableRegion] = set()
for token in tokens:
if token.start[0] != token.end[0] and (
token.exact_type == tokenize.STRING
or (
sys.version_info >= (3, 12)
and token.exact_type == tokenize.FSTRING_MIDDLE
)
):
region = UnsilenceableRegion(token.start[0], token.end[0])
unsilenceable_regions.add(region)
elif (
token.line.rstrip("\r\n").endswith("\\")
and not comments[token.end[0] - 1]
):
region = UnsilenceableRegion(token.end[0], token.end[0])
unsilenceable_regions.add(region)
return list(unsilenceable_regions)
def _is_safe_to_silence(
*, error: MypyError, unsilenceable_regions: Iterable[UnsilenceableRegion]
) -> bool:
"""Determine if the error is safe to silence
Args:
error: a `MypyError` for which a type error suppression comment is to
placed.
unsilenceable_regions: an iterable of `UnsilenceableRegion`s.
Returns:
`False` if the error is in an `UnsilenceableRegion` or its error code
is "syntax"; `True` otherwise.
"""
if error.error_code == "syntax":
return False
for region in unsilenceable_regions:
# Error within an UnsilenceableRegion (but not last line of multiline
# string)
if region.start <= error.line_no <= region.end and not (
error.line_no == region.end and region.start != region.end
):
return False
return True
def filter_by_silenceability(
*,
errors: Iterable[MypyError],
comments: Sequence[str],
tokens: Iterable[tokenize.TokenInfo],
) -> list[MypyError]:
"""Filter `MypyError`s by those which are safe to silence.
Args:
errors: the errors whose line numbers are to be corrected.
comments: a container of strings representing code comments.
tokens: an iterable containing `TokenInfo` objects.
Returns:
A list in which each entry is a `MypyError` from `errors` that can be
silenced with a type suppression comment.
"""
unsilenceable_regions = _find_unsilenceable_regions(
tokens=tokens, comments=comments
)
safe_to_silence = []
for error in errors:
if _is_safe_to_silence(
error=error, unsilenceable_regions=unsilenceable_regions
):
safe_to_silence.append(error)
return safe_to_silence