-
Notifications
You must be signed in to change notification settings - Fork 82
/
Copy pathautoflake.py
executable file
·1610 lines (1347 loc) · 49.4 KB
/
autoflake.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
#!/usr/bin/env python
# Copyright (C) Steven Myint
#
# Permission is hereby granted, free of charge, to any person obtaining
# a copy of this software and associated documentation files (the
# "Software"), to deal in the Software without restriction, including
# without limitation the rights to use, copy, modify, merge, publish,
# distribute, sublicense, and/or sell copies of the Software, and to
# permit persons to whom the Software is furnished to do so, subject to
# the following conditions:
#
# The above copyright notice and this permission notice shall be included
# in all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
"""Removes unused imports and unused variables as reported by pyflakes."""
from __future__ import annotations
import ast
import collections
import difflib
import fnmatch
import io
import logging
import os
import pathlib
import re
import signal
import string
import sys
import sysconfig
import tokenize
from collections.abc import Iterable
from collections.abc import Mapping
from collections.abc import MutableMapping
from collections.abc import Sequence
from typing import Any
from typing import Callable
from typing import cast
from typing import IO
import pyflakes.api
import pyflakes.messages
import pyflakes.reporter
__version__ = "2.3.1"

# Logger named "autoflake"; propagation is switched off so its records are
# not handed on to the handlers of ancestor loggers.
_LOGGER = logging.getLogger("autoflake")
_LOGGER.propagate = False

# Token types that count as an "atom" (a name, number or string token).
ATOMS = frozenset([tokenize.NAME, tokenize.NUMBER, tokenize.STRING])

# Matches a line of the form ``except <types> as <name>:``.
EXCEPT_REGEX = re.compile(r"^\s*except [\s,()\w]+ as \w+:$")

# Matches a ``#!`` line that mentions ``python`` or ``python3`` as its last
# word.  NOTE(review): presumably used for file-type detection together with
# MAX_PYTHON_FILE_DETECTION_BYTES; the consumer is not visible here.
PYTHON_SHEBANG_REGEX = re.compile(r"^#!.*\bpython[3]?\b\s*$")
MAX_PYTHON_FILE_DETECTION_BYTES = 1024

# Matches a ``# autoflake: skip_file`` comment anywhere in a source text.
IGNORE_COMMENT_REGEX = re.compile(
    r"\s*#\s{1,}autoflake:\s{1,}\bskip_file\b",
    re.MULTILINE,
)
def standard_paths() -> Iterable[str]:
    """Yield the directory entries found in the standard library locations.

    The ``stdlib`` and ``platstdlib`` locations reported by ``sysconfig``
    are listed in that order.  Each listing is followed by the entries of
    the location's ``lib-dynload`` sub-directory when that exists.
    """
    locations = sysconfig.get_paths()
    for key in ("stdlib", "platstdlib"):
        if key not in locations:
            continue
        library_dir = locations[key]
        if not os.path.isdir(library_dir):
            continue
        # Entries of the library directory itself.
        yield from os.listdir(library_dir)
        # Entries of the extension-module directory, if there is one.
        extension_dir = os.path.join(library_dir, "lib-dynload")
        if os.path.isdir(extension_dir):
            yield from os.listdir(extension_dir)
def standard_package_names() -> Iterable[str]:
    """Yield the module names derived from the standard library entries.

    Entries that start with ``_`` or contain ``-`` are skipped, as are
    dotted entries that do not end in ``so``, ``py`` or ``pyc``.  The part
    before the first dot is what gets yielded.
    """
    module_suffixes = ("so", "py", "pyc")
    for entry in standard_paths():
        private_or_dashed = entry.startswith("_") or "-" in entry
        foreign_extension = "." in entry and not entry.endswith(module_suffixes)
        if private_or_dashed or foreign_extension:
            continue
        yield entry.split(".")[0]
# Module names that are subtracted from the standard names when SAFE_IMPORTS
# is built below.
IMPORTS_WITH_SIDE_EFFECTS = {"antigravity", "rlcompleter", "this"}

# In case they are built into CPython.
BINARY_IMPORTS = {
    "datetime",
    "grp",
    "io",
    "json",
    "math",
    "multiprocessing",
    "parser",
    "pwd",
    "string",
    "operator",
    "os",
    "sys",
    "time",
}

# ``-`` binds tighter than ``|``, so this evaluates as
# (standard names - IMPORTS_WITH_SIDE_EFFECTS) | BINARY_IMPORTS.
SAFE_IMPORTS = (
    frozenset(standard_package_names()) - IMPORTS_WITH_SIDE_EFFECTS | BINARY_IMPORTS
)
def unused_import_line_numbers(
    messages: Iterable[pyflakes.messages.Message],
) -> Iterable[int]:
    """Yield the ``lineno`` of every ``UnusedImport`` message."""
    yield from (
        report.lineno
        for report in messages
        if isinstance(report, pyflakes.messages.UnusedImport)
    )
def unused_import_module_name(
    messages: Iterable[pyflakes.messages.Message],
) -> Iterable[tuple[int, str]]:
    """Yield ``(lineno, module name)`` for every ``UnusedImport`` message.

    The module name is the first single-quoted text in the message's string
    form; messages without any quoted text are skipped.
    """
    quoted = re.compile(r"\'(.+?)\'")
    for report in messages:
        if not isinstance(report, pyflakes.messages.UnusedImport):
            continue
        found = quoted.search(str(report))
        if not found:
            continue
        # Group 1 is the matched text without its surrounding quotes.
        yield (report.lineno, found.group(1))
def star_import_used_line_numbers(
    messages: Iterable[pyflakes.messages.Message],
) -> Iterable[int]:
    """Yield the ``lineno`` of every ``ImportStarUsed`` message."""
    yield from (
        report.lineno
        for report in messages
        if isinstance(report, pyflakes.messages.ImportStarUsed)
    )
def star_import_usage_undefined_name(
    messages: Iterable[pyflakes.messages.Message],
) -> Iterable[tuple[int, str, str]]:
    """Yield ``(lineno, undefined name, module name)`` per star-import usage.

    Only ``ImportStarUsage`` messages are considered; the two names are the
    first and second entries of the message's ``message_args``.
    """
    for report in messages:
        if not isinstance(report, pyflakes.messages.ImportStarUsage):
            continue
        name = report.message_args[0]
        origin = report.message_args[1]
        yield (report.lineno, name, origin)
def unused_variable_line_numbers(
    messages: Iterable[pyflakes.messages.Message],
) -> Iterable[int]:
    """Yield the ``lineno`` of every ``UnusedVariable`` message."""
    yield from (
        report.lineno
        for report in messages
        if isinstance(report, pyflakes.messages.UnusedVariable)
    )
def duplicate_key_line_numbers(
    messages: Iterable[pyflakes.messages.Message],
    source: str,
) -> Iterable[int]:
    """Yield the line numbers of repeated dictionary keys.

    Only ``MultiValueRepeatedKeyLiteral`` messages are considered.  The
    messages are grouped by key, and a group's line numbers are yielded only
    if every one of its source lines passes ``dict_entry_has_key``.
    """
    repeated = [
        report
        for report in messages
        if isinstance(report, pyflakes.messages.MultiValueRepeatedKeyLiteral)
    ]
    if not repeated:
        return

    # Filter out complex cases. We don't want to bother trying to parse
    # this stuff and get it right. We can do it on a key-by-key basis.
    grouped = create_key_to_messages_dict(repeated)
    source_lines = source.split("\n")
    for reports in grouped.values():
        # Built as a list so that every line of the group is inspected.
        verdicts = [
            dict_entry_has_key(
                source_lines[report.lineno - 1],
                report.message_args[0],
            )
            for report in reports
        ]
        if all(verdicts):
            for report in reports:
                yield report.lineno
def create_key_to_messages_dict(
    messages: Iterable[pyflakes.messages.MultiValueRepeatedKeyLiteral],
) -> Mapping[Any, Iterable[pyflakes.messages.MultiValueRepeatedKeyLiteral]]:
    """Group messages by the first entry of their ``message_args``.

    The result is a ``defaultdict`` whose values are lists holding the
    messages in the order they were given.
    """
    grouped: dict[
        Any,
        list[pyflakes.messages.MultiValueRepeatedKeyLiteral],
    ] = collections.defaultdict(list)
    for report in messages:
        repeated_key = report.message_args[0]
        grouped[repeated_key].append(report)
    return grouped
def check(source: str) -> Iterable[pyflakes.messages.Message]:
    """Run pyflakes over ``source`` and return the collected messages.

    ``AttributeError``, ``RecursionError`` and ``UnicodeDecodeError`` raised
    during the check are swallowed; whatever was collected up to that point
    is returned.
    """
    collector = ListReporter()
    try:
        pyflakes.api.check(source, filename="<string>", reporter=collector)
    except (AttributeError, RecursionError, UnicodeDecodeError):
        # Deliberate best effort: return what has been gathered so far.
        pass
    return collector.messages
class StubFile:
    """File stand-in for pyflakes whose ``write`` discards its arguments."""

    def write(self, *_: Any) -> None:
        """Accept any positional arguments and do nothing with them."""
        return None
class ListReporter(pyflakes.reporter.Reporter):
    """Reporter that stores every flake message in ``self.messages``."""

    def __init__(self) -> None:
        """Set up the reporter with both of its streams stubbed out.

        The base ``Reporter`` is given the same ``StubFile`` for both of its
        stream arguments, so anything it writes is ignored.
        """
        sink = StubFile()
        super().__init__(sink, sink)
        self.messages: list[pyflakes.messages.Message] = []

    def flake(self, message: pyflakes.messages.Message) -> None:
        """Append ``message`` to ``self.messages``."""
        self.messages.append(message)
def extract_package_name(line: str) -> str | None:
    """Return the top-level package named by an import statement.

    ``None`` is returned when the line does not start with ``import`` or
    ``from`` once leading whitespace is ignored.  The line must not contain
    a backslash, parentheses or a semicolon (asserted).
    """
    for forbidden in ("\\", "(", ")", ";"):
        assert forbidden not in line

    if not line.lstrip().startswith(("import", "from")):
        # Ignore doctests.
        return None

    dotted_name = line.split()[1]
    package = dotted_name.split(".")[0]
    assert " " not in package
    return package
def multiline_import(line: str, previous_line: str = "") -> bool:
    """Return True if the import spans multiple lines.

    Any parenthesis in ``line`` settles it; otherwise the answer is
    whatever ``multiline_statement`` says.
    """
    if "(" in line or ")" in line:
        return True
    return multiline_statement(line, previous_line)
def multiline_statement(line: str, previous_line: str = "") -> bool:
    """Return True if ``line`` is part of a multiline statement.

    That is the case when the line contains a backslash, colon or semicolon,
    when it cannot be tokenized on its own, or when ``previous_line`` ends
    in a backslash.
    """
    if any(marker in line for marker in "\\:;"):
        return True

    reader = io.StringIO(line).readline
    try:
        # Drain the tokenizer; only whether it fails is of interest.
        for _ in tokenize.generate_tokens(reader):
            pass
    except (SyntaxError, tokenize.TokenError):
        return True
    return previous_line.rstrip().endswith("\\")
class PendingFix:
    """Base for rewrite operations that need more than one line.

    When a helper in the main rewrite loop returns a ``PendingFix`` rather
    than a string, the loop calls that object with each following line.
    """

    def __init__(self, line: str) -> None:
        """Start the accumulator with the first line."""
        self.accumulator = collections.deque()
        self.accumulator.append(line)

    def __call__(self, line: str) -> PendingFix | str:
        """Process ``line`` together with what has been accumulated.

        Implementations return ``self`` to be fed further lines, or a string
        holding the final result for all the lines processed.
        """
        raise NotImplementedError("Abstract method needs to be overwritten")
def _valid_char_in_line(char: str, line: str) -> bool:
"""Return True if a char appears in the line and is not commented."""
comment_index = line.find("#")
char_index = line.find(char)
valid_char_in_line = char_index >= 0 and (
comment_index > char_index or comment_index < 0
)
return valid_char_in_line
def _top_module(module_name: str) -> str:
"""Return the name of the top level module in the hierarchy."""
if module_name[0] == ".":
return "%LOCAL_MODULE%"
return module_name.split(".")[0]
def _modules_to_remove(
    unused_modules: Iterable[str],
    safe_to_remove: Iterable[str] = SAFE_IMPORTS,
) -> Iterable[str]:
    """Return the unused modules whose top-level module is safe to remove."""
    removable = []
    for module in unused_modules:
        if _top_module(module) in safe_to_remove:
            removable.append(module)
    return removable
def _segment_module(segment: str) -> str:
"""Extract the module identifier inside the segment.
It might be the case the segment does not have a module (e.g. is composed
just by a parenthesis or line continuation and whitespace). In this
scenario we just keep the segment... These characters are not valid in
identifiers, so they will never be contained in the list of unused modules
anyway.
"""
return segment.strip(string.whitespace + ",\\()") or segment
class FilterMultilineImport(PendingFix):
    """Remove unused imports from multiline import statements.

    This class handles both the cases: "from imports" and "direct imports".

    Some limitations exist (e.g. imports with comments, lines joined by ``;``,
    etc). In these cases, the statement is left unchanged to avoid problems.
    """

    # Splits a line at the ``import`` keyword, consuming the whitespace that
    # follows it.
    IMPORT_RE = re.compile(r"\bimport\b\s*")
    # Captures the leading whitespace of a line.
    INDENTATION_RE = re.compile(r"^\s*")
    # Captures the module named after ``from``.
    BASE_RE = re.compile(r"\bfrom\s+([^ ]+)")
    SEGMENT_RE = re.compile(
        r"([^,\s]+(?:[\s\\]+as[\s\\]+[^,\s]+)?[,\s\\)]*)",
        re.M,
    )
    # ^ module + comma + following space (including new line and continuation)
    # Not referenced by any method of this class.
    IDENTIFIER_RE = re.compile(r"[^,\s]+")

    def __init__(
        self,
        line: str,
        unused_module: Iterable[str] = (),
        remove_all_unused_imports: bool = False,
        safe_to_remove: Iterable[str] = SAFE_IMPORTS,
        previous_line: str = "",
    ):
        """Receive the same parameters as ``filter_unused_import``."""
        # Module names that ``fix`` drops from the statement.
        self.remove: Iterable[str] = unused_module
        self.parenthesized: bool = "(" in line
        # ``from_`` is everything before ``import``; ``imports`` is the rest.
        self.from_, imports = self.IMPORT_RE.split(line, maxsplit=1)
        match = self.BASE_RE.search(self.from_)
        # Base module of a "from" import, or None for a direct import.
        self.base = match.group(1) if match else None
        # Once True, ``__call__`` returns the statement unchanged.
        self.give_up: bool = False

        if not remove_all_unused_imports:
            if self.base and _top_module(self.base) not in safe_to_remove:
                self.give_up = True
            else:
                self.remove = _modules_to_remove(self.remove, safe_to_remove)

        if "\\" in previous_line:
            # Ignore tricky things like "try: \<new line> import" ...
            self.give_up = True

        self.analyze(line)

        # Only the text after ``import`` goes into the accumulator.
        PendingFix.__init__(self, imports)

    def is_over(self, line: str | None = None) -> bool:
        """Return True if the multiline import statement is over.

        A parenthesized statement is over once an uncommented ``)`` is seen;
        any other statement is over when the line has no uncommented
        backslash.  Without a ``line`` the last accumulated line is checked.
        """
        line = line or self.accumulator[-1]

        if self.parenthesized:
            return _valid_char_in_line(")", line)

        return not _valid_char_in_line("\\", line)

    def analyze(self, line: str) -> None:
        """Decide if the statement will be fixed or left unchanged.

        A line containing ``;``, ``:`` or ``#`` sets ``give_up``.
        """
        if any(ch in line for ch in ";:#"):
            self.give_up = True

    def fix(self, accumulated: Iterable[str]) -> str:
        """Given a collection of accumulated lines, fix the entire import.

        Returns the rebuilt statement, or an indented ``pass`` when no
        import survives.
        """
        old_imports = "".join(accumulated)
        ending = get_line_ending(old_imports)
        # Split imports into segments that contain the module name +
        # comma + whitespace and eventual <newline> \ ( ) chars
        segments = [x for x in self.SEGMENT_RE.findall(old_imports) if x]
        modules = [_segment_module(x) for x in segments]
        keep = _filter_imports(modules, self.base, self.remove)

        # Short-circuit if no import was discarded
        if len(keep) == len(segments):
            return self.from_ + "import " + "".join(accumulated)

        fixed = ""
        if keep:
            # Since it is very difficult to deal with all the line breaks and
            # continuations, let's use the code layout that already exists and
            # just replace the module identifiers inside the first N-1 segments
            # + the last segment
            templates = list(zip(modules, segments))
            templates = templates[: len(keep) - 1] + templates[-1:]
            # It is important to keep the last segment, since it might contain
            # important chars like `)`
            fixed = "".join(
                template.replace(module, keep[i])
                for i, (module, template) in enumerate(templates)
            )

            # Fix the edge case: inline parenthesis + just one surviving import
            if self.parenthesized and any(ch not in fixed for ch in "()"):
                fixed = fixed.strip(string.whitespace + "()") + ending

        # Replace empty imports with a "pass" statement
        empty = len(fixed.strip(string.whitespace + "\\(),")) < 1
        if empty:
            match = self.INDENTATION_RE.search(self.from_)
            assert match is not None
            indentation = match.group(0)
            return indentation + "pass" + ending

        return self.from_ + "import " + fixed

    def __call__(self, line: str | None = None) -> PendingFix | str:
        """Accumulate all the lines in the import and then trigger the fix.

        Returns ``self`` while the statement is still open.  Once it is
        over, returns the original text if ``give_up`` is set, otherwise the
        result of ``fix``.
        """
        if line:
            self.accumulator.append(line)
            self.analyze(line)
        if not self.is_over(line):
            return self
        if self.give_up:
            return self.from_ + "import " + "".join(self.accumulator)

        return self.fix(self.accumulator)
def _filter_imports(
imports: Iterable[str],
parent: str | None = None,
unused_module: Iterable[str] = (),
) -> Sequence[str]:
# We compare full module name (``a.module`` not `module`) to
# guarantee the exact same module as detected from pyflakes.
sep = "" if parent and parent[-1] == "." else "."
def full_name(name: str) -> str:
return name if parent is None else parent + sep + name
return [x for x in imports if full_name(x) not in unused_module]
def filter_from_import(line: str, unused_module: Iterable[str]) -> str:
    """Filter the names of a ``from something import a, b, c`` line.

    Returns the line with the unused names removed, or an indented ``pass``
    when every name in the statement is unused.
    """
    prefix, names = re.split(
        pattern=r"\bimport\b",
        string=line,
        maxsplit=1,
    )
    base = re.search(
        pattern=r"\bfrom\s+([^ ]+)",
        string=prefix,
    )
    assert base is not None

    candidates = re.split(pattern=r"\s*,\s*", string=names.strip())
    survivors = _filter_imports(candidates, base.group(1), unused_module)
    ending = get_line_ending(line)

    if survivors:
        return prefix + "import " + ", ".join(survivors) + ending

    # All of the import in this statement is unused
    return get_indentation(line) + "pass" + ending
def break_up_import(line: str) -> str:
    """Return ``line`` with each imported module on its own import line.

    The line must be a plain ``import a, b`` statement: no backslash,
    parentheses, semicolon or ``#``, and not a ``from`` import (asserted).
    A line without any trailing whitespace is returned unchanged.
    """
    for forbidden in ("\\", "(", ")", ";", "#"):
        assert forbidden not in line
    assert not line.lstrip().startswith("from")

    newline = get_line_ending(line)
    if not newline:
        return line

    head, modules = re.split(
        pattern=r"\bimport\b",
        string=line,
        maxsplit=1,
    )
    statement_start = head + "import "
    pieces = []
    for module in modules.split(","):
        pieces.append(statement_start + module.strip() + newline)
    return "".join(pieces)
def filter_code(
    source: str,
    additional_imports: Iterable[str] | None = None,
    expand_star_imports: bool = False,
    remove_all_unused_imports: bool = False,
    remove_duplicate_keys: bool = False,
    remove_unused_variables: bool = False,
    remove_rhs_for_unused_variables: bool = False,
    ignore_init_module_imports: bool = False,
) -> Iterable[str]:
    """Yield the lines of ``source`` with the flagged constructs rewritten.

    The source is checked once with pyflakes.  Each line is then either
    passed through unchanged or handed to one of the ``filter_*`` helpers,
    depending on which set of marked line numbers it belongs to.  Lines
    containing ``#`` are always passed through unchanged.

    Args:
        source: The code to filter.
        additional_imports: Extra names added to ``SAFE_IMPORTS`` for this
            call.
        expand_star_imports: Replace the ``*`` of a star import with the
            undefined names pyflakes attributes to it.  Skipped when the
            source mentions ``__all__`` or ``del``, or has more than one
            star import.
        remove_all_unused_imports: Passed on to ``filter_unused_import``.
        remove_duplicate_keys: Handle lines reported as repeated dict keys.
        remove_unused_variables: Handle lines reported as unused variables.
        remove_rhs_for_unused_variables: Passed to ``filter_unused_variable``
            as ``drop_rhs``.
        ignore_init_module_imports: When true, no line is marked as an
            unused import.
    """
    # ``|=`` on a frozenset builds a new set, so SAFE_IMPORTS itself is not
    # modified.
    imports = SAFE_IMPORTS
    if additional_imports:
        imports |= frozenset(additional_imports)
    del additional_imports

    messages = check(source)

    if ignore_init_module_imports:
        marked_import_line_numbers: frozenset[int] = frozenset()
    else:
        marked_import_line_numbers = frozenset(
            unused_import_line_numbers(messages),
        )
    # Line number -> names of the unused modules reported on that line.
    marked_unused_module: dict[int, list[str]] = collections.defaultdict(list)
    for line_number, module_name in unused_import_module_name(messages):
        marked_unused_module[line_number].append(module_name)

    undefined_names: list[str] = []
    if expand_star_imports and not (
        # See explanations in #18.
        re.search(r"\b__all__\b", source)
        or re.search(r"\bdel\b", source)
    ):
        marked_star_import_line_numbers = frozenset(
            star_import_used_line_numbers(messages),
        )
        if len(marked_star_import_line_numbers) > 1:
            # Auto expanding only possible for single star import
            marked_star_import_line_numbers = frozenset()
        else:
            for line_number, undefined_name, _ in star_import_usage_undefined_name(
                messages,
            ):
                undefined_names.append(undefined_name)
            # With no undefined names there is nothing to expand the star to.
            if not undefined_names:
                marked_star_import_line_numbers = frozenset()
    else:
        marked_star_import_line_numbers = frozenset()

    if remove_unused_variables:
        marked_variable_line_numbers = frozenset(
            unused_variable_line_numbers(messages),
        )
    else:
        marked_variable_line_numbers = frozenset()

    if remove_duplicate_keys:
        marked_key_line_numbers: frozenset[int] = frozenset(
            duplicate_key_line_numbers(messages, source),
        )
    else:
        marked_key_line_numbers = frozenset()

    line_messages = get_messages_by_line(messages)

    sio = io.StringIO(source)
    previous_line = ""
    result: str | PendingFix = ""
    for line_number, line in enumerate(sio.readlines(), start=1):
        # An unfinished multiline fix takes every following line until it
        # returns a string.
        if isinstance(result, PendingFix):
            result = result(line)
        elif "#" in line:
            result = line
        elif line_number in marked_import_line_numbers:
            result = filter_unused_import(
                line,
                unused_module=marked_unused_module[line_number],
                remove_all_unused_imports=remove_all_unused_imports,
                imports=imports,
                previous_line=previous_line,
            )
        elif line_number in marked_variable_line_numbers:
            result = filter_unused_variable(
                line,
                drop_rhs=remove_rhs_for_unused_variables,
            )
        elif line_number in marked_key_line_numbers:
            result = filter_duplicate_key(
                line,
                line_messages[line_number],
                line_number,
                marked_key_line_numbers,
                source,
            )
        elif line_number in marked_star_import_line_numbers:
            result = filter_star_import(line, undefined_names)
        else:
            result = line

        # Nothing is yielded while a multiline fix is still accumulating.
        if not isinstance(result, PendingFix):
            yield result

        previous_line = line
def get_messages_by_line(
    messages: Iterable[pyflakes.messages.Message],
) -> Mapping[int, pyflakes.messages.Message]:
    """Return a dictionary mapping each line number to its message.

    When several messages share a line number, the last one wins.
    """
    return {report.lineno: report for report in messages}
def filter_star_import(
    line: str,
    marked_star_import_undefined_name: Iterable[str],
) -> str:
    """Return ``line`` with each ``*`` replaced by the undefined names.

    The names are de-duplicated, sorted and joined with ``", "``.
    """
    unique_names = set(marked_star_import_undefined_name)
    expansion = ", ".join(sorted(unique_names))
    return re.sub(r"\*", expansion, line)
def filter_unused_import(
    line: str,
    unused_module: Iterable[str],
    remove_all_unused_imports: bool,
    imports: Iterable[str],
    previous_line: str = "",
) -> PendingFix | str:
    """Return the replacement for a line flagged as an unused import.

    The result is one of: the line unchanged (a doctest line, or a package
    not in ``imports`` while ``remove_all_unused_imports`` is false); the
    outcome of calling a ``FilterMultilineImport`` for a multiline import;
    the statement split into one import per line; a "from" import with the
    unused names filtered out; or an indented ``pass``.
    """
    stripped = line.lstrip()

    # Ignore doctests.
    if stripped.startswith(">"):
        return line

    if multiline_import(line, previous_line):
        pending = FilterMultilineImport(
            line,
            unused_module,
            remove_all_unused_imports,
            imports,
            previous_line,
        )
        return pending()

    is_from_import = stripped.startswith("from")
    has_comma = "," in line

    if has_comma and not is_from_import:
        return break_up_import(line)

    package = extract_package_name(line)
    keep_as_is = (
        not remove_all_unused_imports
        and package is not None
        and package not in imports
    )
    if keep_as_is:
        return line

    if has_comma:
        assert is_from_import
        return filter_from_import(line, unused_module)

    # We need to replace import with "pass" in case the import is the
    # only line inside a block. For example,
    # "if True:\n    import os". In such cases, if the import is
    # removed, the block will be left hanging with no body.
    return get_indentation(line) + "pass" + get_line_ending(line)
def filter_unused_variable(
    line: str,
    previous_line: str = "",
    drop_rhs: bool = False,
) -> str:
    """Return the replacement for a line flagged as an unused variable.

    An ``except ... as name:`` line loses its ``as name`` part.  A simple
    single-target assignment becomes ``pass`` when its value is a literal or
    a name; otherwise it becomes the bare value expression, or an empty
    string when ``drop_rhs`` is set.  Any other line is returned unchanged.
    """
    if re.match(EXCEPT_REGEX, line):
        return re.sub(r" as \w+:$", ":", line, count=1)

    if multiline_statement(line, previous_line):
        return line

    if line.count("=") != 1:
        return line

    target, _, expression = line.partition("=")
    if "," in target:
        return line

    expression = expression.lstrip()
    if is_literal_or_name(expression):
        # Rather than removing the line, replace with it "pass" to avoid
        # a possible hanging block with no body.
        return get_indentation(line) + "pass" + get_line_ending(line)

    if drop_rhs:
        return ""
    return get_indentation(line) + expression
def filter_duplicate_key(
    line: str,
    message: pyflakes.messages.Message,
    line_number: int,
    marked_line_numbers: Iterable[int],
    source: str,
    previous_line: str = "",
) -> str:
    """Return '' for the lowest marked line number, otherwise ``line``.

    ``message``, ``source`` and ``previous_line`` are accepted but not used.
    """
    if not marked_line_numbers:
        return line
    first_marked = sorted(marked_line_numbers)[0]
    return "" if line_number == first_marked else line
def dict_entry_has_key(line: str, key: Any) -> bool:
    """Return True if `line` is a dict entry that uses `key`.

    Return False for multiline cases where the line should not be removed by
    itself.  Also return False when the line contains a comment, does not
    look like ``<key>: <value>,``, or its key part cannot be evaluated as a
    literal.
    """
    if "#" in line:
        return False

    result = re.match(r"\s*(.*)\s*:\s*(.*),\s*$", line)
    if not result:
        return False

    try:
        candidate_key = ast.literal_eval(result.group(1))
    except (SyntaxError, ValueError, TypeError, MemoryError, RecursionError):
        # literal_eval is documented to raise any of these on malformed
        # input, e.g. TypeError for an unhashable dict key; treat them all
        # as "not a simple key".
        return False

    if multiline_statement(result.group(2)):
        return False

    return cast(bool, candidate_key == key)
def is_literal_or_name(value: str) -> bool:
    """Return True if value is a literal or a name.

    A value counts as a literal when ``ast.literal_eval`` accepts it, or
    when it is one of the empty-container calls ``dict()``, ``list()`` or
    ``set()``.  A name is a single run of word characters with no dots.
    """
    try:
        ast.literal_eval(value)
        return True
    except (SyntaxError, ValueError, TypeError, MemoryError, RecursionError):
        # literal_eval is documented to raise any of these on malformed
        # input (e.g. TypeError for ``{[]: 1}``); none of them means the
        # value is a literal, so fall through to the remaining checks.
        pass

    if value.strip() in ["dict()", "list()", "set()"]:
        return True

    # Support removal of variables on the right side. But make sure
    # there are no dots, which could mean an access of a property.
    return re.match(r"^\w+\s*$", value) is not None
def useless_pass_line_numbers(
    source: str,
    ignore_pass_after_docstring: bool = False,
) -> Iterable[int]:
    """Yield line numbers of unneeded "pass" statements.

    A ``pass`` line is reported when the next line is a statement at the
    same indentation (leading pass), or when the ``pass`` does not open its
    block (trailing pass).  With ``ignore_pass_after_docstring`` a trailing
    ``pass`` that follows a line ending in triple quotes is left alone.
    """
    reader = io.StringIO(source).readline
    prior_type = None
    pass_row = None
    pass_indent = None
    prior_line = ""
    prior_text_line = ""

    for token in tokenize.generate_tokens(reader):
        kind = token.type
        row = token.start[0]
        text = token.line

        on_pass = kind == tokenize.NAME and text.strip() == "pass"

        # Leading "pass".
        follows_pass = (
            row - 1 == pass_row
            and get_indentation(text) == pass_indent
            and kind in ATOMS
            and not on_pass
        )
        if follows_pass:
            yield row - 1

        if on_pass:
            pass_row = row
            pass_indent = get_indentation(text)

            trailing = (
                prior_type != tokenize.INDENT
                and not prior_line.rstrip().endswith("\\")
            )
            after_docstring = prior_text_line.rstrip().endswith(
                ("'''", '"""'),
            )

            # Trailing "pass".
            if trailing:
                if after_docstring and ignore_pass_after_docstring:
                    # Skips the bookkeeping below as well.
                    continue
                yield row

        prior_type = kind
        prior_line = text
        if text.strip():
            prior_text_line = text
def filter_useless_pass(
    source: str,
    ignore_pass_statements: bool = False,
    ignore_pass_after_docstring: bool = False,
) -> Iterable[str]:
    """Yield the lines of ``source`` without the useless "pass" lines.

    Nothing is removed when ``ignore_pass_statements`` is set or when the
    source cannot be tokenized.
    """
    doomed: frozenset[int] = frozenset()
    if not ignore_pass_statements:
        try:
            doomed = frozenset(
                useless_pass_line_numbers(
                    source,
                    ignore_pass_after_docstring,
                ),
            )
        except (SyntaxError, tokenize.TokenError):
            doomed = frozenset()

    numbered_lines = enumerate(io.StringIO(source).readlines(), start=1)
    yield from (text for number, text in numbered_lines if number not in doomed)
def get_indentation(line: str) -> str:
    """Return the leading whitespace of ``line``.

    A line made up only of whitespace has no indentation: '' is returned.
    """
    body = line.lstrip()
    if not body:
        return ""
    return line[: len(line) - len(body)]
def get_line_ending(line: str) -> str:
    """Return the trailing whitespace of ``line``, line break included.

    '' is returned when the line has no trailing whitespace.
    """
    return line[len(line.rstrip()):]
def fix_code(
    source: str,
    additional_imports: Iterable[str] | None = None,
    expand_star_imports: bool = False,
    remove_all_unused_imports: bool = False,
    remove_duplicate_keys: bool = False,
    remove_unused_variables: bool = False,
    remove_rhs_for_unused_variables: bool = False,
    ignore_init_module_imports: bool = False,
    ignore_pass_statements: bool = False,
    ignore_pass_after_docstring: bool = False,
) -> str:
    """Return ``source`` after running every filter until nothing changes.

    Empty source, and source carrying the ``# autoflake: skip_file``
    comment, is returned untouched.  Otherwise ``filter_code`` followed by
    ``filter_useless_pass`` is applied repeatedly until a pass leaves the
    text unchanged.
    """
    if not source:
        return source

    if IGNORE_COMMENT_REGEX.search(source):
        return source

    # pyflakes does not handle "nonlocal" correctly.
    if "nonlocal" in source:
        remove_unused_variables = False

    while True:
        without_unused = "".join(
            filter_code(
                source,
                additional_imports=additional_imports,
                expand_star_imports=expand_star_imports,
                remove_all_unused_imports=remove_all_unused_imports,
                remove_duplicate_keys=remove_duplicate_keys,
                remove_unused_variables=remove_unused_variables,
                remove_rhs_for_unused_variables=(
                    remove_rhs_for_unused_variables
                ),
                ignore_init_module_imports=ignore_init_module_imports,
            ),
        )
        filtered_source = "".join(
            filter_useless_pass(
                without_unused,
                ignore_pass_statements=ignore_pass_statements,
                ignore_pass_after_docstring=ignore_pass_after_docstring,
            ),
        )

        # A pass that changes nothing means the fixed point is reached.
        if filtered_source == source:
            return filtered_source
        source = filtered_source
def fix_file(
    filename: str,
    args: Mapping[str, Any],
    standard_out: IO[str] | None = None,
) -> int:
    """Open ``filename`` and run ``_fix_file`` on it.

    The file is opened with its detected encoding.  ``sys.stdout`` is used
    when ``standard_out`` is not given, and ``args["write_to_stdout"]`` is
    passed on to ``_fix_file``, whose result is returned.
    """
    output = sys.stdout if standard_out is None else standard_out
    encoding = detect_encoding(filename)
    with open_with_encoding(filename, encoding=encoding) as input_file:
        return _fix_file(
            input_file,
            filename,
            args,
            args["write_to_stdout"],
            cast(IO[str], output),
            encoding=encoding,
        )
def _fix_file(
input_file: IO[str],
filename: str,
args: Mapping[str, Any],
write_to_stdout: bool,
standard_out: IO[str],
encoding: str | None = None,
) -> int:
source = input_file.read()
original_source = source
isInitFile = os.path.basename(filename) == "__init__.py"
if args["ignore_init_module_imports"] and isInitFile:
ignore_init_module_imports = True
else:
ignore_init_module_imports = False
filtered_source = fix_code(
source,
additional_imports=(args["imports"].split(",") if "imports" in args else None),
expand_star_imports=args["expand_star_imports"],
remove_all_unused_imports=args["remove_all_unused_imports"],
remove_duplicate_keys=args["remove_duplicate_keys"],
remove_unused_variables=args["remove_unused_variables"],
remove_rhs_for_unused_variables=(args["remove_rhs_for_unused_variables"]),
ignore_init_module_imports=ignore_init_module_imports,
ignore_pass_statements=args["ignore_pass_statements"],
ignore_pass_after_docstring=args["ignore_pass_after_docstring"],
)