Skip to content

Commit a4c11a7

Browse files
alexmvbancekzsol
authored
Re-indent the contents of docstrings (#1053)
* Re-indent the contents of docstrings when indentation changes Keeping the contents of docstrings completely unchanged when re-indenting (from 2-space intents to 4, for example) can cause incorrect docstring indentation: ``` class MyClass: """Multiline class docstring """ def method(self): """Multiline method docstring """ pass ``` ...becomes: ``` class MyClass: """Multiline class docstring """ def method(self): """Multiline method docstring """ pass ``` This uses the PEP 257 algorithm for determining docstring indentation, and adjusts the contents of docstrings to match their new indentation after `black` is applied. A small normalization is necessary to `assert_equivalent` because the trees are technically no longer precisely equivalent -- some constant strings have changed. When comparing two ASTs, whitespace after newlines within constant strings is thus folded into a single space. Co-authored-by: Luka Zakrajšek <[email protected]> * Extract the inner `_v` method to decrease complexity This reduces the cyclomatic complexity to a level that makes flake8 happy. * Blacken blib2to3's docstring which had an over-indent Co-authored-by: Luka Zakrajšek <[email protected]> Co-authored-by: Zsolt Dollenstein <[email protected]>
1 parent 9938c92 commit a4c11a7

File tree

4 files changed

+251
-39
lines changed

4 files changed

+251
-39
lines changed

black.py

+105-38
Original file line numberDiff line numberDiff line change
@@ -1955,6 +1955,18 @@ def visit_factor(self, node: Node) -> Iterator[Line]:
19551955
node.insert_child(index, Node(syms.atom, [lpar, operand, rpar]))
19561956
yield from self.visit_default(node)
19571957

1958+
def visit_STRING(self, leaf: Leaf) -> Iterator[Line]:
1959+
# Check if it's a docstring
1960+
if prev_siblings_are(
1961+
leaf.parent, [None, token.NEWLINE, token.INDENT, syms.simple_stmt]
1962+
) and is_multiline_string(leaf):
1963+
prefix = " " * self.current_line.depth
1964+
docstring = fix_docstring(leaf.value[3:-3], prefix)
1965+
leaf.value = leaf.value[0:3] + docstring + leaf.value[-3:]
1966+
normalize_string_quotes(leaf)
1967+
1968+
yield from self.visit_default(leaf)
1969+
19581970
def __post_init__(self) -> None:
19591971
"""You are in a twisty little maze of passages."""
19601972
v = self.visit_stmt
@@ -2236,6 +2248,22 @@ def preceding_leaf(node: Optional[LN]) -> Optional[Leaf]:
22362248
return None
22372249

22382250

2251+
def prev_siblings_are(node: Optional[LN], tokens: List[Optional[NodeType]]) -> bool:
2252+
"""Return if the `node` and its previous siblings match types against the provided
2253+
list of tokens; the provided `node`has its type matched against the last element in
2254+
the list. `None` can be used as the first element to declare that the start of the
2255+
list is anchored at the start of its parent's children."""
2256+
if not tokens:
2257+
return True
2258+
if tokens[-1] is None:
2259+
return node is None
2260+
if not node:
2261+
return False
2262+
if node.type != tokens[-1]:
2263+
return False
2264+
return prev_siblings_are(node.prev_sibling, tokens[:-1])
2265+
2266+
22392267
def child_towards(ancestor: Node, descendant: LN) -> Optional[LN]:
22402268
"""Return the child of `ancestor` that contains `descendant`."""
22412269
node: Optional[LN] = descendant
@@ -5804,54 +5832,66 @@ def _fixup_ast_constants(
58045832
return node
58055833

58065834

5807-
def assert_equivalent(src: str, dst: str) -> None:
5808-
"""Raise AssertionError if `src` and `dst` aren't equivalent."""
5809-
5810-
def _v(node: Union[ast.AST, ast3.AST, ast27.AST], depth: int = 0) -> Iterator[str]:
5811-
"""Simple visitor generating strings to compare ASTs by content."""
5835+
def _stringify_ast(
5836+
node: Union[ast.AST, ast3.AST, ast27.AST], depth: int = 0
5837+
) -> Iterator[str]:
5838+
"""Simple visitor generating strings to compare ASTs by content."""
58125839

5813-
node = _fixup_ast_constants(node)
5840+
node = _fixup_ast_constants(node)
58145841

5815-
yield f"{' ' * depth}{node.__class__.__name__}("
5842+
yield f"{' ' * depth}{node.__class__.__name__}("
58165843

5817-
for field in sorted(node._fields): # noqa: F402
5818-
# TypeIgnore has only one field 'lineno' which breaks this comparison
5819-
type_ignore_classes = (ast3.TypeIgnore, ast27.TypeIgnore)
5820-
if sys.version_info >= (3, 8):
5821-
type_ignore_classes += (ast.TypeIgnore,)
5822-
if isinstance(node, type_ignore_classes):
5823-
break
5844+
for field in sorted(node._fields): # noqa: F402
5845+
# TypeIgnore has only one field 'lineno' which breaks this comparison
5846+
type_ignore_classes = (ast3.TypeIgnore, ast27.TypeIgnore)
5847+
if sys.version_info >= (3, 8):
5848+
type_ignore_classes += (ast.TypeIgnore,)
5849+
if isinstance(node, type_ignore_classes):
5850+
break
58245851

5825-
try:
5826-
value = getattr(node, field)
5827-
except AttributeError:
5828-
continue
5852+
try:
5853+
value = getattr(node, field)
5854+
except AttributeError:
5855+
continue
58295856

5830-
yield f"{' ' * (depth+1)}{field}="
5857+
yield f"{' ' * (depth+1)}{field}="
58315858

5832-
if isinstance(value, list):
5833-
for item in value:
5834-
# Ignore nested tuples within del statements, because we may insert
5835-
# parentheses and they change the AST.
5836-
if (
5837-
field == "targets"
5838-
and isinstance(node, (ast.Delete, ast3.Delete, ast27.Delete))
5839-
and isinstance(item, (ast.Tuple, ast3.Tuple, ast27.Tuple))
5840-
):
5841-
for item in item.elts:
5842-
yield from _v(item, depth + 2)
5859+
if isinstance(value, list):
5860+
for item in value:
5861+
# Ignore nested tuples within del statements, because we may insert
5862+
# parentheses and they change the AST.
5863+
if (
5864+
field == "targets"
5865+
and isinstance(node, (ast.Delete, ast3.Delete, ast27.Delete))
5866+
and isinstance(item, (ast.Tuple, ast3.Tuple, ast27.Tuple))
5867+
):
5868+
for item in item.elts:
5869+
yield from _stringify_ast(item, depth + 2)
58435870

5844-
elif isinstance(item, (ast.AST, ast3.AST, ast27.AST)):
5845-
yield from _v(item, depth + 2)
5871+
elif isinstance(item, (ast.AST, ast3.AST, ast27.AST)):
5872+
yield from _stringify_ast(item, depth + 2)
58465873

5847-
elif isinstance(value, (ast.AST, ast3.AST, ast27.AST)):
5848-
yield from _v(value, depth + 2)
5874+
elif isinstance(value, (ast.AST, ast3.AST, ast27.AST)):
5875+
yield from _stringify_ast(value, depth + 2)
58495876

5877+
else:
5878+
# Constant strings may be indented across newlines, if they are
5879+
# docstrings; fold spaces after newlines when comparing
5880+
if (
5881+
isinstance(node, ast.Constant)
5882+
and field == "value"
5883+
and isinstance(value, str)
5884+
):
5885+
normalized = re.sub(r"\n[ \t]+", "\n ", value)
58505886
else:
5851-
yield f"{' ' * (depth+2)}{value!r}, # {value.__class__.__name__}"
5887+
normalized = value
5888+
yield f"{' ' * (depth+2)}{normalized!r}, # {value.__class__.__name__}"
5889+
5890+
yield f"{' ' * depth}) # /{node.__class__.__name__}"
58525891

5853-
yield f"{' ' * depth}) # /{node.__class__.__name__}"
58545892

5893+
def assert_equivalent(src: str, dst: str) -> None:
5894+
"""Raise AssertionError if `src` and `dst` aren't equivalent."""
58555895
try:
58565896
src_ast = parse_ast(src)
58575897
except Exception as exc:
@@ -5870,8 +5910,8 @@ def _v(node: Union[ast.AST, ast3.AST, ast27.AST], depth: int = 0) -> Iterator[st
58705910
f" helpful: {log}"
58715911
) from None
58725912

5873-
src_ast_str = "\n".join(_v(src_ast))
5874-
dst_ast_str = "\n".join(_v(dst_ast))
5913+
src_ast_str = "\n".join(_stringify_ast(src_ast))
5914+
dst_ast_str = "\n".join(_stringify_ast(dst_ast))
58755915
if src_ast_str != dst_ast_str:
58765916
log = dump_to_file(diff(src_ast_str, dst_ast_str, "src", "dst"))
58775917
raise AssertionError(
@@ -6236,5 +6276,32 @@ def patched_main() -> None:
62366276
main()
62376277

62386278

6279+
def fix_docstring(docstring: str, prefix: str) -> str:
6280+
# https://www.python.org/dev/peps/pep-0257/#handling-docstring-indentation
6281+
if not docstring:
6282+
return ""
6283+
# Convert tabs to spaces (following the normal Python rules)
6284+
# and split into a list of lines:
6285+
lines = docstring.expandtabs().splitlines()
6286+
# Determine minimum indentation (first line doesn't count):
6287+
indent = sys.maxsize
6288+
for line in lines[1:]:
6289+
stripped = line.lstrip()
6290+
if stripped:
6291+
indent = min(indent, len(line) - len(stripped))
6292+
# Remove indentation (first line is special):
6293+
trimmed = [lines[0].strip()]
6294+
if indent < sys.maxsize:
6295+
last_line_idx = len(lines) - 2
6296+
for i, line in enumerate(lines[1:]):
6297+
stripped_line = line[indent:].rstrip()
6298+
if stripped_line or i == last_line_idx:
6299+
trimmed.append(prefix + stripped_line)
6300+
else:
6301+
trimmed.append("")
6302+
# Return a single string:
6303+
return "\n".join(trimmed)
6304+
6305+
62396306
if __name__ == "__main__":
62406307
patched_main()

blib2to3/pytree.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -962,7 +962,7 @@ def generate_matches(
962962
(count, results) tuples where:
963963
count: the entire sequence of patterns matches nodes[:count];
964964
results: dict containing named submatches.
965-
"""
965+
"""
966966
if not patterns:
967967
yield 0, {}
968968
else:

tests/data/docstring.py

+138
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,138 @@
1+
class MyClass:
2+
"""Multiline
3+
class docstring
4+
"""
5+
6+
def method(self):
7+
"""Multiline
8+
method docstring
9+
"""
10+
pass
11+
12+
13+
def foo():
14+
"""This is a docstring with
15+
some lines of text here
16+
"""
17+
return
18+
19+
20+
def bar():
21+
'''This is another docstring
22+
with more lines of text
23+
'''
24+
return
25+
26+
27+
def baz():
28+
'''"This" is a string with some
29+
embedded "quotes"'''
30+
return
31+
32+
33+
def troz():
34+
'''Indentation with tabs
35+
is just as OK
36+
'''
37+
return
38+
39+
40+
def zort():
41+
"""Another
42+
multiline
43+
docstring
44+
"""
45+
pass
46+
47+
def poit():
48+
"""
49+
Lorem ipsum dolor sit amet.
50+
51+
Consectetur adipiscing elit:
52+
- sed do eiusmod tempor incididunt ut labore
53+
- dolore magna aliqua
54+
- enim ad minim veniam
55+
- quis nostrud exercitation ullamco laboris nisi
56+
- aliquip ex ea commodo consequat
57+
"""
58+
pass
59+
60+
61+
def over_indent():
62+
"""
63+
This has a shallow indent
64+
- But some lines are deeper
65+
- And the closing quote is too deep
66+
"""
67+
pass
68+
69+
# output
70+
71+
class MyClass:
72+
"""Multiline
73+
class docstring
74+
"""
75+
76+
def method(self):
77+
"""Multiline
78+
method docstring
79+
"""
80+
pass
81+
82+
83+
def foo():
84+
"""This is a docstring with
85+
some lines of text here
86+
"""
87+
return
88+
89+
90+
def bar():
91+
"""This is another docstring
92+
with more lines of text
93+
"""
94+
return
95+
96+
97+
def baz():
98+
'''"This" is a string with some
99+
embedded "quotes"'''
100+
return
101+
102+
103+
def troz():
104+
"""Indentation with tabs
105+
is just as OK
106+
"""
107+
return
108+
109+
110+
def zort():
111+
"""Another
112+
multiline
113+
docstring
114+
"""
115+
pass
116+
117+
118+
def poit():
119+
"""
120+
Lorem ipsum dolor sit amet.
121+
122+
Consectetur adipiscing elit:
123+
- sed do eiusmod tempor incididunt ut labore
124+
- dolore magna aliqua
125+
- enim ad minim veniam
126+
- quis nostrud exercitation ullamco laboris nisi
127+
- aliquip ex ea commodo consequat
128+
"""
129+
pass
130+
131+
132+
def over_indent():
133+
"""
134+
This has a shallow indent
135+
- But some lines are deeper
136+
- And the closing quote is too deep
137+
"""
138+
pass

tests/test_black.py

+7
Original file line numberDiff line numberDiff line change
@@ -391,6 +391,13 @@ def test_string_quotes(self) -> None:
391391
black.assert_stable(source, not_normalized, mode=mode)
392392

393393
@patch("black.dump_to_file", dump_to_stderr)
394+
def test_docstring(self) -> None:
395+
source, expected = read_data("docstring")
396+
actual = fs(source)
397+
self.assertFormatEqual(expected, actual)
398+
black.assert_equivalent(source, actual)
399+
black.assert_stable(source, actual, black.FileMode())
400+
394401
def test_long_strings(self) -> None:
395402
"""Tests for splitting long strings."""
396403
source, expected = read_data("long_strings")

0 commit comments

Comments
 (0)