@@ -1955,6 +1955,18 @@ def visit_factor(self, node: Node) -> Iterator[Line]:
1955
1955
node .insert_child (index , Node (syms .atom , [lpar , operand , rpar ]))
1956
1956
yield from self .visit_default (node )
1957
1957
1958
+ def visit_STRING (self , leaf : Leaf ) -> Iterator [Line ]:
1959
+ # Check if it's a docstring
1960
+ if prev_siblings_are (
1961
+ leaf .parent , [None , token .NEWLINE , token .INDENT , syms .simple_stmt ]
1962
+ ) and is_multiline_string (leaf ):
1963
+ prefix = " " * self .current_line .depth
1964
+ docstring = fix_docstring (leaf .value [3 :- 3 ], prefix )
1965
+ leaf .value = leaf .value [0 :3 ] + docstring + leaf .value [- 3 :]
1966
+ normalize_string_quotes (leaf )
1967
+
1968
+ yield from self .visit_default (leaf )
1969
+
1958
1970
def __post_init__ (self ) -> None :
1959
1971
"""You are in a twisty little maze of passages."""
1960
1972
v = self .visit_stmt
@@ -2236,6 +2248,22 @@ def preceding_leaf(node: Optional[LN]) -> Optional[Leaf]:
2236
2248
return None
2237
2249
2238
2250
2251
+ def prev_siblings_are (node : Optional [LN ], tokens : List [Optional [NodeType ]]) -> bool :
2252
+ """Return if the `node` and its previous siblings match types against the provided
2253
+ list of tokens; the provided `node`has its type matched against the last element in
2254
+ the list. `None` can be used as the first element to declare that the start of the
2255
+ list is anchored at the start of its parent's children."""
2256
+ if not tokens :
2257
+ return True
2258
+ if tokens [- 1 ] is None :
2259
+ return node is None
2260
+ if not node :
2261
+ return False
2262
+ if node .type != tokens [- 1 ]:
2263
+ return False
2264
+ return prev_siblings_are (node .prev_sibling , tokens [:- 1 ])
2265
+
2266
+
2239
2267
def child_towards (ancestor : Node , descendant : LN ) -> Optional [LN ]:
2240
2268
"""Return the child of `ancestor` that contains `descendant`."""
2241
2269
node : Optional [LN ] = descendant
@@ -5804,54 +5832,66 @@ def _fixup_ast_constants(
5804
5832
return node
5805
5833
5806
5834
5807
- def assert_equivalent (src : str , dst : str ) -> None :
5808
- """Raise AssertionError if `src` and `dst` aren't equivalent."""
5809
-
5810
- def _v (node : Union [ast .AST , ast3 .AST , ast27 .AST ], depth : int = 0 ) -> Iterator [str ]:
5811
- """Simple visitor generating strings to compare ASTs by content."""
5835
+ def _stringify_ast (
5836
+ node : Union [ast .AST , ast3 .AST , ast27 .AST ], depth : int = 0
5837
+ ) -> Iterator [str ]:
5838
+ """Simple visitor generating strings to compare ASTs by content."""
5812
5839
5813
- node = _fixup_ast_constants (node )
5840
+ node = _fixup_ast_constants (node )
5814
5841
5815
- yield f"{ ' ' * depth } { node .__class__ .__name__ } ("
5842
+ yield f"{ ' ' * depth } { node .__class__ .__name__ } ("
5816
5843
5817
- for field in sorted (node ._fields ): # noqa: F402
5818
- # TypeIgnore has only one field 'lineno' which breaks this comparison
5819
- type_ignore_classes = (ast3 .TypeIgnore , ast27 .TypeIgnore )
5820
- if sys .version_info >= (3 , 8 ):
5821
- type_ignore_classes += (ast .TypeIgnore ,)
5822
- if isinstance (node , type_ignore_classes ):
5823
- break
5844
+ for field in sorted (node ._fields ): # noqa: F402
5845
+ # TypeIgnore has only one field 'lineno' which breaks this comparison
5846
+ type_ignore_classes = (ast3 .TypeIgnore , ast27 .TypeIgnore )
5847
+ if sys .version_info >= (3 , 8 ):
5848
+ type_ignore_classes += (ast .TypeIgnore ,)
5849
+ if isinstance (node , type_ignore_classes ):
5850
+ break
5824
5851
5825
- try :
5826
- value = getattr (node , field )
5827
- except AttributeError :
5828
- continue
5852
+ try :
5853
+ value = getattr (node , field )
5854
+ except AttributeError :
5855
+ continue
5829
5856
5830
- yield f"{ ' ' * (depth + 1 )} { field } ="
5857
+ yield f"{ ' ' * (depth + 1 )} { field } ="
5831
5858
5832
- if isinstance (value , list ):
5833
- for item in value :
5834
- # Ignore nested tuples within del statements, because we may insert
5835
- # parentheses and they change the AST.
5836
- if (
5837
- field == "targets"
5838
- and isinstance (node , (ast .Delete , ast3 .Delete , ast27 .Delete ))
5839
- and isinstance (item , (ast .Tuple , ast3 .Tuple , ast27 .Tuple ))
5840
- ):
5841
- for item in item .elts :
5842
- yield from _v (item , depth + 2 )
5859
+ if isinstance (value , list ):
5860
+ for item in value :
5861
+ # Ignore nested tuples within del statements, because we may insert
5862
+ # parentheses and they change the AST.
5863
+ if (
5864
+ field == "targets"
5865
+ and isinstance (node , (ast .Delete , ast3 .Delete , ast27 .Delete ))
5866
+ and isinstance (item , (ast .Tuple , ast3 .Tuple , ast27 .Tuple ))
5867
+ ):
5868
+ for item in item .elts :
5869
+ yield from _stringify_ast (item , depth + 2 )
5843
5870
5844
- elif isinstance (item , (ast .AST , ast3 .AST , ast27 .AST )):
5845
- yield from _v (item , depth + 2 )
5871
+ elif isinstance (item , (ast .AST , ast3 .AST , ast27 .AST )):
5872
+ yield from _stringify_ast (item , depth + 2 )
5846
5873
5847
- elif isinstance (value , (ast .AST , ast3 .AST , ast27 .AST )):
5848
- yield from _v (value , depth + 2 )
5874
+ elif isinstance (value , (ast .AST , ast3 .AST , ast27 .AST )):
5875
+ yield from _stringify_ast (value , depth + 2 )
5849
5876
5877
+ else :
5878
+ # Constant strings may be indented across newlines, if they are
5879
+ # docstrings; fold spaces after newlines when comparing
5880
+ if (
5881
+ isinstance (node , ast .Constant )
5882
+ and field == "value"
5883
+ and isinstance (value , str )
5884
+ ):
5885
+ normalized = re .sub (r"\n[ \t]+" , "\n " , value )
5850
5886
else :
5851
- yield f"{ ' ' * (depth + 2 )} { value !r} , # { value .__class__ .__name__ } "
5887
+ normalized = value
5888
+ yield f"{ ' ' * (depth + 2 )} { normalized !r} , # { value .__class__ .__name__ } "
5889
+
5890
+ yield f"{ ' ' * depth } ) # /{ node .__class__ .__name__ } "
5852
5891
5853
- yield f"{ ' ' * depth } ) # /{ node .__class__ .__name__ } "
5854
5892
5893
+ def assert_equivalent (src : str , dst : str ) -> None :
5894
+ """Raise AssertionError if `src` and `dst` aren't equivalent."""
5855
5895
try :
5856
5896
src_ast = parse_ast (src )
5857
5897
except Exception as exc :
@@ -5870,8 +5910,8 @@ def _v(node: Union[ast.AST, ast3.AST, ast27.AST], depth: int = 0) -> Iterator[st
5870
5910
f" helpful: { log } "
5871
5911
) from None
5872
5912
5873
- src_ast_str = "\n " .join (_v (src_ast ))
5874
- dst_ast_str = "\n " .join (_v (dst_ast ))
5913
+ src_ast_str = "\n " .join (_stringify_ast (src_ast ))
5914
+ dst_ast_str = "\n " .join (_stringify_ast (dst_ast ))
5875
5915
if src_ast_str != dst_ast_str :
5876
5916
log = dump_to_file (diff (src_ast_str , dst_ast_str , "src" , "dst" ))
5877
5917
raise AssertionError (
@@ -6236,5 +6276,32 @@ def patched_main() -> None:
6236
6276
main ()
6237
6277
6238
6278
6279
+ def fix_docstring (docstring : str , prefix : str ) -> str :
6280
+ # https://www.python.org/dev/peps/pep-0257/#handling-docstring-indentation
6281
+ if not docstring :
6282
+ return ""
6283
+ # Convert tabs to spaces (following the normal Python rules)
6284
+ # and split into a list of lines:
6285
+ lines = docstring .expandtabs ().splitlines ()
6286
+ # Determine minimum indentation (first line doesn't count):
6287
+ indent = sys .maxsize
6288
+ for line in lines [1 :]:
6289
+ stripped = line .lstrip ()
6290
+ if stripped :
6291
+ indent = min (indent , len (line ) - len (stripped ))
6292
+ # Remove indentation (first line is special):
6293
+ trimmed = [lines [0 ].strip ()]
6294
+ if indent < sys .maxsize :
6295
+ last_line_idx = len (lines ) - 2
6296
+ for i , line in enumerate (lines [1 :]):
6297
+ stripped_line = line [indent :].rstrip ()
6298
+ if stripped_line or i == last_line_idx :
6299
+ trimmed .append (prefix + stripped_line )
6300
+ else :
6301
+ trimmed .append ("" )
6302
+ # Return a single string:
6303
+ return "\n " .join (trimmed )
6304
+
6305
+
6239
6306
if __name__ == "__main__" :
6240
6307
patched_main ()
0 commit comments