Address review feedback and handle more cases (with added tests)

Harlan Haskins · Harlan Haskins · commit 692ce0d069ff · 2023-10-24T20:39:24.000-06:00
diff --git a/lib/AST/InlinableText.cpp b/lib/AST/InlinableText.cpp
@@ -189,6 +189,13 @@ struct ExtractInactiveRanges : public ASTWalker {
 };
 } // end anonymous namespace
 
+/// Appends the textual contents of the provided source range, stripping
+/// the contents of comments that appear in the source.
+///
+/// Given that comments are treated as whitespace, this also appends a
+/// space or newline (depending on whether the comment was a block comment
+/// whose body contained newlines) in place of the comment, to avoid fusing
+/// tokens together.
 static void appendRange(
   SourceManager &sourceMgr, SourceLoc start, SourceLoc end,
   SmallVectorImpl<char> &scratch) {
@@ -210,28 +217,44 @@ static void appendRange(
     lexer.lex(token);
 
     if (token.is(tok::comment)) {
-      // Append the range from the last non-comment token to the beginning of this comment
-      // token.
+      // Grab the start of the full comment token (with leading trivia as well)
       SourceLoc commentLoc = token.getLoc();
-      auto charRange = CharSourceRange(sourceMgr, nonCommentStart, commentLoc);
-      StringRef text = sourceMgr.extractText(charRange);
-      scratch.append(text.begin(), text.end());
 
-      // Append a single whitespace character, to avoid fusing tokens.
-      scratch.push_back(' ');
-
-      // Set the start of the next non-comment range to the end of this token.
+      // Find the end of the token (with trailing trivia)
       SourceLoc endLoc = Lexer::getLocForEndOfToken(sourceMgr, token.getLoc());
 
-      // The comment token's end location includes trailing whitespace, so trim trailing
+      // The comment token's range includes leading/trailing whitespace, so trim
       // whitespace and only strip the portions of the comment that are not whitespace.
       CharSourceRange range = CharSourceRange(sourceMgr, commentLoc, endLoc);
-      StringRef commentText = sourceMgr.extractText(range);
-      unsigned whitespaceOffset = commentText.size() - commentText.rtrim().size();
-      if (whitespaceOffset > 0) {
-        endLoc = endLoc.getAdvancedLoc(-whitespaceOffset);
+      StringRef fullTokenText = sourceMgr.extractText(range);
+      unsigned leadingWhitespace = fullTokenText.size() - fullTokenText.ltrim().size();
+      if (leadingWhitespace > 0) {
+        commentLoc = commentLoc.getAdvancedLoc(leadingWhitespace);
+      }
+
+      unsigned trailingWhitespace = fullTokenText.size() - fullTokenText.rtrim().size();
+      if (trailingWhitespace > 0) {
+        endLoc = endLoc.getAdvancedLoc(-trailingWhitespace);
       }
 
+      // First, extract the text up to the start of the comment, including the whitespace.
+      auto charRange = CharSourceRange(sourceMgr, nonCommentStart, commentLoc);
+      StringRef text = sourceMgr.extractText(charRange);
+      scratch.append(text.begin(), text.end());
+
+      // Next, search through the comment text to see if it's a block comment with a newline. If so,
+      // we need to re-insert a newline to avoid fusing multi-line tokens together.
+      auto commentTextRange = CharSourceRange(sourceMgr, commentLoc, endLoc);
+      StringRef commentText = sourceMgr.extractText(commentTextRange);
+      bool hasNewline = commentText.find_first_of("\n\r") != StringRef::npos;
+
+      // Use a newline as a filler character if the comment itself had a newline in it.
+      char filler = hasNewline ? '\n' : ' ';
+
+      // Append a single whitespace filler character, to avoid fusing tokens.
+      scratch.push_back(filler);
+
+      // Start the next region after the contents of the comment.
       nonCommentStart = endLoc;
     }
   }
diff --git a/test/ModuleInterface/if-configs.swift b/test/ModuleInterface/if-configs.swift
@@ -128,13 +128,23 @@ public func hasIfCompilerCheck(_ x: () -> Bool = {
 }
 
 // CHECK: func hasComments
+// CHECK-NOT: #if NOT_PROVIDED
 // CHECK: print(
+// CHECK: "this should show up"
 // CHECK-NOT: comment! don't mess up indentation!
 // CHECK: {{^}}    """
 // CHECK: {{^}}    """
+// CHECK: #if compiler(>=5.3) {{$}}
+// CHECK: print( "")
+// CHECK: #endif
+// CHECK: let x = 1
+// CHECK-NEXT: let y = 2
+// CHECK: let a = 3
+// CHECK: let b = 2
 // CHECK-NOT: #if
 // CHECK-NOT: comment!
 // CHECK: return true
+@inlinable
 public func hasComments() -> Bool {
   /* comment! */ // comment!
   #if NOT_PROVIDED
@@ -151,6 +161,16 @@ public func hasComments() -> Bool {
     """
     """)
 
+  #if compiler(>=5.3) // comment!
+  print(/*comment!*/"")
+  #endif
+
+  let x = 1/*
+  */let y = 2
+
+  let a = 3
+  /* test */let b = 2
+
   #if !NOT_PROVIDED
     // comment!
     return/* comment! */true/* comment! */