swiftlang
diff --git a/‎include/swift/Syntax/CMakeLists.txt
Lines changed: 1 addition & 0 deletions b/‎include/swift/Syntax/CMakeLists.txt
Lines changed: 1 addition & 0 deletions
diff --git a/‎include/swift/Syntax/SyntaxClassifier.h.gyb
Lines changed: 118 additions & 0 deletions b/‎include/swift/Syntax/SyntaxClassifier.h.gyb
Lines changed: 118 additions & 0 deletions
diff --git a/‎include/swift/Syntax/SyntaxVisitor.h.gyb
Lines changed: 1 addition & 1 deletion b/‎include/swift/Syntax/SyntaxVisitor.h.gyb
Lines changed: 1 addition & 1 deletion
diff --git a/‎lib/Syntax/CMakeLists.txt
Lines changed: 1 addition & 0 deletions b/‎lib/Syntax/CMakeLists.txt
Lines changed: 1 addition & 0 deletions
diff --git a/‎lib/Syntax/SyntaxClassifier.cpp.gyb
Lines changed: 159 additions & 0 deletions b/‎lib/Syntax/SyntaxClassifier.cpp.gyb
Lines changed: 159 additions & 0 deletions
@@ -8,6 +8,7 @@ set(generated_include_sources
     SyntaxKind.h.gyb
     SyntaxNodes.h.gyb
     SyntaxBuilders.h.gyb
+    SyntaxClassifier.h.gyb
     SyntaxFactory.h.gyb
     SyntaxVisitor.h.gyb
     Trivia.h.gyb)
 
@@ -0,0 +1,118 @@
+%{
+  # -*- mode: C++ -*-
+  from gyb_syntax_support import *
+  NODE_MAP = create_node_map()
+  # Ignore the following admonition; it applies to the resulting .h file only
+}%
+//// Automatically Generated From SyntaxClassifier.h.gyb.
+//// Do Not Edit Directly!
+//===----------- SyntaxClassifier.h - SyntaxClassifier definitions --------===//
+//
+// This source file is part of the Swift.org open source project
+//
+// Copyright (c) 2014 - 2018 Apple Inc. and the Swift project authors
+// Licensed under Apache License v2.0 with Runtime Library Exception
+//
+// See https://swift.org/LICENSE.txt for license information
+// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
+//
+//===----------------------------------------------------------------------===//
+
+#ifndef SWIFT_SYNTAX_CLASSIFIER_H
+#define SWIFT_SYNTAX_CLASSIFIER_H
+
+#include "swift/Syntax/SyntaxVisitor.h"
+#include <map>
+#include <stack>
+#include <utility>
+
+namespace swift {
+namespace syntax {
+
+
+/// A classification that determines which color a token should be colored in
+/// for syntax coloring.
+enum class SyntaxClassification {
+  /// No specific classification. Used for punctuation, operators and as the
+  /// initial context classification.
+  None,
+  /// Keywords, contextual keywords and plain #-keywords.
+  Keyword,
+  /// An identifier token that received no other classification.
+  Identifier,
+  /// A dollar identifier token.
+  DollarIdentifier,
+  /// An integer literal token.
+  IntegerLiteral,
+  /// A floating point literal token.
+  FloatingLiteral,
+  /// String literals, their quotes and segments, and unterminated strings.
+  StringLiteral,
+  /// Marks the parens for a string interpolation.
+  StringInterpolationAnchor,
+  /// NOTE(review): not produced by the context-free token classification;
+  /// presumably assigned through a node's child classification - confirm.
+  TypeIdentifier,
+  /// #if/#else/#endif occurrence.
+  BuildConfigKeyword,
+  /// An identifier in a #if condition.
+  BuildConfigId,
+  /// #-keywords like #warning, #sourceLocation
+  PoundDirectiveKeyword,
+  /// Any occurrence of '@<attribute-name>' anywhere.
+  Attribute,
+  /// An editor placeholder string <#like this#>.
+  EditorPlaceholder,
+  /// A #-keyword that introduces an object literal.
+  ObjectLiteral
+};
+
+
+/// A syntax visitor that walks a syntax tree and builds a table mapping the ID
+/// of every visited token to its \c SyntaxClassification.
+///
+/// While walking, a stack of classification contexts is maintained. The top
+/// entry supplies the classification for tokens that have no context-free
+/// classification of their own, or for all tokens if the entry forces it.
+class SyntaxClassifier: public SyntaxVisitor {
+  struct ContextStackEntry {
+    /// The classification all identifiers shall inherit
+    SyntaxClassification Classification;
+    /// If set to \c true, all tokens will be forced to receive the above
+    /// classification, overriding their context-free classification
+    bool ForceClassification;
+
+    ContextStackEntry(SyntaxClassification Classification,
+                      bool ForceClassification)
+      : Classification(Classification),
+        ForceClassification(ForceClassification) {}
+  };
+
+  /// The stack type used to track the classification contexts.
+  using ContextStackTy =
+      std::stack<ContextStackEntry, llvm::SmallVector<ContextStackEntry, 16>>;
+
+  /// The classifications collected so far, keyed by token ID
+  std::map<unsigned, SyntaxClassification> ClassifiedTokens;
+  /// The top classification of this stack determines the color of identifiers
+  ContextStackTy ContextStack;
+
+  /// Visits \p Node with a new context pushed for the duration of the visit.
+  template<typename T>
+  void visit(T Node, SyntaxClassification Classification,
+             bool ForceClassification) {
+    ContextStack.emplace(Classification, ForceClassification);
+    visit(Node);
+    ContextStack.pop();
+  }
+
+  /// Visits the wrapped node if \p OptNode holds one; does nothing otherwise.
+  template<typename T>
+  void visit(llvm::Optional<T> OptNode) {
+    if (OptNode.hasValue()) {
+      static_cast<SyntaxVisitor *>(this)->visit(OptNode.getValue());
+    }
+  }
+
+  /// Records the classification of a single token.
+  virtual void visit(TokenSyntax TokenNode) override;
+
+  /// Forwards generic nodes to the base visitor.
+  virtual void visit(Syntax Node) override {
+    SyntaxVisitor::visit(Node);
+  }
+
+% for node in SYNTAX_NODES:
+%   if is_visitable(node):
+  virtual void visit(${node.name} Node) override;
+%   end
+% end
+
+public:
+  /// Classifies all tokens reachable from \p Node.
+  ///
+  /// \returns a map from token ID to the classification of that token.
+  std::map<unsigned, SyntaxClassification> classify(Syntax Node) {
+    // Clean up the environment
+    ContextStack = ContextStackTy();
+    ContextStack.push({SyntaxClassification::None, false});
+    ClassifiedTokens.clear();
+
+    Node.accept(*this);
+
+    // Hand the table over to the caller instead of deep-copying it. The member
+    // is cleared afterwards so it is left in a well-defined (empty) state.
+    std::map<unsigned, SyntaxClassification> Result =
+        std::move(ClassifiedTokens);
+    ClassifiedTokens.clear();
+    return Result;
+  }
+};
+} // namespace syntax
+} // namespace swift
+
+#endif // SWIFT_SYNTAX_CLASSIFIER_H
@@ -42,7 +42,7 @@ struct SyntaxVisitor {
 
   virtual void visitPre(Syntax node) {}
   virtual void visitPost(Syntax node) {}
-  void visit(Syntax node);
+  virtual void visit(Syntax node);
 
   void visitChildren(Syntax node) {
     for (unsigned i = 0, e = node.getNumChildren(); i != e; ++i) {
 
@@ -14,5 +14,6 @@ add_swift_library(swiftSyntax STATIC
   RawSyntax.cpp
   Syntax.cpp
   SyntaxArena.cpp
+  SyntaxClassifier.cpp.gyb
   SyntaxData.cpp
   UnknownSyntax.cpp)
@@ -0,0 +1,159 @@
+%{
+  from gyb_syntax_support import *
+  # -*- mode: C++ -*-
+  # Ignore the following admonition; it applies to the resulting .cpp file only
+}%
+//// Automatically Generated From SyntaxClassifier.cpp.gyb.
+//// Do Not Edit Directly!
+//===----- SyntaxClassifier.cpp - Syntax Classifier implementations -------===//
+//
+// This source file is part of the Swift.org open source project
+//
+// Copyright (c) 2014 - 2018 Apple Inc. and the Swift project authors
+// Licensed under Apache License v2.0 with Runtime Library Exception
+//
+// See https://swift.org/LICENSE.txt for license information
+// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
+//
+//===----------------------------------------------------------------------===//
+//
+// This file defines the Syntax Classifier, which walks the syntax tree and
+// creates a classification table for all tokens in the syntax tree, mapping it
+// to a \c SyntaxClassification by its ID.
+//
+//===----------------------------------------------------------------------===//
+
+#include "swift/Basic/EditorPlaceholder.h"
+#include "swift/Syntax/SyntaxClassifier.h"
+
+using namespace swift;
+using namespace swift::syntax;
+
+// Per-node visit overrides, emitted once for every visitable node kind.
+// Unknown nodes and syntax collections are forwarded to SyntaxVisitor::visit.
+// For every other node, each child is visited; if the child's definition
+// carries a classification, that classification (and its force flag) is pushed
+// as context for the duration of the child's visit.
+% for node in SYNTAX_NODES:
+%   if is_visitable(node):
+void SyntaxClassifier::visit(${node.name} Node) {
+%     if node.is_unknown() or node.is_syntax_collection():
+  SyntaxVisitor::visit(Node);
+%     else:
+%       for child in node.children:
+%         if child.classification:
+  visit(Node.get${child.name}(), SyntaxClassification::${child.classification}, ${"true" if child.force_classification else "false"});
+%         else:
+  visit(Node.get${child.name}());
+%         end
+%       end
+%     end
+}
+%   end
+% end
+
+/// Returns the SyntaxClassification a token node should receive if it is not
+/// inside a special context. Returns \c None if the token has no context-free
+/// classification and should always inherit from the context.
+///
+/// \param TokenNode the token to classify; its kind and, for identifiers and
+///        unknown tokens, its text are inspected.
+llvm::Optional<SyntaxClassification>
+getContextFreeClassificationForToken(TokenSyntax TokenNode) {
+  switch (TokenNode.getTokenKind()) {
+#define KEYWORD(KW) case tok::kw_##KW: return SyntaxClassification::Keyword;
+#define POUND_KEYWORD(KW) case tok::pound_##KW: return SyntaxClassification::Keyword;
+#define POUND_OBJECT_LITERAL(KW, desc, proto) case tok::pound_##KW: return SyntaxClassification::ObjectLiteral;
+#define POUND_DIRECTIVE_KEYWORD(KW) case tok::pound_##KW: return SyntaxClassification::PoundDirectiveKeyword;
+#define POUND_COND_DIRECTIVE_KEYWORD(KW) case tok::pound_##KW: return SyntaxClassification::BuildConfigKeyword;
+#include "swift/Syntax/TokenKinds.def"
+  // Punctuators
+  case tok::l_paren:
+  case tok::r_paren:
+  case tok::l_brace:
+  case tok::r_brace:
+  case tok::l_square:
+  case tok::r_square:
+  case tok::l_angle:
+  case tok::r_angle:
+  case tok::period:
+  case tok::period_prefix:
+  case tok::comma:
+  case tok::colon:
+  case tok::semi:
+  case tok::equal:
+  case tok::pound:
+  case tok::amp_prefix:
+  case tok::arrow:
+  case tok::backtick:
+  case tok::backslash:
+  case tok::exclaim_postfix:
+  case tok::question_postfix:
+  case tok::question_infix:
+  case tok::sil_dollar:
+  case tok::sil_exclamation:
+    return SyntaxClassification::None;
+  case tok::string_quote:
+  case tok::multiline_string_quote:
+    return SyntaxClassification::StringLiteral;
+  case tok::at_sign:
+    return SyntaxClassification::Attribute;
+
+  // Literals
+  case tok::integer_literal:
+    return SyntaxClassification::IntegerLiteral;
+  case tok::floating_literal:
+    return SyntaxClassification::FloatingLiteral;
+  case tok::string_literal:
+    return SyntaxClassification::StringLiteral;
+
+  // Miscellaneous
+  case tok::identifier:
+    if (isEditorPlaceholder(TokenNode.getText()))
+      return SyntaxClassification::EditorPlaceholder;
+    // Ordinary identifiers have no context-free classification; they inherit
+    // whatever the surrounding context dictates.
+    return llvm::None;
+  case tok::unknown:
+    // An unknown token that opens with a double quote is an unterminated
+    // string literal
+    if (TokenNode.getText().startswith("\""))
+      return SyntaxClassification::StringLiteral;
+    return SyntaxClassification::None;
+  case tok::eof:
+  case tok::code_complete:
+  case tok::oper_binary_unspaced:
+  case tok::oper_binary_spaced:
+  case tok::oper_postfix:
+  case tok::oper_prefix:
+    return SyntaxClassification::None;
+  case tok::dollarident:
+    return SyntaxClassification::DollarIdentifier;
+  case tok::sil_local_name:
+    return SyntaxClassification::None;
+  case tok::comment:
+    llvm_unreachable("Comments should be in trivia");
+  case tok::contextual_keyword:
+    return SyntaxClassification::Keyword;
+  case tok::string_segment:
+    return SyntaxClassification::StringLiteral;
+  case tok::string_interpolation_anchor:
+    return SyntaxClassification::StringInterpolationAnchor;
+  case tok::NUM_TOKENS:
+    llvm_unreachable("NUM_TOKENS is not a valid token kind");
+  }
+  // Every enumerator is handled above; this keeps control from running off
+  // the end of the function if an out-of-range value is ever passed in.
+  llvm_unreachable("Unhandled token kind");
+}
+
+/// Records the classification for \p TokenNode under its ID.
+///
+/// The classification starts out as the one on top of the context stack.
+/// Unless that context forces its classification, a context-free
+/// classification of the token takes precedence, and an identifier that would
+/// otherwise end up as \c None is classified as \c Identifier.
+void SyntaxClassifier::visit(TokenSyntax TokenNode) {
+  const ContextStackEntry &Context = ContextStack.top();
+  SyntaxClassification Result = Context.Classification;
+
+  if (!Context.ForceClassification) {
+    // A context-free classification, when there is one, beats the inherited one
+    auto ContextFree = getContextFreeClassificationForToken(TokenNode);
+    if (ContextFree.hasValue())
+      Result = ContextFree.getValue();
+
+    // Identifiers that are still unclassified become plain identifiers
+    if (Result == SyntaxClassification::None &&
+        TokenNode.getTokenKind() == tok::identifier)
+      Result = SyntaxClassification::Identifier;
+  }
+
+  const auto TokenId = TokenNode.getId();
+  assert(ClassifiedTokens.count(TokenId) == 0 && "Token already classified");
+  ClassifiedTokens[TokenId] = Result;
+}