feat: Add attribute reference support. (#7)

kinyoklion · web-flow · commit 2203788c658c · 2023-03-27T14:12:28.000-07:00
diff --git a/libs/common/include/attribute_reference.hpp b/libs/common/include/attribute_reference.hpp
@@ -0,0 +1,107 @@
+#pragma once
+
+#include <ostream>
+#include <string>
+#include <vector>
+
+namespace launchdarkly {
+
+/**
+ *  Represents an attribute name or path expression identifying a value within a
+ * [TODO: Context]. This can be used to retrieve a value with [TODO: Get Value],
+ * or to identify an attribute or nested value that should be considered private
+ * with [TODO: private attribute] (the SDK configuration can also have a list of
+ * private attribute references).
+ *
+ *  This is represented as a separate type, rather than just a string, so that
+ * validation and parsing can be done ahead of time if an attribute reference
+ * will be used repeatedly later (such as in flag evaluations).
+ *
+ *  If the string starts with '/', then this is treated as a slash-delimited
+ * path reference where the first component is the name of an attribute, and
+ * subsequent components are the names of nested JSON object properties. In this
+ * syntax, the escape sequences "~0" and "~1" represent '~' and '/' respectively
+ * within a path component.
+ *
+ *  If the string does not start with '/', then it is treated as the literal
+ * name of an attribute.
+ */
+class AttributeReference {
+   public:
+    /**
+     * Get the component of the attribute reference at the specified depth.
+     *
+     * Depths are zero-based. For example, component(1) on the reference
+     * `/a/b/c` would return `b`.
+     *
+     * @param depth The depth to get a component for.
+     * @return The component at the specified depth or an empty string if the
+     * depth is out of bounds. The result refers to storage owned by this
+     * object (or to a shared empty string), so it must not be used after the
+     * AttributeReference is destroyed.
+     */
+    std::string const& component(size_t depth) const;
+
+    /**
+     * Get the total depth of the reference.
+     *
+     * For example, depth() on the reference `/a/b/c` would return 3. A
+     * reference string that failed to parse has a depth of 0.
+     *
+     * @return The number of components in the reference.
+     */
+    size_t depth() const;
+
+    /**
+     * Check if the reference is a "kind" reference. Either `/kind` or `kind`.
+     *
+     * @return True if it is a kind reference.
+     */
+    bool is_kind() const;
+
+    /**
+     * Check if the reference is valid.
+     *
+     * @return True if the reference is valid.
+     */
+    bool valid() const;
+
+    /**
+     * The redaction name will always be an attribute reference compatible
+     * string. So, for instance, a literal that starts with '/', such as
+     * `/attr`, would be converted to `/~1attr`. For a reference string the
+     * redaction name is the string exactly as it was provided.
+     *
+     * @return String to use in redacted attributes.
+     */
+    std::string const& redaction_name() const;
+
+    /**
+     * Create an attribute reference from a string that is known to be an
+     * attribute reference string.
+     *
+     * If the string cannot be parsed, the returned reference reports
+     * valid() == false and has no components.
+     *
+     * @param ref_str The reference string.
+     * @return A new AttributeReference based on the reference string.
+     */
+    static AttributeReference from_reference_str(std::string ref_str);
+
+    /**
+     * Create an attribute reference from a string that is known to be a
+     * literal attribute name.
+     *
+     * The string is not parsed as a path, so '/' and '~' have no special
+     * meaning within it. A literal that starts with '/' is escaped when the
+     * redaction name is produced.
+     *
+     * @param lit_str The literal attribute name.
+     * @return A new AttributeReference based on the literal name.
+     */
+    static AttributeReference from_literal_str(std::string lit_str);
+
+    /**
+     * Write a diagnostic representation of the reference to a stream, in the
+     * form `valid(<redaction name>)` or `invalid(<redaction name>)`.
+     *
+     * @param os The stream to write to.
+     * @param ref The reference to describe.
+     * @return The stream that was passed in.
+     */
+    friend std::ostream& operator<<(std::ostream& os,
+                                    AttributeReference const& ref) {
+        os << (ref.valid() ? "valid" : "invalid") << "(" << ref.redaction_name()
+           << ")";
+        return os;
+    }
+
+   private:
+    /**
+     * Construct from either a reference string or a literal name. Use the
+     * from_reference_str / from_literal_str factories instead of calling
+     * this directly.
+     *
+     * @param str The reference string or literal attribute name.
+     * @param is_literal True when `str` is a literal attribute name.
+     */
+    AttributeReference(std::string str, bool is_literal);
+
+    // Result reported by valid(). There is no in-class initializer, so the
+    // constructor is responsible for assigning this on every path.
+    bool valid_;
+
+    // String returned by redaction_name().
+    std::string redaction_name_;
+    // Unescaped path components, outermost first.
+    std::vector<std::string> components_;
+    // Shared value returned by component() for an out-of-bounds depth.
+    inline static const std::string empty_;
+};
+
+}  // namespace launchdarkly
diff --git a/libs/common/src/CMakeLists.txt b/libs/common/src/CMakeLists.txt
@@ -2,7 +2,7 @@
 file(GLOB HEADER_LIST CONFIGURE_DEPENDS "${LaunchDarklyCPPCommon_SOURCE_DIR}/include/*.hpp")
 
 # Automatic library: static or dynamic based on user config.
-add_library(${LIBNAME} logger.cpp ${HEADER_LIST} console_backend.cpp log_level.cpp ../include/console_backend.hpp)
+add_library(${LIBNAME} logger.cpp ${HEADER_LIST} console_backend.cpp log_level.cpp attribute_reference.cpp)
 
 add_library(launchdarkly::common ALIAS ${LIBNAME})
 
diff --git a/libs/common/src/attribute_reference.cpp b/libs/common/src/attribute_reference.cpp
@@ -0,0 +1,218 @@
+#include "attribute_reference.hpp"
+#include <utility>
+
+namespace launchdarkly {
+
+/** States of the state machine that parses an attribute reference string. */
+enum class ParseState {
+    kBegin,        /* start state; no character has been consumed yet */
+    kPlain,        /* inside a plain name (input did not start with '/') */
+    kTokenBegin,   /* just consumed a '/'; a component must follow */
+    kSearchingEnd, /* inside a component, looking for '/' or end of input */
+    kEscapeBegin,  /* just consumed a '~'; a '0' or '1' must follow */
+    kRefEnd        /* end state; parsing has finished or failed */
+};
+
+/** Actions the parser asks its caller to perform after each character. */
+enum class ParseEvent {
+    kNoop,         /* nothing to do for this character */
+    kChar,         /* append the input character to the current component */
+    kTilde,        /* append a '~' (decoded from the escape "~0") */
+    kForwardSlash, /* append a '/' (decoded from the escape "~1") */
+    kTokenEnd,     /* the current component is complete; more may follow */
+    kInputEnd,     /* input ended cleanly; the last component is complete */
+    kError         /* the input is not a valid reference */
+};
+
+/**
+ * Advance the attribute reference state machine by a single character.
+ *
+ * A reference such as "/foo/bar" is decoded into the components "foo" and
+ * "bar" by feeding it through this function one character at a time, followed
+ * by a terminating '\0'. The returned event tells the caller what to do with
+ * the character that was just consumed.
+ *
+ * @param state The state the parser is currently in.
+ * @param input The next character, or '\0' to signal the end of the input.
+ * @return The state to move to, paired with the event to act upon.
+ */
+std::pair<ParseState, ParseEvent> ParseChar(ParseState state, char input) {
+    using State = ParseState;
+    using Event = ParseEvent;
+
+    if (state == State::kBegin) {
+        // A leading '/' selects the path syntax; anything else is a plain
+        // attribute name. Empty input is an error.
+        if (input == '/') {
+            return {State::kTokenBegin, Event::kNoop};
+        }
+        if (input == '\0') {
+            return {State::kRefEnd, Event::kError};
+        }
+        return {State::kPlain, Event::kChar};
+    }
+
+    if (state == State::kPlain) {
+        // Plain names have no special characters; only the end matters.
+        if (input == '\0') {
+            return {State::kRefEnd, Event::kInputEnd};
+        }
+        return {State::kPlain, Event::kChar};
+    }
+
+    if (state == State::kTokenBegin) {
+        // A component may not be empty, so neither the end of the input nor
+        // another '/' may directly follow a '/'.
+        if (input == '\0' || input == '/') {
+            return {State::kRefEnd, Event::kError};
+        }
+        if (input == '~') {
+            return {State::kEscapeBegin, Event::kNoop};
+        }
+        return {State::kSearchingEnd, Event::kChar};
+    }
+
+    if (state == State::kSearchingEnd) {
+        if (input == '\0') {
+            return {State::kRefEnd, Event::kInputEnd};
+        }
+        if (input == '~') {
+            return {State::kEscapeBegin, Event::kNoop};
+        }
+        if (input == '/') {
+            return {State::kTokenBegin, Event::kTokenEnd};
+        }
+        return {State::kSearchingEnd, Event::kChar};
+    }
+
+    if (state == State::kEscapeBegin) {
+        // Only "~0" and "~1" are valid escape sequences.
+        if (input == '0') {
+            return {State::kSearchingEnd, Event::kTilde};
+        }
+        if (input == '1') {
+            return {State::kSearchingEnd, Event::kForwardSlash};
+        }
+        return {State::kRefEnd, Event::kError};
+    }
+
+    if (state == State::kRefEnd) {
+        // Once finished, further input is ignored.
+        return {State::kRefEnd, Event::kNoop};
+    }
+
+    // Should only happen if additional states are added but not handled.
+    return {State::kRefEnd, Event::kError};
+}
+
+/**
+ * Decode an attribute reference string into its components.
+ *
+ * The string is fed through ParseChar one character at a time, followed by a
+ * '\0' that marks the end of the input.
+ *
+ * NOTE(review): a '\0' embedded in `str` cannot be told apart from the end
+ * marker, so parsing stops at that position.
+ *
+ * @param str The reference string to decode.
+ * @param components Receives the decoded components. Components decoded
+ * before an error is detected are left in place, so the caller should discard
+ * the contents when false is returned.
+ * @return True if the string is a valid reference.
+ */
+bool ParseRef(std::string const& str, std::vector<std::string>& components) {
+    auto state = ParseState::kBegin;
+    std::string token;
+
+    // The loop runs one position past the end of the string so that the end
+    // marker is delivered to the state machine. The index uses the string's
+    // own unsigned size type to avoid a signed/unsigned comparison.
+    for (std::string::size_type index = 0; index <= str.size(); ++index) {
+        char const character = index < str.size() ? str[index] : '\0';
+        auto const [next_state, event] = ParseChar(state, character);
+        state = next_state;
+
+        switch (event) {
+            case ParseEvent::kNoop:
+                continue;
+            case ParseEvent::kChar:
+                token.push_back(character);
+                break;
+            case ParseEvent::kForwardSlash:
+                token.push_back('/');
+                break;
+            case ParseEvent::kTilde:
+                token.push_back('~');
+                break;
+            case ParseEvent::kTokenEnd:
+                components.push_back(std::move(token));
+                // Return the moved-from string to a known (empty) state
+                // before it is reused for the next component.
+                token.clear();
+                break;
+            case ParseEvent::kInputEnd:
+                components.push_back(std::move(token));
+                return true;
+            case ParseEvent::kError:
+                return false;
+        }
+    }
+    // Defensive: the end marker should always produce kInputEnd or kError.
+    return false;
+}
+
+/**
+ * Convert a literal attribute name into an attribute reference string.
+ *
+ * The result starts with '/', and every '~' and '/' in the literal is
+ * replaced by the escape sequence "~0" or "~1" respectively. This is needed
+ * for literals that start with '/', which would otherwise be read as a path.
+ *
+ * @param literal The literal attribute name.
+ * @return The equivalent attribute reference string.
+ */
+std::string EscapeLiteral(std::string const& literal) {
+    std::string result(1, '/');
+    for (char const ch : literal) {
+        switch (ch) {
+            case '~':
+                result += "~0";
+                break;
+            case '/':
+                result += "~1";
+                break;
+            default:
+                result += ch;
+                break;
+        }
+    }
+    return result;
+}
+
+/**
+ * Build a reference from either a literal attribute name or a reference
+ * string.
+ *
+ * @param str The literal attribute name or the reference string.
+ * @param literal True to use `str` verbatim as a single attribute name; false
+ * to parse it as a reference string.
+ */
+AttributeReference::AttributeReference(std::string str, bool literal) {
+    if (literal) {
+        // valid_ has no default initializer, so it must be assigned on this
+        // path as well; otherwise valid() reads an indeterminate value. An
+        // empty name is rejected, as an empty reference string is.
+        valid_ = !str.empty();
+        if (valid_) {
+            // A literal starting with a '/' needs to be converted to an
+            // attribute reference string, or it would later be read as a
+            // path.
+            redaction_name_ = str.front() == '/' ? EscapeLiteral(str) : str;
+            // The whole literal is a single component.
+            components_.push_back(std::move(str));
+        }
+    } else {
+        valid_ = ParseRef(str, components_);
+        if (!valid_) {
+            // Components decoded before the error was found are discarded.
+            components_.clear();
+        }
+        redaction_name_ = std::move(str);
+    }
+}
+
+// Factory for a reference whose input is a literal attribute name.
+AttributeReference AttributeReference::from_literal_str(std::string lit_str) {
+    return AttributeReference(std::move(lit_str), true);
+}
+
+// Factory for a reference whose input is an attribute reference string.
+AttributeReference AttributeReference::from_reference_str(std::string ref_str) {
+    return AttributeReference(std::move(ref_str), false);
+}
+
+// Returns the component at `depth`, or the shared empty string when `depth`
+// is past the last component.
+std::string const& AttributeReference::component(size_t depth) const {
+    if (depth >= components_.size()) {
+        return empty_;
+    }
+    return components_[depth];
+}
+
+// Returns the number of stored components.
+size_t AttributeReference::depth() const {
+    return components_.size();
+}
+
+// True when the reference consists of exactly one component named "kind".
+bool AttributeReference::is_kind() const {
+    if (components_.size() != 1) {
+        return false;
+    }
+    return components_.front() == "kind";
+}
+
+// Returns the validity flag stored in valid_.
+bool AttributeReference::valid() const {
+    return valid_;
+}
+
+// Returns the redaction name computed by the constructor.
+std::string const& AttributeReference::redaction_name() const {
+    return redaction_name_;
+}
+
+}  // namespace launchdarkly
diff --git a/libs/common/tests/attribute_reference_test.cpp b/libs/common/tests/attribute_reference_test.cpp