plugins/header_rewrite/matcher.h (266 lines of code) (raw):

/* Licensed to the Apache Software Foundation (ASF) under one or more contributor license agreements. See the NOTICE file distributed with this work for additional information regarding copyright ownership. The ASF licenses this file to you under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ ////////////////////////////////////////////////////////////////////////////////////////////// // // Implement the classes for the various types of hash keys we support. // #pragma once #include <string> #include <sstream> #include <stdexcept> #include <type_traits> #include <variant> #include <set> #include "swoc/swoc_ip.h" #include "ts/ts.h" #include "resources.h" #include "regex_helper.h" #include "lulu.h" // Possible operators that we support (at least partially) enum MatcherOps { MATCH_EQUAL, MATCH_LESS_THEN, MATCH_GREATER_THEN, MATCH_REGULAR_EXPRESSION, MATCH_IP_RANGES, MATCH_SET, MATCH_ERROR, }; // Condition modifiers enum class CondModifiers : int { NONE = 0, OR = 1 << 0, AND = 1 << 1, NOT = 1 << 2, MOD_NOCASE = 1 << 3, MOD_L = 1 << 4, MOD_EXT = 1 << 5, MOD_PRE = 1 << 6, MOD_SUF = 1 << 7, MOD_MID = 1 << 8, // Essentially a substring }; inline CondModifiers operator|(CondModifiers a, const CondModifiers b) { using U = std::underlying_type_t<CondModifiers>; return static_cast<CondModifiers>(static_cast<U>(a) | static_cast<U>(b)); } inline CondModifiers operator&(CondModifiers a, const CondModifiers b) { using U = std::underlying_type_t<CondModifiers>; return static_cast<CondModifiers>(static_cast<U>(a) & static_cast<U>(b)); } inline CondModifiers & operator|=(CondModifiers &a, const CondModifiers b) { return a = a | b; } inline CondModifiers & operator&=(CondModifiers &a, const CondModifiers b) { return a = a & b; } inline bool has_modifier(const CondModifiers flags, const CondModifiers bit) { using U = std::underlying_type_t<CondModifiers>; return static_cast<U>(flags) & static_cast<U>(bit); } /////////////////////////////////////////////////////////////////////////////// // Base class for all Matchers (this is also the interface) // class Matcher { public: explicit Matcher(const MatcherOps op) : _op(op) { Dbg(dbg_ctl, "Calling CTOR for Matcher"); } virtual ~Matcher() { Dbg(dbg_ctl, "Calling DTOR for Matcher"); } // noncopyable Matcher(const Matcher &) = delete; void operator=(const Matcher &) = delete; MatcherOps op() const { return _op; } protected: const MatcherOps _op; }; // Template class to match on various types of data template <class T> class Matchers : public Matcher { public: explicit Matchers(const MatcherOps op) : Matcher(op), _data() {} void set(const T &d, CondModifiers mods) { _mods = mods; if constexpr (std::is_same_v<T, std::string>) { set(d, mods, [](const std::string &in) { return in; }); } else { std::get<T>(_data) = d; } } template <typename FN> void set(const std::string &s, CondModifiers mods, FN convert) { static_assert(std::is_same_v<decltype(convert(s)), T>, "Converter must return a value of type T"); _mods = mods; // MATCH_REGULAR_EXPRESSION (only valid for std::string) if constexpr (std::is_same_v<T, std::string>) { if (_op == MATCH_REGULAR_EXPRESSION) { _data.template emplace<regexHelper>(); auto &re = std::get<regexHelper>(_data); if (!re.setRegexMatch(s, has_modifier(mods, CondModifiers::MOD_NOCASE))) { TSError("[%s] Invalid regex: failed to precompile: %s", PLUGIN_NAME, s.c_str()); Dbg(pi_dbg_ctl, "Invalid regex: failed to precompile: %s", s.c_str()); throw std::runtime_error("Malformed regex"); } Dbg(pi_dbg_ctl, "Regex precompiled successfully"); return; } } // MATCH_IP_RANGES (only valid for const sockaddr *) if constexpr (std::is_same_v<T, const sockaddr *>) { if (_op == MATCH_IP_RANGES) { _data.template emplace<swoc::IPRangeSet>(); auto &ranges = std::get<swoc::IPRangeSet>(_data); std::istringstream stream(s); std::string part; size_t count = 0; while (std::getline(stream, part, ',')) { swoc::IPRange r; if (r.load(part)) { ranges.mark(r); ++count; } } if (count > 0) { Dbg(pi_dbg_ctl, "IP-range precompiled successfully with %zu entries", count); } else { TSError("[%s] Invalid IP-range: failed to parse: %s", PLUGIN_NAME, s.c_str()); Dbg(pi_dbg_ctl, "Invalid IP-range: failed to parse: %s", s.c_str()); throw std::runtime_error("Malformed IP-range"); } return; } else { TSReleaseAssert(false); // This should never happen } } // MATCH_SET (allowed for any T) if (_op == MATCH_SET) { _data.template emplace<std::set<T>>(); auto &values = std::get<std::set<T>>(_data); std::istringstream stream(s); std::string part; while (std::getline(stream, part, ',')) { values.insert(convert(part)); } if (!values.empty()) { Dbg(pi_dbg_ctl, " Added %zu set values while parsing", values.size()); } else { Dbg(pi_dbg_ctl, " No set values added, possibly bad input"); throw std::runtime_error("Empty sets not allowed"); } } else { // Default: single value _data.template emplace<T>(convert(s)); } } // Evaluate this matcher bool test(const T &t, const Resources &res) const { switch (_op) { case MATCH_EQUAL: return test_eq(t); break; case MATCH_LESS_THEN: return test_lt(t); break; case MATCH_GREATER_THEN: return test_gt(t); break; case MATCH_REGULAR_EXPRESSION: return test_reg(t, res); // Only the regex matcher needs the resource break; case MATCH_SET: return test_set(t); break; case MATCH_IP_RANGES: // This is an error, the Matcher doesn't make sense to match on IP ranges TSError("[%s] Invalid matcher: MATCH_IP_RANGES", PLUGIN_NAME); throw std::runtime_error("Can not match on IP ranges"); break; default: // ToDo: error break; } return false; } private: void debug_helper(const T &t, const char *op, bool r) const { std::stringstream ss; std::visit( [&](const auto &val) { using V = std::decay_t<decltype(val)>; if constexpr (std::is_same_v<V, T>) { ss << '"' << t << '"' << op << '"' << val << '"'; } else if constexpr (std::is_same_v<V, std::set<T>>) { ss << '"' << t << '"' << op << " set[" << val.size() << " entries]"; } else { ss << '"' << t << '"' << op << " type<" << typeid(V).name() << ">"; } }, _data); ss << " -> " << r; Dbg(pi_dbg_ctl, "\ttesting: %s", ss.str().c_str()); } // For basic types bool test_eq(const T &t) const { TSAssert(std::holds_alternative<T>(_data)); bool r = (t == std::get<T>(_data)); if (pi_dbg_ctl.on()) { debug_helper(t, " == ", r); } return r; } bool test_lt(const T &t) const { TSAssert(std::holds_alternative<T>(_data)); bool r = (t < std::get<T>(_data)); if (pi_dbg_ctl.on()) { debug_helper(t, " < ", r); } return r; } bool test_gt(const T &t) const { TSAssert(std::holds_alternative<T>(_data)); bool r = (t > std::get<T>(_data)); if (pi_dbg_ctl.on()) { debug_helper(t, " > ", r); } return r; } bool test_set(const T &c) const { TSAssert(std::holds_alternative<std::set<T>>(_data)); return std::get<std::set<T>>(_data).contains(c); } bool test_reg(const unsigned int /* t ATS_UNUSED */, const Resources & /* Not used */) const { // Not supported return false; } bool test_reg(const sockaddr * /* t ATS_UNUSED */, const Resources & /* Not used */) const { // Not supported return false; } bool test_reg(const std::string &t, const Resources &res) const { TSAssert(std::holds_alternative<regexHelper>(_data)); Dbg(pi_dbg_ctl, "Test regular expression against: %s (NOCASE = %s)", t.c_str(), has_modifier(_mods, CondModifiers::MOD_NOCASE) ? "true" : "false"); const auto &re = std::get<regexHelper>(_data); int count = re.regexMatch(t.c_str(), t.length(), const_cast<Resources &>(res).ovector); if (count > 0) { Dbg(pi_dbg_ctl, "Successfully found regular expression match"); const_cast<Resources &>(res).ovector_ptr = t.c_str(); const_cast<Resources &>(res).ovector_count = count; return true; } return false; } std::variant<T, std::set<T>, swoc::IPRangeSet, regexHelper> _data; CondModifiers _mods = CondModifiers::NONE; };