plugins/experimental/geoip_acl/acl.cc (244 lines of code) (raw):
/*
Licensed to the Apache Software Foundation (ASF) under one
or more contributor license agreements. See the NOTICE file
distributed with this work for additional information
regarding copyright ownership. The ASF licenses this file
to you under the Apache License, Version 2.0 (the
"License"); you may not use this file except in compliance
with the License. You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#include <arpa/inet.h>
#include <string>
#include <iostream>
#include <fstream>
#include "acl.h"
#include "lulu.h"
namespace geoip_acl_ns
{
DbgCtl dbg_ctl{PLUGIN_NAME};
}
// Implementation of the ACL base class. This wraps the underlying Geo library
// that we've found and used.
GeoDBHandle Acl::_geoip;
GeoDBHandle Acl::_geoip6;
// Maxmind v1 APIs
#if HAVE_GEOIP_H
bool
Acl::init()
{
Dbg(dbg_ctl, "initialized IPv4 GeoIP DB");
_geoip = GeoIP_new(GEOIP_MMAP_CACHE); // GEOIP_STANDARD seems to break threaded apps...
// Setup IPv6 if possible
if (GeoIP_db_avail(GEOIP_COUNTRY_EDITION_V6)) {
_geoip6 = GeoIP_open_type(GEOIP_COUNTRY_EDITION_V6, GEOIP_MMAP_CACHE | GEOIP_MEMORY_CACHE);
Dbg(dbg_ctl, "initialized IPv6 GeoIP DB");
}
return true;
}
int
Acl::country_id_by_code(const std::string &str) const
{
return GeoIP_id_by_code(str.c_str());
}
int
Acl::country_id_by_addr(const sockaddr *addr) const
{
int iso = -1;
int v = 4;
switch (addr->sa_family) {
case AF_INET: {
uint32_t ip = ntohl(reinterpret_cast<const struct sockaddr_in *>(addr)->sin_addr.s_addr);
iso = GeoIP_id_by_ipnum(_geoip, ip);
} break;
case AF_INET6: {
geoipv6_t ip = reinterpret_cast<const struct sockaddr_in6 *>(addr)->sin6_addr;
iso = GeoIP_id_by_ipnum_v6(_geoip6, ip);
v = 6;
} break;
default:
break;
}
Dbg(dbg_ctl, "eval(): Client IPv%d seems to come from ISO=%d", v, iso);
return iso;
}
#else /* !HAVE_GEOIP_H */
// No library available, nothing will work :)
bool
Acl::init()
{
Dbg(dbg_ctl, "No Geo library available!");
TSError("[%s] No Geo library available!", PLUGIN_NAME);
return false;
}
int
Acl::country_id_by_code(const std::string & /* str ATS_UNUSED */) const
{
return -1;
}
int
Acl::country_id_by_addr(const sockaddr * /* addr ATS_UNUSED */) const
{
return -1;
}
#endif /* HAVE_GEOIP_H */
// This is the rest of the ACL base class, which is the same for all underlying Geo libraries.
void
Acl::read_html(const char *fn)
{
std::ifstream f;
f.open(fn, std::ios::in);
if (f.is_open()) {
_html.append(std::istreambuf_iterator<char>(f), std::istreambuf_iterator<char>());
f.close();
Dbg(dbg_ctl, "Loaded HTML from %s", fn);
} else {
TSError("[%s] Unable to open HTML file %s", PLUGIN_NAME, fn);
}
}
// Implementations for the RegexAcl class
bool
RegexAcl::parse_line(const char *filename, const std::string &line, int lineno, int &tokens)
{
static const char _SEPARATOR[] = " \t\n";
std::string regex, tmp;
std::string::size_type pos1, pos2;
if (line.empty()) {
return false;
}
pos1 = line.find_first_not_of(_SEPARATOR);
if ((pos1 == std::string::npos) || (line[pos1] == '#')) {
return false;
}
pos2 = line.find_first_of(_SEPARATOR, pos1);
if (pos2 != std::string::npos) {
regex = line.substr(pos1, pos2 - pos1);
pos1 = line.find_first_not_of(_SEPARATOR, pos2);
if (pos1 != std::string::npos) {
pos2 = line.find_first_of(_SEPARATOR, pos1);
if (pos2 != std::string::npos) {
tmp = line.substr(pos1, pos2 - pos1);
if (tmp == "allow") {
_acl->set_allow(true);
} else if (tmp == "deny") {
_acl->set_allow(false);
} else {
TSError("[%s] Bad action on in %s:line %d: %s", PLUGIN_NAME, filename, lineno, tmp.c_str());
return false;
}
// The rest are "tokens"
while ((pos1 = line.find_first_not_of(_SEPARATOR, pos2)) != std::string::npos) {
pos2 = line.find_first_of(_SEPARATOR, pos1);
tmp = line.substr(pos1, pos2 - pos1);
_acl->add_token(tmp);
++tokens;
}
compile(regex, filename, lineno);
Dbg(dbg_ctl, "Added regex rule for /%s/", regex.c_str());
return true;
}
}
}
return false;
}
bool
RegexAcl::compile(const std::string &str, const char *filename, int lineno)
{
const char *error;
int erroffset;
_regex_s = str;
_rex = pcre_compile(_regex_s.c_str(), 0, &error, &erroffset, nullptr);
if (nullptr != _rex) {
_extra = pcre_study(_rex, 0, &error);
if ((nullptr == _extra) && error && (*error != 0)) {
TSError("[%s] Failed to study regular expression in %s:line %d at offset %d: %s", PLUGIN_NAME, filename, lineno, erroffset,
error);
return false;
}
} else {
TSError("[%s] Failed to compile regular expression in %s:line %d: %s", PLUGIN_NAME, filename, lineno, error);
return false;
}
return true;
}
void
RegexAcl::append(RegexAcl *ra)
{
if (nullptr == _next) {
_next = ra;
} else {
RegexAcl *cur = _next;
while (cur->_next) {
cur = cur->_next;
}
cur->_next = ra;
}
}
// Implementation of the Country ACL class.
void
CountryAcl::add_token(const std::string &str)
{
int iso = -1;
iso = country_id_by_code(str.c_str());
if (iso > 0 && iso < NUM_ISO_CODES) {
_iso_country_codes[iso] = true;
Dbg(dbg_ctl, "Added %s(%d) to remap rule, ACL=%s", str.c_str(), iso, _allow ? "allow" : "deny");
} else {
TSError("[%s] Tried setting an ISO code (%d) outside the supported range", PLUGIN_NAME, iso);
}
}
void
CountryAcl::read_regex(const char *fn, int &tokens)
{
std::ifstream f;
int lineno = 0;
f.open(fn, std::ios::in);
if (f.is_open()) {
std::string line;
RegexAcl *acl = nullptr;
while (!f.eof()) {
getline(f, line);
++lineno;
acl = new RegexAcl(new CountryAcl());
if (acl->parse_line(fn, line, lineno, tokens)) {
if (nullptr == _regexes) {
_regexes = acl;
} else {
_regexes->append(acl);
}
} else {
delete acl;
}
}
f.close();
Dbg(dbg_ctl, "Loaded regex rules from %s", fn);
} else {
TSError("[%s] Unable to open regex file %s", PLUGIN_NAME, fn);
}
}
bool
CountryAcl::eval(TSRemapRequestInfo *rri, TSHttpTxn txnp) const
{
bool ret = _allow;
Dbg(dbg_ctl, "CountryAcl::eval() called, default ACL is %s", ret ? "allow" : "deny");
// If there are regex rules, they take priority first. If a regex matches, we will
// honor it's eval() rule. If no regexes matches, fall back on the default (which is
// "allow" if nothing else is specified).
if (nullptr != _regexes) {
RegexAcl *acl = _regexes;
int path_len;
const char *path = TSUrlPathGet(rri->requestBufp, rri->requestUrl, &path_len);
do {
if (acl->match(path, path_len)) {
Dbg(dbg_ctl, "Path = %.*s matched /%s/", path_len, path, acl->get_regex().c_str());
return acl->eval(rri, txnp);
}
} while ((acl = acl->next()));
ret = !_allow; // Now we invert the default since no regexes matched
}
// None of the regexes (if any) matched, so fallback to the remap defaults if there are any.
int iso = country_id_by_addr(TSHttpTxnClientAddrGet(txnp));
if ((iso <= 0) || !_iso_country_codes[iso]) {
Dbg(dbg_ctl, "ISO not found in table, returning %d", !ret);
return !ret;
}
Dbg(dbg_ctl, "ISO was found in table, or -1, returning %d", ret);
return ret;
}
int
CountryAcl::process_args(int argc, char *argv[])
{
int tokens = 0;
for (int i = 3; i < argc; ++i) {
if (!strncmp(argv[i], "allow", 5)) {
set_allow(true);
} else if (!strncmp(argv[i], "deny", 4)) {
set_allow(false);
} else if (!strncmp(argv[i], "regex::", 7)) {
read_regex(argv[i] + 7, tokens);
} else if (!strncmp(argv[i], "html::", 6)) {
read_html(argv[i] + 6);
} else { // ISO codes assumed for the rest
add_token(argv[i]);
++tokens;
}
}
return tokens;
}