#include "str.h"
#include "rbl.h"
#include "policy_tokens.h"
+#include "resources.h"
+
+typedef struct strlist_local_t { /* One locally stored list attached to a filter configuration. */
+ char *filename; /* Key of the "strlist" resource held by this entry; left NULL when the entry holds no reference of its own. */
+ trie_t **db; /* Address of the trie slot inside the shared resource; dereferenced at lookup time. */
+ int weight; /* Added to the running score when the queried value matches. */
+ unsigned reverse :1; /* Look up the reversed copy of the queried value instead of the normal one. */
+ unsigned partial :1; /* Match with trie_prefix() rather than trie_lookup(). */
+} strlist_local_t;
+ARRAY(strlist_local_t)
+
+typedef struct strlist_resource_t { /* Tries built from one file, registered under the "strlist" resource namespace. */
+ off_t size; /* File size recorded when the tries were last built. */
+ time_t mtime; /* File modification time recorded when the tries were last built; an unchanged size and mtime skips the rebuild. */
+ trie_t *trie1; /* Entries of a plain list file, or the host entries of an rbldns zone file. */
+ trie_t *trie2; /* Wildcard ('*') domain entries of an rbldns zone file; the loaders test it against NULL to tell the two file kinds apart. */
+} strlist_resource_t;
typedef struct strlist_config_t {
- PA(trie_t) tries;
- A(int) weights;
- A(bool) reverses;
- A(bool) partiales;
+ A(strlist_local_t) locals;
A(char) hosts;
A(int) host_offsets;
unsigned match_reverse :1;
} strlist_config_t;
+typedef struct strlist_async_data_t { /* State kept in the filter context for a strlist filter run. */
+ A(rbl_result_t) results; /* Result slots handed to rhbl_check(), one per attempted DNS check. */
+ int awaited; /* Number of DNS checks started and not yet answered. */
+ uint32_t sum; /* Accumulated weight of the matches found so far. */
+ bool error; /* True until a local lookup runs, a DNS check is started, or a DNS answer other than RBL_ERROR arrives. */
+} strlist_async_data_t;
+
+static filter_type_t filter_type = FTK_UNKNOWN;
+
+
+/* Drop the "strlist" resource reference held by a list entry and free its
+ * filename. An entry without a filename holds no reference and is left
+ * untouched.
+ */
+static void strlist_local_wipe(strlist_local_t *entry)
+{
+    if (entry->filename == NULL) {
+        return;
+    }
+    resource_release("strlist", entry->filename);
+    p_delete(&entry->filename);
+}
+
+static void strlist_resource_wipe(strlist_resource_t *res) /* Destructor handed to resource_set() for "strlist" resources. */
+{
+ trie_delete(&res->trie1); /* Release both tries owned by the resource. */
+ trie_delete(&res->trie2);
+ p_delete(&res); /* Release the structure the loaders allocated with p_new(). */
+}
static strlist_config_t *strlist_config_new(void)
{
static void strlist_config_delete(strlist_config_t **config)
{
if (*config) {
- array_deep_wipe((*config)->tries, trie_delete);
- array_wipe((*config)->weights);
- array_wipe((*config)->reverses);
- array_wipe((*config)->partiales);
+ array_deep_wipe((*config)->locals, strlist_local_wipe);
array_wipe((*config)->hosts);
array_wipe((*config)->host_offsets);
array_wipe((*config)->host_weights);
}
-static trie_t *strlist_create(const char *file, bool reverse, bool lock)
+static bool strlist_create(strlist_local_t *local,
+ const char *file, int weight,
+ bool reverse, bool partial, bool lock)
{
- trie_t *db;
file_map_t map;
const char *p, *end;
char line[BUFSIZ];
+ uint32_t count = 0;
+ time_t now = time(0);
if (!file_map_open(&map, file, false)) {
- return NULL;
+ return false;
}
p = map.map;
end = map.end;
--end;
}
if (end != map.end) {
- warn("file %s miss a final \\n, ignoring last line",
- file);
+ warn("%s: final \\n missing, ignoring last line", file);
+ }
+
+ strlist_resource_t *res = resource_get("strlist", file);
+ if (res == NULL) {
+ res = p_new(strlist_resource_t, 1);
+ resource_set("strlist", file, res, (resource_destructor_t)strlist_resource_wipe);
+ } else if (res->trie2 != NULL) {
+ err("%s not loaded: the file is already used as a rbldns zone file", file);
+ resource_release("strlist", file);
+ file_map_close(&map);
+ return false;
+ }
+
+ p_clear(local, 1);
+ local->filename = m_strdup(file);
+ local->db = &res->trie1;
+ local->weight = weight;
+ local->reverse = reverse;
+ local->partial = partial;
+ if (res->size == map.st.st_size && res->mtime == map.st.st_mtime) {
+ info("%s loaded: already up-to-date", file);
+ file_map_close(&map);
+ return true;
}
+ trie_delete(&res->trie1);
+ res->trie1 = trie_new();
+ res->size = map.st.st_size;
+ res->mtime = map.st.st_mtime;
- db = trie_new();
while (p < end && p != NULL) {
const char *eol = (char *)memchr(p, '\n', end - p);
if (eol == NULL) {
eol = end;
}
if (eol - p >= BUFSIZ) {
- err("unreasonnable long line");
+ err("%s not loaded: unreasonnable long line", file);
file_map_close(&map);
- trie_delete(&db);
- return NULL;
+ trie_delete(&res->trie1);
+ strlist_local_wipe(local);
+ return false;
}
if (*p != '#') {
const char *eos = eol;
}
if (p < eos) {
strlist_copy(line, p, eos - p, reverse);
- trie_insert(db, line);
+ trie_insert(res->trie1, line);
+ ++count;
}
}
p = eol + 1;
}
file_map_close(&map);
- trie_compile(db, lock);
- return db;
+ trie_compile(res->trie1, lock);
+ info("%s loaded: done in %us, %u entries", file, (uint32_t)(time(0) - now), count);
+ return true;
}
-static bool strlist_create_from_rhbl(const char *file, bool lock,
- trie_t **phosts, trie_t **pdomains)
+static bool strlist_create_from_rhbl(strlist_local_t *hosts, strlist_local_t *domains,
+ const char *file, int weight, bool lock)
{
- trie_t *hosts, *domains;
uint32_t host_count, domain_count;
file_map_t map;
const char *p, *end;
char line[BUFSIZ];
+ time_t now = time(0);
if (!file_map_open(&map, file, false)) {
return false;
--end;
}
if (end != map.end) {
- warn("file %s miss a final \\n, ignoring last line",
- file);
+ warn("%s: final \\n missing, ignoring last line", file);
}
- hosts = trie_new();
+
+ strlist_resource_t *res = resource_get("strlist", file);
+ if (res == NULL) {
+ res = p_new(strlist_resource_t, 1);
+ resource_set("strlist", file, res, (resource_destructor_t)strlist_resource_wipe);
+ } else if (res->trie2 == NULL) {
+ err("%s not loaded: the file is already used as a strlist-file parameter", file);
+ resource_release("strlist", file);
+ file_map_close(&map);
+ return false;
+ }
+
+ p_clear(hosts, 1);
+ hosts->filename = m_strdup(file);
+ hosts->db = &res->trie1;
+ hosts->weight = weight;
+ hosts->reverse = true;
host_count = 0;
- domains = trie_new();
+
+ p_clear(domains, 1);
+ /* don't set filename */
+ domains->db = &res->trie2;
+ domains->weight = weight;
+ domains->reverse = true;
+ domains->partial = true;
domain_count = 0;
+
+ if (map.st.st_size == res->size && map.st.st_mtime == res->mtime) {
+ info("%s loaded: already up-to-date", file);
+ file_map_close(&map);
+ return true;
+ }
+
+ trie_delete(&res->trie1);
+ trie_delete(&res->trie2);
+ res->trie1 = trie_new();
+ res->trie2 = trie_new();
+ res->size = map.st.st_size;
+ res->mtime = map.st.st_mtime;
+
while (p < end && p != NULL) {
const char *eol = (char *)memchr(p, '\n', end - p);
if (eol == NULL) {
eol = end;
}
if (eol - p >= BUFSIZ) {
- err("unreasonnable long line");
+ err("%s not loaded: unreasonnable long line", file);
file_map_close(&map);
- trie_delete(&hosts);
- trie_delete(&domains);
+ trie_delete(&res->trie1);
+ trie_delete(&res->trie2);
+ strlist_local_wipe(hosts);
return false;
}
if (*p != '#') {
if (p < eos) {
if (isalnum(*p)) {
strlist_copy(line, p, eos - p, true);
- trie_insert(hosts, line);
+ trie_insert(res->trie1, line);
++host_count;
} else if (*p == '*') {
++p;
strlist_copy(line, p, eos - p, true);
- trie_insert(domains, line);
+ trie_insert(res->trie2, line);
++domain_count;
}
}
}
file_map_close(&map);
if (host_count > 0) {
- trie_compile(hosts, lock);
- *phosts = hosts;
+ trie_compile(res->trie1, lock);
} else {
- trie_delete(&hosts);
- *phosts = NULL;
+ trie_delete(&res->trie1);
}
if (domain_count > 0) {
- trie_compile(domains, lock);
- *pdomains = domains;
+ trie_compile(res->trie2, lock);
} else {
- trie_delete(&domains);
- *pdomains = NULL;
+ trie_delete(&res->trie2);
}
- return hosts != NULL || domains != NULL;
-
+ if (res->trie1 == NULL && res->trie2 == NULL) {
+ err("%s not loaded: no data found", file);
+ strlist_local_wipe(hosts);
+ return false;
+ }
+ info("%s loaded: done in %us, %u hosts, %u domains", file,
+ (uint32_t)(time(0) - now), host_count, domain_count);
+ return true;
}
int weight = 0;
bool reverse = false;
bool partial = false;
- trie_t *trie = NULL;
const char *current = param->value;
const char *p = m_strchrnul(param->value, ':');
char *next = NULL;
lock = false;
} else {
PARSE_CHECK(false, "illegal locking state %.*s",
- p - current, current);
+ (int)(p - current), current);
}
break;
reverse = false;
} else {
PARSE_CHECK(false, "illegal character order value %.*s",
- p - current, current);
+ (int)(p - current), current);
}
break;
weight = strtol(current, &next, 10);
PARSE_CHECK(next == p && weight >= 0 && weight <= 1024,
"illegal weight value %.*s",
- (p - current), current);
+ (int)(p - current), current);
break;
- case 3:
- trie = strlist_create(current, reverse, lock);
- PARSE_CHECK(trie != NULL,
+ case 3: {
+ strlist_local_t entry;
+ PARSE_CHECK(strlist_create(&entry, current, weight,
+ reverse, partial, lock),
"cannot load string list from %s", current);
- array_add(config->tries, trie);
- array_add(config->weights, weight);
- array_add(config->reverses, reverse);
- array_add(config->partiales, partial);
- break;
+ array_add(config->locals, entry);
+ } break;
}
if (i != 3) {
current = p + 1;
case ATK_RBLDNS: {
bool lock = false;
int weight = 0;
- trie_t *trie_hosts = NULL;
- trie_t *trie_domains = NULL;
const char *current = param->value;
const char *p = m_strchrnul(param->value, ':');
char *next = NULL;
lock = false;
} else {
PARSE_CHECK(false, "illegal locking state %.*s",
- p - current, current);
+ (int)(p - current), current);
}
break;
weight = strtol(current, &next, 10);
PARSE_CHECK(next == p && weight >= 0 && weight <= 1024,
"illegal weight value %.*s",
- (p - current), current);
+ (int)(p - current), current);
break;
- case 2:
- PARSE_CHECK(strlist_create_from_rhbl(current, lock,
- &trie_hosts, &trie_domains),
+ case 2: {
+ strlist_local_t trie_hosts, trie_domains;
+ PARSE_CHECK(strlist_create_from_rhbl(&trie_hosts, &trie_domains,
+ current, weight, lock),
"cannot load string list from rhbl %s", current);
- if (trie_hosts != NULL) {
- array_add(config->tries, trie_hosts);
- array_add(config->weights, weight);
- array_add(config->reverses, true);
- array_add(config->partiales, false);
+ if (trie_hosts.db != NULL) {
+ array_add(config->locals, trie_hosts);
}
- if (trie_domains != NULL) {
- array_add(config->tries, trie_domains);
- array_add(config->weights, weight);
- array_add(config->reverses, true);
- array_add(config->partiales, true);
+ if (trie_domains.db != NULL) {
+ array_add(config->locals, trie_domains);
}
config->is_hostname = true;
- break;
+ } break;
}
if (i != 2) {
current = p + 1;
weight = strtol(current, &next, 10);
PARSE_CHECK(next == p && weight >= 0 && weight <= 1024,
"illegal weight value %.*s",
- (p - current), current);
+ (int)(p - current), current);
break;
case 1:
CASE(RECIPIENT, recipient, email);
#undef CASE
default:
- PARSE_CHECK(false, "unknown field %.*s", p - current, current);
+ PARSE_CHECK(false, "unknown field %.*s", (int)(p - current), current);
break;
}
if (!*p) {
PARSE_CHECK(config->is_email != config->is_hostname,
"matched field MUST be emails XOR hostnames");
- PARSE_CHECK(config->tries.len || config->host_offsets.len,
+ PARSE_CHECK(config->locals.len || config->host_offsets.len,
"no file parameter in the filter %s", filter->name);
filter->data = config;
return true;
filter->data = config;
}
-static filter_result_t strlist_filter(const filter_t *filter, const query_t *query)
+/* Completion callback handed to rhbl_check() for each DNS check started by
+ * the strlist filter.
+ *
+ * result points at the slot of async->results that has just been filled and
+ * arg is the filter_context_t the check was started with. Every call
+ * decrements the count of awaited answers; once it reaches zero the weights
+ * of the RBL_FOUND answers are added to the score and the final result is
+ * posted with filter_post_async_result().
+ */
+static void strlist_filter_async(rbl_result_t *result, void *arg)
+{
+    filter_context_t *context = arg;
+    const filter_t *filter = context->current_filter;
+    const strlist_config_t *data = filter->data;
+    strlist_async_data_t *async = context->contexts[filter_type];
+
+    /* Any answer other than an error clears the error flag. */
+    if (*result != RBL_ERROR) {
+        async->error = false;
+    }
+    --async->awaited;
+
+    debug("got asynchronous request result for filter %s, rbl %d, still awaiting %d answers",
+          filter->name, (int)(result - array_ptr(async->results, 0)), async->awaited);
+
+    if (async->awaited == 0) {
+        filter_result_t res = HTK_FAIL;
+        if (async->error) {
+            res = HTK_ERROR;
+        } else {
+            /* j walks the result slots: one slot per enabled field and per
+             * configured host, in the order of the DO_SUM() calls below.
+             * NOTE(review): the launcher only advances its slot index for
+             * non-empty fields -- confirm both walks always agree.
+             */
+            uint32_t j = 0;
+#define DO_SUM(Field)                                                          \
+        if (data->match_ ## Field) {                                           \
+            for (uint32_t i = 0 ; i < array_len(data->host_offsets) ; ++i) {   \
+                int weight = array_elt(data->host_weights, i);                 \
+                                                                               \
+                switch (array_elt(async->results, j)) {                        \
+                  case RBL_ASYNC:                                              \
+                    crit("no more awaited answer but result is ASYNC");        \
+                    abort();                                                   \
+                  case RBL_FOUND:                                              \
+                    async->sum += weight;                                      \
+                    break;                                                     \
+                  default:                                                     \
+                    break;                                                     \
+                }                                                              \
+                ++j;                                                           \
+            }                                                                  \
+        }
+            DO_SUM(helo);
+            DO_SUM(client);
+            DO_SUM(reverse);
+            DO_SUM(recipient);
+            DO_SUM(sender);
+#undef DO_SUM
+            /* sum is a uint32_t: print it unsigned, as the loaders do. */
+            debug("score is %u", async->sum);
+            if (async->sum >= (uint32_t)data->hard_threshold) {
+                res = HTK_HARD_MATCH;
+            } else if (async->sum >= (uint32_t)data->soft_threshold) {
+                res = HTK_SOFT_MATCH;
+            }
+        }
+        debug("answering to filter %s", filter->name);
+        filter_post_async_result(context, res);
+    }
+}
+
+
+static filter_result_t strlist_filter(const filter_t *filter, const query_t *query,
+ filter_context_t *context)
{
char reverse[BUFSIZ];
char normal[BUFSIZ];
const strlist_config_t *config = filter->data;
- int sum = 0;
- bool error = true;
+ strlist_async_data_t *async = context->contexts[filter_type];
+ int result_pos = 0;
+ async->sum = 0;
+ async->error = true;
+ array_ensure_exact_capacity(async->results, (config->match_client
+ + config->match_sender + config->match_helo
+ + config->match_recipient + config->match_reverse)
+ * array_len(config->host_offsets));
+ async->awaited = 0;
if (config->is_email &&
const int len = m_strlen(query->Field); \
strlist_copy(normal, query->Field, len, false); \
strlist_copy(reverse, query->Field, len, true); \
- for (uint32_t i = 0 ; i < config->tries.len ; ++i) { \
- const int weight = array_elt(config->weights, i); \
- const trie_t *trie = array_elt(config->tries, i); \
- const bool rev = array_elt(config->reverses, i); \
- const bool part = array_elt(config->partiales, i); \
- if ((!part && trie_lookup(trie, rev ? reverse : normal)) \
- || (part && trie_prefix(trie, rev ? reverse : normal))) { \
- sum += weight; \
- if (sum >= config->hard_threshold) { \
+ foreach (strlist_local_t *entry, config->locals) { \
+ if ((!entry->partial && trie_lookup(*(entry->db), \
+ entry->reverse ? reverse : normal)) \
+ || (entry->partial && trie_prefix(*(entry->db), \
+ entry->reverse ? reverse : normal))) { \
+ async->sum += entry->weight; \
+ if (async->sum >= (uint32_t)config->hard_threshold) { \
return HTK_HARD_MATCH; \
} \
} \
- error = false; \
- } \
+ async->error = false; \
+ }} \
}
#define DNS(Flag, Field) \
if (config->match_ ## Flag) { \
const int len = m_strlen(query->Field); \
strlist_copy(normal, query->Field, len, false); \
for (uint32_t i = 0 ; len > 0 && i < config->host_offsets.len ; ++i) { \
- const char *rbl = array_ptr(config->hosts, \
- array_elt(config->host_offsets, i));\
- const int weight = array_elt(config->host_weights, i); \
- switch (rhbl_check(normal, rbl)) { \
- case RBL_FOUND: \
- error = false; \
- sum += weight; \
- if (sum >= config->hard_threshold) { \
- return HTK_HARD_MATCH; \
- } \
- break; \
- case RBL_NOTFOUND: \
- error = false; \
- break; \
- case RBL_ERROR: \
- warn("rbl %s unavailable", rbl); \
- break; \
+ const char *rbl = array_ptr(config->hosts, \
+ array_elt(config->host_offsets, i)); \
+ debug("running check of field %s (%s) against %s", STR(Field), \
+ normal, rbl); \
+ if (rhbl_check(rbl, normal, array_ptr(async->results, result_pos), \
+ strlist_filter_async, context)) { \
+ async->error = false; \
+ ++async->awaited; \
} \
+ ++result_pos; \
} \
}
}
#undef DNS
#undef LOOKUP
- if (error) {
+ if (async->awaited > 0) {
+ return HTK_ASYNC;
+ }
+ if (async->error) {
err("filter %s: all the rbls returned an error", filter->name);
return HTK_ERROR;
}
- if (sum >= config->hard_threshold) {
+ if (async->sum >= (uint32_t)config->hard_threshold) {
return HTK_HARD_MATCH;
- } else if (sum >= config->soft_threshold) {
+ } else if (async->sum >= (uint32_t)config->soft_threshold) {
return HTK_SOFT_MATCH;
} else {
return HTK_FAIL;
}
}
+/* Allocate the state object that the strlist filter keeps in each filter
+ * context.
+ */
+static void *strlist_context_constructor(void)
+{
+    strlist_async_data_t *state = p_new(strlist_async_data_t, 1);
+
+    return state;
+}
+
+/* Release a state object created by strlist_context_constructor(): first
+ * its result array, then the object itself.
+ */
+static void strlist_context_destructor(void *data)
+{
+    strlist_async_data_t *state = data;
+
+    array_wipe(state->results);
+    p_delete(&state);
+}
+
static int strlist_init(void)
{
- filter_type_t type = filter_register("strlist", strlist_filter_constructor,
- strlist_filter_destructor, strlist_filter);
+ filter_type = filter_register("strlist", strlist_filter_constructor,
+ strlist_filter_destructor, strlist_filter,
+ strlist_context_constructor,
+ strlist_context_destructor); /* The registered type is kept in the file-scope filter_type, which the filter and its callback use to index context->contexts. */
/* Hooks.
*/
- (void)filter_hook_register(type, "abort");
- (void)filter_hook_register(type, "error");
- (void)filter_hook_register(type, "fail");
- (void)filter_hook_register(type, "hard_match");
- (void)filter_hook_register(type, "soft_match");
+ (void)filter_hook_register(filter_type, "abort");
+ (void)filter_hook_register(filter_type, "error");
+ (void)filter_hook_register(filter_type, "fail");
+ (void)filter_hook_register(filter_type, "hard_match");
+ (void)filter_hook_register(filter_type, "soft_match");
/* Parameters.
*/
- (void)filter_param_register(type, "file");
- (void)filter_param_register(type, "rbldns");
- (void)filter_param_register(type, "dns");
- (void)filter_param_register(type, "hard_threshold");
- (void)filter_param_register(type, "soft_threshold");
- (void)filter_param_register(type, "fields");
+ (void)filter_param_register(filter_type, "file");
+ (void)filter_param_register(filter_type, "rbldns");
+ (void)filter_param_register(filter_type, "dns");
+ (void)filter_param_register(filter_type, "hard_threshold");
+ (void)filter_param_register(filter_type, "soft_threshold");
+ (void)filter_param_register(filter_type, "fields");
return 0;
}
module_init(strlist_init);