struct rspamd_map *map;
GPtrArray *regexps;
GPtrArray *values;
+ gboolean has_utf;
#ifdef WITH_HYPERSCAN
hs_database_t *hs_db;
hs_scratch_t *hs_scratch;
struct rspamd_map *map;
rspamd_regexp_t *re;
GError *err = NULL;
+ gint pcre_flags;
map = re_map->map;
re = rspamd_regexp_new (key, NULL, &err);
return;
}
+ pcre_flags = rspamd_regexp_get_pcre_flags (re);
+
+#ifndef WITH_PCRE2
+ if (pcre_flags & PCRE_FLAG(UTF8)) {
+ re_map->has_utf = TRUE;
+ }
+#else
+ if (pcre_flags & PCRE_FLAG(UTF)) {
+ re_map->has_utf = TRUE;
+ }
+#endif
+
g_ptr_array_add (re_map->regexps, re);
g_ptr_array_add (re_map->values, g_strdup (value));
}
rspamd_regexp_t *re;
gint res = 0;
gpointer ret = NULL;
+ gboolean validated = FALSE;
g_assert (in != NULL && len > 0);
return NULL;
}
+
+ if (map->has_utf) {
+ if (g_utf8_validate (in, len, NULL)) {
+ validated = TRUE;
+ }
+ }
+ else {
+ validated = TRUE;
+ }
+
#ifdef WITH_HYPERSCAN
if (map->hs_db && map->hs_scratch) {
- res = hs_scan (map->hs_db, in, len, 0, map->hs_scratch,
- rspamd_match_hs_single_handler, (void *)&i);
- if (res == HS_SCAN_TERMINATED) {
- res = 1;
- ret = g_ptr_array_index (map->values, i);
- }
+ if (validated) {
- return ret;
+ res = hs_scan (map->hs_db, in, len, 0, map->hs_scratch,
+ rspamd_match_hs_single_handler, (void *)&i);
+
+ if (res == HS_SCAN_TERMINATED) {
+ res = 1;
+ ret = g_ptr_array_index (map->values, i);
+ }
+
+ return ret;
+ }
}
#endif
for (i = 0; i < map->regexps->len; i ++) {
re = g_ptr_array_index (map->regexps, i);
- if (rspamd_regexp_search (re, in, len, NULL, NULL, FALSE, NULL)) {
+ if (rspamd_regexp_search (re, in, len, NULL, NULL, !validated, NULL)) {
ret = g_ptr_array_index (map->values, i);
break;
}