Merge pull request #3012 in SNORT/snort3 from ~MDAGON/snort3:normalized2 to master

author Tom Peters (thopeter) <thopeter@cisco.com>

Wed, 18 Aug 2021 18:14:00 +0000 (18:14 +0000)

committer Tom Peters (thopeter) <thopeter@cisco.com>

Wed, 18 Aug 2021 18:14:00 +0000 (18:14 +0000)
author Tom Peters (thopeter) <thopeter@cisco.com>
Wed, 18 Aug 2021 18:14:00 +0000 (18:14 +0000)
committer Tom Peters (thopeter) <thopeter@cisco.com>
Wed, 18 Aug 2021 18:14:00 +0000 (18:14 +0000)
diff --git a/doc/user/http_inspect.txt b/doc/user/http_inspect.txt

index fa316c2a04b15ff6bebdacf9f653b3ad9f2fd346..26687bff5ce9275a21859bd5eab03309ca286f80 100755 (executable)
--- a/doc/user/http_inspect.txt
+++ b/doc/user/http_inspect.txt
@@ -462,8 +462,8 @@ upper and lower case.
  With http_header the individual header value is normalized in a way that is
  appropriate for that header.
  
-Specifying an individual header is not available for http_raw_header and
-http_raw_header_complete.
+Specifying an individual header is not available for http_raw_header_complete; use
+http_raw_header instead.
  
  If you don't specify a header you get all of the headers. http_raw_header_complete
  includes cookie headers Cookie and Set-Cookie. http_header and http_raw_header don't.
diff --git a/src/service_inspectors/http_inspect/CMakeLists.txt b/src/service_inspectors/http_inspect/CMakeLists.txt

index 57c1d52db3862ecb1c75476151a7130f271d289f..d4972a0010e675aa9f695eb8f80e59439e794075 100644 (file)
--- a/src/service_inspectors/http_inspect/CMakeLists.txt
+++ b/src/service_inspectors/http_inspect/CMakeLists.txt
@@ -34,8 +34,8 @@ set (FILE_LIST
      http_param.h
      http_query_parser.cc
      http_query_parser.h
-    http_header_normalizer.cc
-    http_header_normalizer.h
+    http_normalized_header.cc
+    http_normalized_header.h
      http_uri.cc
      http_uri.h
      http_uri_norm.cc
diff --git a/src/service_inspectors/http_inspect/http_header_normalizer.cc b/src/service_inspectors/http_inspect/http_header_normalizer.cc

deleted file mode 100644 (file)

index 0067038..0000000
--- a/src/service_inspectors/http_inspect/http_header_normalizer.cc
+++ /dev/null
@@ -1,171 +0,0 @@
-//--------------------------------------------------------------------------
-// Copyright (C) 2014-2021 Cisco and/or its affiliates. All rights reserved.
-//
-// This program is free software; you can redistribute it and/or modify it
-// under the terms of the GNU General Public License Version 2 as published
-// by the Free Software Foundation.  You may not use, modify or distribute
-// this program under any other version of the GNU General Public License.
-//
-// This program is distributed in the hope that it will be useful, but
-// WITHOUT ANY WARRANTY; without even the implied warranty of
-// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
-// General Public License for more details.
-//
-// You should have received a copy of the GNU General Public License along
-// with this program; if not, write to the Free Software Foundation, Inc.,
-// 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
-//--------------------------------------------------------------------------
-// http_header_normalizer.cc author Tom Peters <thopeter@cisco.com>
-
-#ifdef HAVE_CONFIG_H
-#include "config.h"
-#endif
-
-#include "http_common.h"
-#include "http_enum.h"
-#include "http_header_normalizer.h"
-
-#include <cstring>
-
-using namespace HttpCommon;
-using namespace HttpEnums;
-
-// This derivation removes leading and trailing linear white space and replaces internal strings of
-// linear whitespace with a single <SP>
-static int32_t derive_header_content(const uint8_t* value, int32_t length, uint8_t* buffer,
-    bool alert_ws, HttpInfractions* infractions, HttpEventGen* events)
-{
-    int32_t out_length = 0;
-    bool beginning = true;
-    bool last_white = true;
-    for (int32_t k=0; k < length; k++)
-    {
-        if (!is_sp_tab_cr_lf[value[k]])
-        {
-            if (alert_ws && last_white && !beginning)
-            {
-                // white space which is not at beginning or end
-                *infractions += INF_BAD_HEADER_WHITESPACE;
-                events->create_event(EVENT_BAD_HEADER_WHITESPACE);
-            }
-            beginning = false;
-            last_white = false;
-            buffer[out_length++] = value[k];
-        }
-        else if (!last_white)
-        {
-            last_white = true;
-            buffer[out_length++] = ' ';
-        }
-    }
-    if ((out_length > 0) && (buffer[out_length - 1] == ' '))
-    {
-        out_length--;
-    }
-    return out_length;
-}
-
-// This method normalizes the header field value for headId.
-void HeaderNormalizer::normalize(const HeaderId head_id, const int count,
-    HttpInfractions* infractions, HttpEventGen* events, const HeaderId header_name_id[],
-    const Field header_value[], const int32_t num_headers, Field& result_field) const
-{
-    if (result_field.length() != STAT_NOT_COMPUTE)
-    {
-        return;
-    }
-
-    assert(count > 0);
-
-    // Search Header IDs from all the headers in this message. All repeated field values are
-    // concatenated into a comma-separated list.
-    // FIXIT-L Set-Cookie is a special case in the RFC because multiple Set-Cookie headers are
-    // widely used but comma-concatenation of cookies is incorrect. That would be a concern for us
-    // if we actually used the cookies. But since we just want a single value to show to the
-    // pattern matcher, concatenating is probably fine. In the future we may wish to revisit this
-    // issue. Specifically, semicolon-concatenation may be better.
-    int num_matches = 0;
-    int32_t buffer_length = 0;
-
-    // FIXIT-P initialization that serves no functional purpose to prevent compiler warning
-    int curr_match = -1;
-    for (int k=0; k < num_headers; k++)
-    {
-        if (header_name_id[k] == head_id)
-        {
-            if (++num_matches == 1)
-                curr_match = k;   // remembering location of the first matching header
-            buffer_length += header_value[k].length();
-            if (num_matches >= count)
-                break;
-        }
-    }
-    assert(num_matches == count);
-    buffer_length += num_matches - 1;    // allow space for concatenation commas
-
-    // We are allocating two buffers to store the normalized field value. The raw field value will
-    // be copied into one of them. Concatenation and white space normalization happen during this
-    // step. Next a series of normalization functions will transform the value into final form.
-    // Each normalization copies the value from one buffer to the other. Based on whether the
-    // number of normalization functions is odd or even, the initial buffer is chosen so that the
-    // final normalization leaves the normalized header value in norm_value.
-
-    uint8_t* const norm_value = new uint8_t[buffer_length];
-    uint8_t* const temp_space = new uint8_t[buffer_length];
-    uint8_t* const norm_start = (num_normalizers%2 == 0) ? norm_value : temp_space;
-    uint8_t* working = norm_start;
-    int32_t data_length = 0;
-    for (int j=0; j < num_matches; j++)
-    {
-        if (j >= 1)
-        {
-            *working++ = ',';
-            data_length++;
-            while (header_name_id[++curr_match] != head_id);
-        }
-        int32_t growth = derive_header_content(header_value[curr_match].start(),
-            header_value[curr_match].length(), working, alert_ws, infractions, events);
-        working += growth;
-        data_length += growth;
-    }
-
-    // Many fields names can appear more than once but some should not. If an event or infraction
-    // is defined we will check as part of normalization. A comma-separated header value is
-    // equivalent to a repeated header name. This is JIT code and we will not check for repeated
-    // headers unless someone asks for that header.
-    if ((repeat_event != EVENT__NONE) || (repeat_inf != INF__NONE))
-    {
-        if (count >= 2)
-        {
-            *infractions += repeat_inf;
-            events->create_event(repeat_event);
-        }
-        else
-        {
-            for (int k=0; k < data_length; k++)
-            {
-                if (norm_start[k] == ',')
-                {
-                    *infractions += repeat_inf;
-                    events->create_event(repeat_event);
-                    break;
-                }
-            }
-        }
-    }
-
-    for (int i=0; i < num_normalizers; i++)
-    {
-        if (i%2 != num_normalizers%2)
-        {
-            data_length = normalizer[i](temp_space, data_length, norm_value, infractions, events);
-        }
-        else
-        {
-            data_length = normalizer[i](norm_value, data_length, temp_space, infractions, events);
-        }
-    }
-    delete[] temp_space;
-    result_field.set(data_length, norm_value, true);
-}
-
diff --git a/src/service_inspectors/http_inspect/http_header_normalizer.h b/src/service_inspectors/http_inspect/http_header_normalizer.h

deleted file mode 100644 (file)

index 4ac2ab2..0000000
--- a/src/service_inspectors/http_inspect/http_header_normalizer.h
+++ /dev/null
@@ -1,62 +0,0 @@
-//--------------------------------------------------------------------------
-// Copyright (C) 2014-2021 Cisco and/or its affiliates. All rights reserved.
-//
-// This program is free software; you can redistribute it and/or modify it
-// under the terms of the GNU General Public License Version 2 as published
-// by the Free Software Foundation.  You may not use, modify or distribute
-// this program under any other version of the GNU General Public License.
-//
-// This program is distributed in the hope that it will be useful, but
-// WITHOUT ANY WARRANTY; without even the implied warranty of
-// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
-// General Public License for more details.
-//
-// You should have received a copy of the GNU General Public License along
-// with this program; if not, write to the Free Software Foundation, Inc.,
-// 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
-//--------------------------------------------------------------------------
-// http_header_normalizer.h author Tom Peters <thopeter@cisco.com>
-
-#ifndef HTTP_HEADER_NORMALIZER_H
-#define HTTP_HEADER_NORMALIZER_H
-
-#include "http_field.h"
-#include "http_normalizers.h"
-
-//-------------------------------------------------------------------------
-// HeaderNormalizer class
-// Strategies for normalizing HTTP header field values
-//-------------------------------------------------------------------------
-
-// Three normalization functions per HeaderNormalizer seems likely to be enough. Nothing subtle
-// will break if you choose to expand it to four or more. Just a whole bunch of signatures and
-// initializers to update. When defining a HeaderNormalizer don't leave holes in the normalizer
-// list. E.g. if you have two normalizers they must be first and second. If you do first and third
-// instead it won't explode but the third one won't be used either.
-
-class HeaderNormalizer
-{
-public:
-    constexpr HeaderNormalizer(HttpEnums::EventSid _repeat_event,
-        HttpEnums::Infraction _repeat_inf, bool _alert_ws,
-        NormFunc* f1, NormFunc* f2, NormFunc* f3)
-        : repeat_event(_repeat_event), repeat_inf(_repeat_inf), alert_ws(_alert_ws),
-        normalizer { f1, f2, f3 },
-        num_normalizers((f1 != nullptr) + (f1 != nullptr)*(f2 != nullptr) + (f1 != nullptr)*(f2 !=
-            nullptr)*(f3 != nullptr)) { }
-
-    void normalize(const HttpEnums::HeaderId head_id, const int count,
-        HttpInfractions* infractions, HttpEventGen* events,
-        const HttpEnums::HeaderId header_name_id[], const Field header_value[],
-        const int32_t num_headers, Field& result_field) const;
-
-private:
-    const HttpEnums::EventSid repeat_event;
-    const HttpEnums::Infraction repeat_inf;
-    const bool alert_ws;  // alert if white space in middle of value
-    NormFunc* const normalizer[3];
-    const int num_normalizers;
-};
-
-#endif
-
diff --git a/src/service_inspectors/http_inspect/http_msg_head_shared.cc b/src/service_inspectors/http_inspect/http_msg_head_shared.cc

index 45c18d5947aa6e2f95076223e93825496e32df3d..65293e50ebea9186086c7c35f32806a7590d71a5 100755 (executable)
--- a/src/service_inspectors/http_inspect/http_msg_head_shared.cc
+++ b/src/service_inspectors/http_inspect/http_msg_head_shared.cc
@@ -330,7 +330,7 @@ void HttpMsgHeadShared::derive_header_name_id(int index)
      delete[] lower_name;
  }
  
-HttpMsgHeadShared::NormalizedHeader* HttpMsgHeadShared::get_header_node(HeaderId header_id) const
+NormalizedHeader* HttpMsgHeadShared::get_header_node(HeaderId header_id) const
  {
      if (!headers_present[header_id])
          return nullptr;
@@ -424,15 +424,26 @@ const Field& HttpMsgHeadShared::get_header_value_raw(HeaderId header_id) const
      return Field::FIELD_NULL;
  }
  
+// Get the raw value(s) of header_id; FIELD_NULL if get_header_node() finds no node for it. If
+// the same header field appears more than once the values become a comma-separated list.
+const Field& HttpMsgHeadShared::get_all_header_values_raw(HeaderId header_id)
+{
+    NormalizedHeader* node = get_header_node(header_id);
+    if (node == nullptr)
+        return Field::FIELD_NULL;
+
+    return node->get_comma_separated_raw(*this, transaction->get_infractions(source_id),
+        session_data->events[source_id], header_name_id, header_value, num_headers);
+}
+
  const Field& HttpMsgHeadShared::get_header_value_norm(HeaderId header_id)
  {
      NormalizedHeader* node = get_header_node(header_id);
      if (node == nullptr)
          return Field::FIELD_NULL;
-    header_norms[header_id]->normalize(header_id, node->count,
-        transaction->get_infractions(source_id), session_data->events[source_id],
-        header_name_id, header_value, num_headers, node->norm);
-    return node->norm;
+    // The node produces the normalized value; this call supplies the message-wide inputs.
+    return node->get_norm(transaction->get_infractions(source_id),
+        session_data->events[source_id], header_name_id, header_value, num_headers);
  }
  
  // For downloads we use the hash of the URL if it exists. For uploads we use a hash of the filename
diff --git a/src/service_inspectors/http_inspect/http_msg_head_shared.h b/src/service_inspectors/http_inspect/http_msg_head_shared.h

index dcbc6e85cceb782df3529cdc2e60346786f9162f..f27502c0ad3a7cba1708ff69d31e0196d6f45ef7 100755 (executable)
--- a/src/service_inspectors/http_inspect/http_msg_head_shared.h
+++ b/src/service_inspectors/http_inspect/http_msg_head_shared.h
@@ -25,8 +25,8 @@
  #include "http_common.h"
  #include "http_enum.h"
  #include "http_field.h"
-#include "http_header_normalizer.h"
  #include "http_msg_section.h"
+#include "http_normalized_header.h"
  #include "http_str_to_code.h"
  
  //-------------------------------------------------------------------------
@@ -43,6 +43,7 @@ public:
      const Field& get_classic_norm_header();
      const Field& get_classic_norm_cookie();
      const Field& get_header_value_raw(HttpEnums::HeaderId header_id) const;
+    const Field& get_all_header_values_raw(HttpEnums::HeaderId header_id);
      const Field& get_header_value_norm(HttpEnums::HeaderId header_id);
      int get_header_count(HttpEnums::HeaderId header_id) const;
  
@@ -77,22 +78,6 @@ protected:
  private:
      static const int MAX = HttpEnums::HEAD__MAX_VALUE + HttpEnums::MAX_CUSTOM_HEADERS;
  
-    // Header normalization strategies. There should be one defined for every different way we can
-    // process a header field value.
-    static const HeaderNormalizer NORMALIZER_BASIC;
-    static const HeaderNormalizer NORMALIZER_HOST;
-    static const HeaderNormalizer NORMALIZER_CASE_INSENSITIVE;
-    static const HeaderNormalizer NORMALIZER_NUMBER;
-    static const HeaderNormalizer NORMALIZER_TOKEN_LIST;
-    static const HeaderNormalizer NORMALIZER_METHOD_LIST;
-    static const HeaderNormalizer NORMALIZER_DATE;
-    static const HeaderNormalizer NORMALIZER_URI;
-    static const HeaderNormalizer NORMALIZER_CONTENT_LENGTH;
-    static const HeaderNormalizer NORMALIZER_CHARSET;
-
-    // Master table of known header fields and their normalization strategies.
-    static const HeaderNormalizer* const header_norms[];
-
      // All of these are indexed by the relative position of the header field in the message
      static const int MAX_HEADERS = 200;  // I'm an arbitrary number. FIXIT-RC
      static const int MAX_HEADER_LENGTH = 4096; // Based on max cookie size of some browsers
@@ -111,16 +96,6 @@ private:
      HttpEnums::HeaderId* header_name_id = nullptr;
      Field* header_value = nullptr;
  
-    struct NormalizedHeader
-    {
-        NormalizedHeader(NormalizedHeader* next_, int32_t count_, HttpEnums::HeaderId id_) :
-            next(next_), count(count_), id(id_) {}
-
-        Field norm;
-        NormalizedHeader* next;
-        int32_t count;
-        const HttpEnums::HeaderId id;
-    };
      NormalizedHeader* get_header_node(HttpEnums::HeaderId k) const;
      NormalizedHeader* norm_heads = nullptr;
  
diff --git a/src/service_inspectors/http_inspect/http_msg_header.cc b/src/service_inspectors/http_inspect/http_msg_header.cc

index da3ae1c45e9b41ac3b2762c58ccc6aab6d2b9f3f..bc3549ea8a862326ea199335e797ffee06d4ba0f 100755 (executable)
--- a/src/service_inspectors/http_inspect/http_msg_header.cc
+++ b/src/service_inspectors/http_inspect/http_msg_header.cc
@@ -40,6 +40,7 @@
  #include "http_inspect.h"
  #include "http_msg_request.h"
  #include "http_msg_body.h"
+#include "http_normalizers.h"
  
  using namespace snort;
  using namespace HttpCommon;
diff --git a/src/service_inspectors/http_inspect/http_msg_section.cc b/src/service_inspectors/http_inspect/http_msg_section.cc

index 4eb99daa39182fb00dbd8f67c0580701cc9264a7..e31e5718b9096e9aa8b8c59fbdbb893a55dd33ff 100644 (file)
--- a/src/service_inspectors/http_inspect/http_msg_section.cc
+++ b/src/service_inspectors/http_inspect/http_msg_section.cc
@@ -185,7 +185,6 @@ const Field& HttpMsgSection::get_classic_buffer(Cursor& c, const HttpBufferInfo&
      case HTTP_BUFFER_HEADER:
      case HTTP_BUFFER_TRAILER:
        {
-        // FIXIT-L Someday want to be able to return field name or raw field value
          HttpMsgHeadShared* const head = (buf.type == HTTP_BUFFER_HEADER) ?
              (HttpMsgHeadShared*)header[buffer_side] : (HttpMsgHeadShared*)trailer[buffer_side];
          if (head == nullptr)
@@ -317,9 +316,15 @@ const Field& HttpMsgSection::get_classic_buffer(Cursor& c, const HttpBufferInfo&
          return (get_body() != nullptr) ? get_body()->msg_text : Field::FIELD_NULL;
        }
      case HTTP_BUFFER_RAW_HEADER:
+    case HTTP_BUFFER_RAW_TRAILER:
        {
-        return (header[buffer_side] != nullptr) ? header[buffer_side]->get_classic_raw_header() :
-            Field::FIELD_NULL;
+        HttpMsgHeadShared* const head = (buf.type == HTTP_BUFFER_RAW_HEADER) ?
+            (HttpMsgHeadShared*)header[buffer_side] : (HttpMsgHeadShared*)trailer[buffer_side];
+        if (head == nullptr)
+            return Field::FIELD_NULL;
+        if (buf.sub_id == 0)
+            return head->get_classic_raw_header();
+        return head->get_all_header_values_raw((HeaderId)buf.sub_id);
        }
      case HTTP_BUFFER_RAW_HEADER_COMPLETE:
        {
@@ -334,11 +339,6 @@ const Field& HttpMsgSection::get_classic_buffer(Cursor& c, const HttpBufferInfo&
        {
          return (status != nullptr) ? status->msg_text : Field::FIELD_NULL;
        }
-    case HTTP_BUFFER_RAW_TRAILER:
-      {
-        return (trailer[buffer_side] != nullptr) ? trailer[buffer_side]->get_classic_raw_header() :
-            Field::FIELD_NULL;
-      }
      case HTTP_BUFFER_STAT_CODE:
        {
          return (status != nullptr) ? status->get_status_code() : Field::FIELD_NULL;
diff --git a/src/service_inspectors/http_inspect/http_normalized_header.cc b/src/service_inspectors/http_inspect/http_normalized_header.cc

new file mode 100644 (file)

index 0000000..c6c4aa0
--- /dev/null
+++ b/src/service_inspectors/http_inspect/http_normalized_header.cc
@@ -0,0 +1,364 @@
+//--------------------------------------------------------------------------
+// Copyright (C) 2014-2021 Cisco and/or its affiliates. All rights reserved.
+//
+// This program is free software; you can redistribute it and/or modify it
+// under the terms of the GNU General Public License Version 2 as published
+// by the Free Software Foundation.  You may not use, modify or distribute
+// this program under any other version of the GNU General Public License.
+//
+// This program is distributed in the hope that it will be useful, but
+// WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+// General Public License for more details.
+//
+// You should have received a copy of the GNU General Public License along
+// with this program; if not, write to the Free Software Foundation, Inc.,
+// 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
+//--------------------------------------------------------------------------
+// http_normalized_header.cc author Tom Peters <thopeter@cisco.com>
+
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif
+
+#include "http_normalized_header.h"
+
+#include "http_common.h"
+#include "http_enum.h"
+#include "http_msg_head_shared.h"
+#include "http_normalizers.h"
+
+#include <cstring>
+
+using namespace HttpCommon;
+using namespace HttpEnums;
+
+//-------------------------------------------------------------------------
+// HeaderNormalizer class
+// Strategies for normalizing HTTP header field values
+//-------------------------------------------------------------------------
+
+// A strategy holds up to three normalization functions. Three seems likely to be enough; nothing
+// subtle will break if you expand it to four or more, there is just a whole bunch of signatures
+// and initializers to update. Don't leave holes in the normalizer list: num_normalizers counts
+// only the leading non-null entries, so two normalizers must be first and second. If you do
+// first and third instead it won't explode but the third one won't be used either.
+
+class NormalizedHeader::HeaderNormalizer
+{
+public:
+    constexpr HeaderNormalizer(HttpEnums::EventSid _repeat_event,
+        HttpEnums::Infraction _repeat_inf, bool _alert_ws,
+        NormFunc* f1, NormFunc* f2, NormFunc* f3)
+        : repeat_event(_repeat_event), repeat_inf(_repeat_inf), alert_ws(_alert_ws),
+        normalizer { f1, f2, f3 },
+        num_normalizers((f1 != nullptr) + (f1 != nullptr)*(f2 != nullptr) + (f1 != nullptr)*(f2 !=
+            nullptr)*(f3 != nullptr)) { }   // 0-3: stops counting at the first null
+
+    void normalize(const HttpEnums::HeaderId head_id, const int count,
+        HttpInfractions* infractions, HttpEventGen* events,
+        const HttpEnums::HeaderId header_name_id[], const Field header_value[],
+        const int32_t num_headers, Field& result_field, Field& comma_separated_raw) const;
+
+private:
+    const HttpEnums::EventSid repeat_event;   // with repeat_inf: gates the repeated-header check
+    const HttpEnums::Infraction repeat_inf;
+    const bool alert_ws;  // alert if white space in middle of value
+    NormFunc* const normalizer[3];            // f1, f2, f3 in constructor order
+    const int num_normalizers;                // leading non-null entries in normalizer
+};
+// Strategy instances. Initializer order: repeat_event, repeat_inf, alert_ws, f1, f2, f3.
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_BASIC
+    { EVENT__NONE, INF__NONE, false, nullptr, nullptr, nullptr };
+
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_HOST
+    { EVENT_MULTIPLE_HOST_HDRS, INF_MULTIPLE_HOST_HDRS, false, nullptr, nullptr, nullptr };
+
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_CASE_INSENSITIVE
+    { EVENT__NONE, INF__NONE, false, norm_to_lower, nullptr, nullptr };
+
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_NUMBER
+    { EVENT_REPEATED_HEADER, INF_REPEATED_HEADER, false, norm_remove_lws, nullptr, nullptr };
+
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_TOKEN_LIST
+    { EVENT__NONE, INF__NONE, false, norm_remove_lws, norm_to_lower, nullptr };
+
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_METHOD_LIST
+    { EVENT__NONE, INF__NONE, false, norm_remove_lws, nullptr, nullptr };
+
+// FIXIT-L implement a date normalization function that converts the three legal formats into a
+// single standard format. For now we do nothing special for dates. This object is a placeholder
+// to keep track of which headers have date values.
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_DATE
+    { EVENT__NONE, INF__NONE, false, nullptr, nullptr, nullptr };
+
+// FIXIT-M implement a URI normalization function, probably by extending existing URI capabilities
+// to cover relative formats
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_URI
+    { EVENT__NONE, INF__NONE, false, nullptr, nullptr, nullptr };
+
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_CONTENT_LENGTH
+    { EVENT_MULTIPLE_CONTLEN, INF_MULTIPLE_CONTLEN, true, norm_remove_lws, nullptr, nullptr };
+
+const NormalizedHeader::HeaderNormalizer NormalizedHeader::NORMALIZER_CHARSET
+    { EVENT__NONE, INF__NONE, false, norm_remove_quotes_lws, norm_to_lower, nullptr };
+
+const NormalizedHeader::HeaderNormalizer* const NormalizedHeader::header_norms[HEAD__MAX_VALUE + MAX_CUSTOM_HEADERS + 1] = {
+    &NORMALIZER_BASIC,      // 0 (slots presumably follow HeaderId numbering, per the labels below)
+    &NORMALIZER_BASIC,      // HEAD__OTHER
+    &NORMALIZER_TOKEN_LIST, // HEAD_CACHE_CONTROL
+    &NORMALIZER_TOKEN_LIST, // HEAD_CONNECTION
+    &NORMALIZER_DATE,       // HEAD_DATE
+    &NORMALIZER_TOKEN_LIST, // HEAD_PRAGMA
+    &NORMALIZER_TOKEN_LIST, // HEAD_TRAILER
+    &NORMALIZER_BASIC,      // HEAD_COOKIE
+    &NORMALIZER_BASIC,      // HEAD_SET_COOKIE
+    &NORMALIZER_TOKEN_LIST, // HEAD_TRANSFER_ENCODING
+    &NORMALIZER_TOKEN_LIST, // HEAD_UPGRADE
+    &NORMALIZER_BASIC,      // HEAD_VIA
+    &NORMALIZER_BASIC,      // HEAD_WARNING
+    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT
+    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_CHARSET
+    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_ENCODING
+    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_LANGUAGE
+    &NORMALIZER_BASIC,      // HEAD_AUTHORIZATION
+    &NORMALIZER_CASE_INSENSITIVE, // HEAD_EXPECT
+    &NORMALIZER_BASIC,      // HEAD_FROM
+    &NORMALIZER_HOST,       // HEAD_HOST
+    &NORMALIZER_BASIC,      // HEAD_IF_MATCH
+    &NORMALIZER_DATE,       // HEAD_IF_MODIFIED_SINCE
+    &NORMALIZER_BASIC,      // HEAD_IF_NONE_MATCH
+    &NORMALIZER_BASIC,      // HEAD_IF_RANGE
+    &NORMALIZER_DATE,       // HEAD_IF_UNMODIFIED_SINCE
+    &NORMALIZER_BASIC,      // HEAD_MAX_FORWARDS
+    &NORMALIZER_BASIC,      // HEAD_PROXY_AUTHORIZATION
+    &NORMALIZER_BASIC,      // HEAD_RANGE
+    &NORMALIZER_URI,        // HEAD_REFERER
+    &NORMALIZER_TOKEN_LIST, // HEAD_TE
+    &NORMALIZER_BASIC,      // HEAD_USER_AGENT
+    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_RANGES
+    &NORMALIZER_NUMBER,     // HEAD_AGE
+    &NORMALIZER_BASIC,      // HEAD_ETAG
+    &NORMALIZER_URI,        // HEAD_LOCATION
+    &NORMALIZER_BASIC,      // HEAD_PROXY_AUTHENTICATE
+    &NORMALIZER_BASIC,      // HEAD_RETRY_AFTER, may be date or number
+    &NORMALIZER_BASIC,      // HEAD_SERVER
+    &NORMALIZER_TOKEN_LIST, // HEAD_VARY
+    &NORMALIZER_BASIC,      // HEAD_WWW_AUTHENTICATE
+    &NORMALIZER_METHOD_LIST, // HEAD_ALLOW
+    &NORMALIZER_TOKEN_LIST, // HEAD_CONTENT_ENCODING
+    &NORMALIZER_TOKEN_LIST, // HEAD_CONTENT_LANGUAGE
+    &NORMALIZER_CONTENT_LENGTH, // HEAD_CONTENT_LENGTH
+    &NORMALIZER_URI,        // HEAD_CONTENT_LOCATION
+    &NORMALIZER_BASIC,      // HEAD_CONTENT_MD5
+    &NORMALIZER_BASIC,      // HEAD_CONTENT_RANGE
+    &NORMALIZER_CHARSET,    // HEAD_CONTENT_TYPE
+    &NORMALIZER_DATE,       // HEAD_EXPIRES
+    &NORMALIZER_DATE,       // HEAD_LAST_MODIFIED
+    &NORMALIZER_BASIC,      // HEAD_X_FORWARDED_FOR
+    &NORMALIZER_BASIC,      // HEAD_TRUE_CLIENT_IP
+    &NORMALIZER_BASIC,      // HEAD_X_WORKING_WITH
+    &NORMALIZER_TOKEN_LIST, // HEAD_CONTENT_TRANSFER_ENCODING
+    &NORMALIZER_BASIC,      // HEAD_MIME_VERSION
+    &NORMALIZER_BASIC,      // HEAD_PROXY_AGENT
+    &NORMALIZER_BASIC,      // HEAD_CONTENT_DISPOSITION
+    &NORMALIZER_TOKEN_LIST, // HEAD_HTTP2_SETTINGS
+    &NORMALIZER_BASIC,      // HEAD__MAX_VALUE
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
+};
+
+// Copies value[0..length) into buffer with leading and trailing linear white space removed and
+// each internal run of it replaced by a single <SP>. Returns the output length (at most length).
+static int32_t derive_header_content(const uint8_t* value, int32_t length, uint8_t* buffer,
+    bool alert_ws, HttpInfractions* infractions, HttpEventGen* events)
+{
+    int32_t out_length = 0;
+    bool beginning = true;    // no non-white octet copied yet
+    bool last_white = true;   // starts true so leading white space is dropped
+    for (int32_t k=0; k < length; k++)
+    {
+        if (!is_sp_tab_cr_lf[value[k]])
+        {
+            if (alert_ws && last_white && !beginning)
+            {
+                // white space which is not at beginning or end
+                *infractions += INF_BAD_HEADER_WHITESPACE;
+                events->create_event(EVENT_BAD_HEADER_WHITESPACE);
+            }
+            beginning = false;
+            last_white = false;
+            buffer[out_length++] = value[k];
+        }
+        else if (!last_white)
+        {
+            last_white = true;
+            buffer[out_length++] = ' ';   // first white octet of a run; the rest are skipped
+        }
+    }
+    if ((out_length > 0) && (buffer[out_length - 1] == ' '))
+    {
+        out_length--;   // the value ended in white space; drop the <SP> emitted for it
+    }
+    return out_length;
+}
+
+/* Builds the normalized value of header head_id for one message and stores it in result_field.
+ *
+ * header_name_id[] and header_value[] are parallel arrays with num_headers entries. The first
+ * count entries whose id equals head_id contribute their values, in message order; repeated
+ * headers are joined with commas. count must be positive and no larger than the number of
+ * matching entries present. Both conditions are checked only by assert, and the second pass
+ * walks header_name_id[] without a bounds check, so a wrong count is unsafe in builds where
+ * asserts are compiled out.
+ *
+ * When count > 1 the untouched raw values are also joined with commas and stored in
+ * comma_separated_raw; when count == 1 that field is left alone.
+ *
+ * infractions and events are handed to derive_header_content() and to each normalizer function,
+ * and receive repeat_inf / repeat_event when this strategy flags repeated values.
+ *
+ * NOTE(review): the final 'true' passed to Field::set() presumably hands ownership of the buffer
+ * to the Field (neither norm_value nor combined_raw is freed here) - confirm in http_field.h.
+ */
+void NormalizedHeader::HeaderNormalizer::normalize(const HeaderId head_id, const int count,
+    HttpInfractions* infractions, HttpEventGen* events, const HeaderId header_name_id[],
+    const Field header_value[], const int32_t num_headers, Field& result_field,
+    Field& comma_separated_raw) const
+{
+    assert(count > 0);
+
+    // Search Header IDs from all the headers in this message. All repeated field values are
+    // concatenated into a comma-separated list.
+    // FIXIT-L Set-Cookie is a special case in the RFC because multiple Set-Cookie headers are
+    // widely used but comma-concatenation of cookies is incorrect. That would be a concern for us
+    // if we actually used the cookies. But since we just want a single value to show to the
+    // pattern matcher, concatenating is probably fine. In the future we may wish to revisit this
+    // issue. Specifically, semicolon-concatenation may be better.
+    int num_matches = 0;
+    int32_t buffer_length = 0;
+
+    // FIXIT-P initialization that serves no functional purpose to prevent compiler warning
+    int curr_match = -1;
+    for (int k=0; k < num_headers; k++)
+    {
+        if (header_name_id[k] == head_id)
+        {
+            if (++num_matches == 1)
+                curr_match = k;   // remembering location of the first matching header
+            buffer_length += header_value[k].length();
+            if (num_matches >= count)   // every requested instance found, stop scanning
+                break;
+        }
+    }
+    assert(num_matches == count);
+    buffer_length += num_matches - 1;    // allow space for concatenation commas
+
+    // We are allocating two buffers to store the normalized field value. The raw field value will
+    // be copied into one of them. Concatenation and white space normalization happen during this
+    // step. Next a series of normalization functions will transform the value into final form.
+    // Each normalization copies the value from one buffer to the other. Based on whether the
+    // number of normalization functions is odd or even, the initial buffer is chosen so that the
+    // final normalization leaves the normalized header value in norm_value.
+
+    uint8_t* const norm_value = new uint8_t[buffer_length];
+    uint8_t* const temp_space = new uint8_t[buffer_length];
+    uint8_t* const norm_start = (num_normalizers%2 == 0) ? norm_value : temp_space;
+    uint8_t* working = norm_start;
+    int32_t data_length = 0;
+    const bool create_combined_raw = (count > 1);   // only repeated headers get a joined raw copy
+    uint8_t* const combined_raw = (create_combined_raw) ? new uint8_t[buffer_length] : nullptr;
+    uint8_t* working_raw = combined_raw;
+    for (int j=0; j < num_matches; j++)
+    {
+        if (j >= 1)
+        {
+            *working++ = ',';
+            if (create_combined_raw)
+                *working_raw++ = ',';
+            data_length++;
+            while (header_name_id[++curr_match] != head_id);   // next match; no bounds check
+        }
+        const int32_t growth = derive_header_content(header_value[curr_match].start(),
+            header_value[curr_match].length(), working, alert_ws, infractions, events);
+        working += growth;
+        data_length += growth;
+
+        if (create_combined_raw)
+        {
+            memcpy(working_raw, header_value[curr_match].start(),
+                header_value[curr_match].length());
+            working_raw += header_value[curr_match].length();
+        }
+    }
+
+    if (create_combined_raw)
+    {
+        assert((working_raw - combined_raw) == buffer_length);   // raw copy fills buffer exactly
+        comma_separated_raw.set(buffer_length, combined_raw, true);
+    }
+
+    // Many field names can appear more than once but some should not. If an event or infraction
+    // is defined we will check as part of normalization. A comma-separated header value is
+    // equivalent to a repeated header name. This is JIT code and we will not check for repeated
+    // headers unless someone asks for that header.
+    if ((repeat_event != EVENT__NONE) || (repeat_inf != INF__NONE))
+    {
+        if (count >= 2)
+        {
+            *infractions += repeat_inf;
+            events->create_event(repeat_event);
+        }
+        else
+        {
+            for (int k=0; k < data_length; k++)
+            {
+                if (norm_start[k] == ',')   // comma inside the value of a single header
+                {
+                    *infractions += repeat_inf;
+                    events->create_event(repeat_event);
+                    break;
+                }
+            }
+        }
+    }
+
+    for (int i=0; i < num_normalizers; i++)   // each step copies from one buffer to the other
+    {
+        if (i%2 != num_normalizers%2)   // current value is in temp_space
+        {
+            data_length = normalizer[i](temp_space, data_length, norm_value, infractions, events);
+        }
+        else                            // current value is in norm_value
+        {
+            data_length = normalizer[i](norm_value, data_length, temp_space, infractions, events);
+        }
+    }
+    delete[] temp_space;   // scratch only; the result is in norm_value
+    result_field.set(data_length, norm_value, true);
+}
+
+//-------------------------------------------------------------------------
+// End - HeaderNormalizer class
+//-------------------------------------------------------------------------
+
+//-------------------------------------------------------------------------
+// NormalizedHeader class
+//-------------------------------------------------------------------------
+const Field& NormalizedHeader::get_norm(HttpInfractions* infractions, HttpEventGen* events,
+    const HttpEnums::HeaderId header_name_id[], const Field header_value[],
+    const int32_t num_headers)
+{
+    if (norm.length() == STAT_NOT_COMPUTE)
+    {
+        header_norms[id]->normalize(id, count, infractions, events,
+            header_name_id, header_value, num_headers, norm, comma_separated_raw);
+    }
+    
+    return norm;
+}
+
+const Field& NormalizedHeader::get_comma_separated_raw(HttpMsgHeadShared& msg_head,
+    HttpInfractions* infractions, HttpEventGen* events, const HttpEnums::HeaderId header_name_id[],
+    const Field header_value[], const int32_t num_headers)
+{
+    if (count == 1)
+        return msg_head.get_header_value_raw(id);
+
+    if (comma_separated_raw.length() == STAT_NOT_COMPUTE)
+    {
+        header_norms[id]->normalize(id, count, infractions, events,
+            header_name_id, header_value, num_headers, norm, comma_separated_raw);
+    }
+
+    return comma_separated_raw;
+}
diff --git a/src/service_inspectors/http_inspect/http_normalized_header.h b/src/service_inspectors/http_inspect/http_normalized_header.h

new file mode 100644 (file)

index 0000000..c5ea79e
--- /dev/null
+++ b/src/service_inspectors/http_inspect/http_normalized_header.h
@@ -0,0 +1,71 @@
+//--------------------------------------------------------------------------
+// Copyright (C) 2014-2021 Cisco and/or its affiliates. All rights reserved.
+//
+// This program is free software; you can redistribute it and/or modify it
+// under the terms of the GNU General Public License Version 2 as published
+// by the Free Software Foundation.  You may not use, modify or distribute
+// this program under any other version of the GNU General Public License.
+//
+// This program is distributed in the hope that it will be useful, but
+// WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+// General Public License for more details.
+//
+// You should have received a copy of the GNU General Public License along
+// with this program; if not, write to the Free Software Foundation, Inc.,
+// 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
+//--------------------------------------------------------------------------
+// http_normalized_header.h author Tom Peters <thopeter@cisco.com>
+
+#ifndef HTTP_NORMALIZED_HEADER_H
+#define HTTP_NORMALIZED_HEADER_H
+
+#include "http_event.h"
+#include "http_field.h"
+
+class HttpMsgHeadShared;
+
+//-------------------------------------------------------------------------
+// NormalizedHeader class
+//-------------------------------------------------------------------------
+/* Holds the lazily computed values for one header id: the normalized value (norm) and, for
+ * repeated headers, the comma-joined raw value (comma_separated_raw). The accessors call
+ * HeaderNormalizer::normalize() through header_norms[id] the first time a value is requested
+ * and return the stored Field afterwards.
+ */
+class NormalizedHeader
+{
+public:
+    NormalizedHeader(NormalizedHeader* next_, int32_t count_, HttpEnums::HeaderId id_) :
+        next(next_), count(count_), id(id_) {}
+    const Field& get_norm(HttpInfractions* infractions, HttpEventGen* events,
+        const HttpEnums::HeaderId header_name_id[], const Field header_value[],
+        const int32_t num_headers);
+    const Field& get_comma_separated_raw(HttpMsgHeadShared& msg_head, HttpInfractions* infractions,
+       HttpEventGen* events, const HttpEnums::HeaderId header_name_id[], const Field header_value[],
+        const int32_t num_headers);
+
+    NormalizedHeader* next;          // another NormalizedHeader; presumably the next list node
+    int32_t count;                   // how many headers with this id normalize() will combine
+    const HttpEnums::HeaderId id;    // header id; also the index used into header_norms
+
+private:  
+    // Header normalization strategies. There should be one defined for every different way we can
+    // process a header field value.
+    class HeaderNormalizer;
+    static const HeaderNormalizer NORMALIZER_BASIC;
+    static const HeaderNormalizer NORMALIZER_HOST;
+    static const HeaderNormalizer NORMALIZER_CASE_INSENSITIVE;
+    static const HeaderNormalizer NORMALIZER_NUMBER;
+    static const HeaderNormalizer NORMALIZER_TOKEN_LIST;
+    static const HeaderNormalizer NORMALIZER_METHOD_LIST;
+    static const HeaderNormalizer NORMALIZER_DATE;
+    static const HeaderNormalizer NORMALIZER_URI;
+    static const HeaderNormalizer NORMALIZER_CONTENT_LENGTH;
+    static const HeaderNormalizer NORMALIZER_CHARSET;
+
+    // Master table of known header fields and their normalization strategies.
+    static const HeaderNormalizer* const header_norms[];
+
+    Field norm;                  // normalized value; get_norm() computes it on first use
+    Field comma_separated_raw;   // comma-joined raw value; only filled when count > 1
+};
+ 
+#endif
+
diff --git a/src/service_inspectors/http_inspect/http_tables.cc b/src/service_inspectors/http_inspect/http_tables.cc

index ffa484da78b6d3b456a02b37acd6bdd3b6fe642f..e93e4f79a349639d1af11a28a0f09bdb0a4f4720 100755 (executable)
--- a/src/service_inspectors/http_inspect/http_tables.cc
+++ b/src/service_inspectors/http_inspect/http_tables.cc
@@ -197,112 +197,6 @@ const StrCode HttpMsgHeadShared::transfer_encoding_list[] =
      { 0,                     nullptr }
  };
  
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_BASIC
-    { EVENT__NONE, INF__NONE, false, nullptr, nullptr, nullptr };
-
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_HOST
-    { EVENT_MULTIPLE_HOST_HDRS, INF_MULTIPLE_HOST_HDRS, false, nullptr, nullptr, nullptr };
-
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_CASE_INSENSITIVE
-    { EVENT__NONE, INF__NONE, false, norm_to_lower, nullptr, nullptr };
-
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_NUMBER
-    { EVENT_REPEATED_HEADER, INF_REPEATED_HEADER, false, norm_remove_lws, nullptr, nullptr };
-
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_TOKEN_LIST
-    { EVENT__NONE, INF__NONE, false, norm_remove_lws, norm_to_lower, nullptr };
-
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_METHOD_LIST
-    { EVENT__NONE, INF__NONE, false, norm_remove_lws, nullptr, nullptr };
-
-// FIXIT-L implement a date normalization function that converts the three legal formats into a
-// single standard format. For now we do nothing special for dates. This object is a placeholder
-// to keep track of which headers have date values.
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_DATE
-    { EVENT__NONE, INF__NONE, false, nullptr, nullptr, nullptr };
-
-// FIXIT-M implement a URI normalization function, probably by extending existing URI capabilities
-// to cover relative formats
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_URI
-    { EVENT__NONE, INF__NONE, false, nullptr, nullptr, nullptr };
-
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_CONTENT_LENGTH
-    { EVENT_MULTIPLE_CONTLEN, INF_MULTIPLE_CONTLEN, true, norm_remove_lws, nullptr, nullptr };
-
-const HeaderNormalizer HttpMsgHeadShared::NORMALIZER_CHARSET
-    { EVENT__NONE, INF__NONE, false, norm_remove_quotes_lws, norm_to_lower, nullptr };
-
-const HeaderNormalizer* const HttpMsgHeadShared::header_norms[HEAD__MAX_VALUE + MAX_CUSTOM_HEADERS + 1] = {
-    &NORMALIZER_BASIC,      // 0
-    &NORMALIZER_BASIC,      // HEAD__OTHER
-    &NORMALIZER_TOKEN_LIST, // HEAD_CACHE_CONTROL
-    &NORMALIZER_TOKEN_LIST, // HEAD_CONNECTION
-    &NORMALIZER_DATE,       // HEAD_DATE
-    &NORMALIZER_TOKEN_LIST, // HEAD_PRAGMA
-    &NORMALIZER_TOKEN_LIST, // HEAD_TRAILER
-    &NORMALIZER_BASIC,      // HEAD_COOKIE
-    &NORMALIZER_BASIC,      // HEAD_SET_COOKIE
-    &NORMALIZER_TOKEN_LIST, // HEAD_TRANSFER_ENCODING
-    &NORMALIZER_TOKEN_LIST, // HEAD_UPGRADE
-    &NORMALIZER_BASIC,      // HEAD_VIA
-    &NORMALIZER_BASIC,      // HEAD_WARNING
-    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT
-    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_CHARSET
-    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_ENCODING
-    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_LANGUAGE
-    &NORMALIZER_BASIC,      // HEAD_AUTHORIZATION
-    &NORMALIZER_CASE_INSENSITIVE, // HEAD_EXPECT
-    &NORMALIZER_BASIC,      // HEAD_FROM
-    &NORMALIZER_HOST,       // HEAD_HOST
-    &NORMALIZER_BASIC,      // HEAD_IF_MATCH
-    &NORMALIZER_DATE,       // HEAD_IF_MODIFIED_SINCE
-    &NORMALIZER_BASIC,      // HEAD_IF_NONE_MATCH
-    &NORMALIZER_BASIC,      // HEAD_IF_RANGE
-    &NORMALIZER_DATE,       // HEAD_IF_UNMODIFIED_SINCE
-    &NORMALIZER_BASIC,      // HEAD_MAX_FORWARDS
-    &NORMALIZER_BASIC,      // HEAD_PROXY_AUTHORIZATION
-    &NORMALIZER_BASIC,      // HEAD_RANGE
-    &NORMALIZER_URI,        // HEAD_REFERER
-    &NORMALIZER_TOKEN_LIST, // HEAD_TE
-    &NORMALIZER_BASIC,      // HEAD_USER_AGENT
-    &NORMALIZER_TOKEN_LIST, // HEAD_ACCEPT_RANGES
-    &NORMALIZER_NUMBER,     // HEAD_AGE
-    &NORMALIZER_BASIC,      // HEAD_ETAG
-    &NORMALIZER_URI,        // HEAD_LOCATION
-    &NORMALIZER_BASIC,      // HEAD_PROXY_AUTHENTICATE
-    &NORMALIZER_BASIC,      // HEAD_RETRY_AFTER, may be date or number
-    &NORMALIZER_BASIC,      // HEAD_SERVER
-    &NORMALIZER_TOKEN_LIST, // HEAD_VARY
-    &NORMALIZER_BASIC,      // HEAD_WWW_AUTHENTICATE
-    &NORMALIZER_METHOD_LIST, // HEAD_ALLOW
-    &NORMALIZER_TOKEN_LIST, // HEAD_CONTENT_ENCODING
-    &NORMALIZER_TOKEN_LIST, // HEAD_CONTENT_LANGUAGE
-    &NORMALIZER_CONTENT_LENGTH, // HEAD_CONTENT_LENGTH
-    &NORMALIZER_URI,        // HEAD_CONTENT_LOCATION
-    &NORMALIZER_BASIC,      // HEAD_CONTENT_MD5
-    &NORMALIZER_BASIC,      // HEAD_CONTENT_RANGE
-    &NORMALIZER_CHARSET,    // HEAD_CONTENT_TYPE
-    &NORMALIZER_DATE,       // HEAD_EXPIRES
-    &NORMALIZER_DATE,       // HEAD_LAST_MODIFIED
-    &NORMALIZER_BASIC,      // HEAD_X_FORWARDED_FOR
-    &NORMALIZER_BASIC,      // HEAD_TRUE_CLIENT_IP
-    &NORMALIZER_BASIC,      // HEAD_X_WORKING_WITH
-    &NORMALIZER_TOKEN_LIST, // HEAD_CONTENT_TRANSFER_ENCODING
-    &NORMALIZER_BASIC,      // HEAD_MIME_VERSION
-    &NORMALIZER_BASIC,      // HEAD_PROXY_AGENT
-    &NORMALIZER_BASIC,      // HEAD_CONTENT_DISPOSITION
-    &NORMALIZER_TOKEN_LIST, // HEAD_HTTP2_SETTINGS
-    &NORMALIZER_BASIC,      // HEAD__MAX_VALUE
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-    &NORMALIZER_BASIC,      // HEAD_CUSTOM_XFF_HEADER
-};
-
  const RuleMap HttpModule::http_events[] =
  {
      { EVENT_ASCII,                      "ascii encoding" },
diff --git a/src/service_inspectors/http_inspect/ips_http.cc b/src/service_inspectors/http_inspect/ips_http.cc

index 2eaf8d7073ed7319f03f6f4a5a1dad27267b174a..06ece90b8f636d2399ac6611349c0faa32978329 100644 (file)
--- a/src/service_inspectors/http_inspect/ips_http.cc
+++ b/src/service_inspectors/http_inspect/ips_http.cc
@@ -618,6 +618,8 @@ static const IpsApi raw_cookie_api =
  
  static const Parameter http_raw_header_params[] =
  {
+    { "field", Parameter::PT_STRING, nullptr, nullptr,
+        "restrict to given header. Header name is case insensitive." },
      { "request", Parameter::PT_IMPLIED, nullptr, nullptr,
          "match against the headers from the request message even when examining the response" },
      { "with_header", Parameter::PT_IMPLIED, nullptr, nullptr,
@@ -824,6 +826,8 @@ static const IpsApi raw_status_api =
  
  static const Parameter http_raw_trailer_params[] =
  {
+    { "field", Parameter::PT_STRING, nullptr, nullptr,
+        "restrict to given trailer. Trailer name is case insensitive." },
      { "request", Parameter::PT_IMPLIED, nullptr, nullptr,
          "match against the trailers from the request message even when examining the response" },
      { "with_header", Parameter::PT_IMPLIED, nullptr, nullptr,
author	Tom Peters (thopeter) <thopeter@cisco.com>
	Wed, 18 Aug 2021 18:14:00 +0000 (18:14 +0000)
committer	Tom Peters (thopeter) <thopeter@cisco.com>
	Wed, 18 Aug 2021 18:14:00 +0000 (18:14 +0000)
doc/user/http_inspect.txt		patch \| blob \| blame \| history
src/service_inspectors/http_inspect/CMakeLists.txt		patch \| blob \| blame \| history
src/service_inspectors/http_inspect/http_header_normalizer.cc	[deleted file]	patch \| blob \| blame \| history
src/service_inspectors/http_inspect/http_header_normalizer.h	[deleted file]	patch \| blob \| blame \| history
src/service_inspectors/http_inspect/http_msg_head_shared.cc		patch \| blob \| blame \| history
src/service_inspectors/http_inspect/http_msg_head_shared.h		patch \| blob \| blame \| history
src/service_inspectors/http_inspect/http_msg_header.cc		patch \| blob \| blame \| history
src/service_inspectors/http_inspect/http_msg_section.cc		patch \| blob \| blame \| history
src/service_inspectors/http_inspect/http_normalized_header.cc	[new file with mode: 0644]	patch \| blob
src/service_inspectors/http_inspect/http_normalized_header.h	[new file with mode: 0644]	patch \| blob
src/service_inspectors/http_inspect/http_tables.cc		patch \| blob \| blame \| history
src/service_inspectors/http_inspect/ips_http.cc		patch \| blob \| blame \| history