git.ipfire.org Git - thirdparty/snort3.git/commitdiff
http_inspect: publish on sse event boundaries (#5279)
author Anna Norokh <anorokh@cisco.com>
Fri, 10 Apr 2026 00:56:26 +0000 (03:56 +0300)
committer GitHub <noreply@github.com>
Fri, 10 Apr 2026 00:56:26 +0000 (20:56 -0400)
* skip detection (run_detection) when a partial flush is done only to publish on an SSE event boundary
* introduce new peg counter ("partial_publishes") for publish-only partial flushes

Co-authored-by: Adrian Mamolea <admamole@cisco.com>
19 files changed:
src/pub_sub/http_publish_length_event.h
src/pub_sub/test/pub_sub_http_transaction_end_event_test.cc
src/service_inspectors/http_inspect/http_cutter.cc
src/service_inspectors/http_inspect/http_cutter.h
src/service_inspectors/http_inspect/http_enum.h
src/service_inspectors/http_inspect/http_flow_data.cc
src/service_inspectors/http_inspect/http_flow_data.h
src/service_inspectors/http_inspect/http_inspect.cc
src/service_inspectors/http_inspect/http_msg_body.cc
src/service_inspectors/http_inspect/http_msg_header.cc
src/service_inspectors/http_inspect/http_stream_splitter.h
src/service_inspectors/http_inspect/http_stream_splitter_finish.cc
src/service_inspectors/http_inspect/http_stream_splitter_scan.cc
src/service_inspectors/http_inspect/http_tables.cc
src/service_inspectors/http_inspect/http_transaction.h
src/service_inspectors/http_inspect/test/http_decompression_test.cc
src/service_inspectors/http_inspect/test/http_msg_head_shared_find_next_header_test.cc
src/service_inspectors/http_inspect/test/http_transaction_test.cc
src/service_inspectors/http_inspect/test/http_unit_test_helpers.h

index dffc4f4b289ce24669688b388a6294b19758a62c..507365ac22796e38c71a1292f78c09cdab8fa12a 100644 (file)
 #ifndef HTTP_PUBLISH_LENGTH_EVENT_H
 #define HTTP_PUBLISH_LENGTH_EVENT_H
 
-// An event to dynamically update the publish length used by http_inspect
+// An event to dynamically update the publish length used by http_inspect.
 // Subscribers MUST retain the given publish length if it's larger than
 // the one they desire. That way all subscribers can work together to
-// set the publish length.
+// set the publish length. Subscribers can also request additional
+// publish behavior, such as publishing on SSE event boundaries.
 
 namespace snort
 {
@@ -54,10 +55,17 @@ public:
     bool should_publish_body() const
     { return publish_body; }
 
+    void set_publish_on_sse_event_boundary()
+    { publish_on_sse_event_boundary = true; }
+
+    bool should_publish_on_sse_event_boundary() const
+    { return publish_on_sse_event_boundary; }
+
 private:
     bool is_data_originates_from_client;
     int32_t publish_length;
     bool publish_body = false;
+    bool publish_on_sse_event_boundary = false;
 };
 
 }
index fa87e709cd9b61a6c54c12766703c053c4d9f2b8..2526a30b988a272ac7d5087699a6721ec7377f14 100644 (file)
@@ -111,7 +111,8 @@ const snort::StreamBuffer HttpStreamSplitter::reassemble(snort::Flow*, unsigned,
     return buf;
 }
 bool HttpStreamSplitter::finish(snort::Flow*) { return false; }
-void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t) { }
+void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t,
+    HttpEnums::PartialFlushType) { }
 
 HttpMsgHeader::HttpMsgHeader(const uint8_t* buffer, const uint16_t buf_size,
     HttpFlowData* session_data_, SourceId source_id_, bool buf_owner, Flow* flow_,
index 2cf6fa43c8b7944c06bdab5d87639b207bd32cba..a292e9ca136ae0d30304e398530b8d5de66a4478 100644 (file)
@@ -28,6 +28,7 @@
 #include "http_enum.h"
 #include "http_flow_data.h"
 #include "http_module.h"
+#include "http_transaction.h"
 
 using namespace HttpEnums;
 using namespace HttpCommon;
@@ -327,6 +328,10 @@ HttpBodyCutter::DecompressOutput HttpBodyCutter::decompress(const uint8_t* src,
 HttpBodyCutter::HttpBodyCutter(bool accelerated_blocking_, ScriptFinder* finder_,
     HttpFlowData* const session_data, SourceId source_id)
     : accelerated_blocking(accelerated_blocking_)
+    , sse_state(source_id == SRC_SERVER &&
+        session_data->transaction[source_id] &&
+        session_data->transaction[source_id]->should_publish_on_sse_event_boundary() ?
+        SSE_START : SSE_DISABLED)
     , finder(finder_)
     , session_data(session_data)
     , source_id(source_id)
@@ -374,7 +379,8 @@ ScanResult HttpBodyClCutter::cut(const uint8_t* buffer, uint32_t length,
 
     if (octets_seen + length < flow_target)
     {
-        const auto [accelerate, consumed] = analyze_body(buffer, length, infractions, events);
+        const auto flush_ctx = analyze_body(buffer, length, infractions, events);
+        const auto consumed = flush_ctx.consumed;
 
         if ( consumed < length )
         {
@@ -384,14 +390,17 @@ ScanResult HttpBodyClCutter::cut(const uint8_t* buffer, uint32_t length,
         }
 
         octets_seen += length;
-        return accelerate ? SCAN_NOT_FOUND_ACCELERATE : SCAN_NOT_FOUND;
+        if ( flush_ctx.is_none() )
+            return SCAN_NOT_FOUND;
+
+        return flush_ctx.is_publish() ? SCAN_NOT_FOUND_PARTIAL_PUBLISH : SCAN_NOT_FOUND_ACCELERATE;
     }
 
     if (!stretch)
     {
         assert(flow_target >= octets_seen);
         const uint32_t planned_flush = flow_target - octets_seen;
-        const auto [_, consumed] = analyze_body(buffer, planned_flush, infractions, events);
+        const auto consumed = analyze_body(buffer, planned_flush, infractions, events).consumed;
 
         num_flush = consumed;
         remaining -= octets_seen + num_flush;
@@ -409,7 +418,7 @@ ScanResult HttpBodyClCutter::cut(const uint8_t* buffer, uint32_t length,
         else
             planned_flush = flow_target - octets_seen;
 
-        const auto [_, consumed] = analyze_body(buffer, planned_flush, infractions, events);
+        const auto consumed = analyze_body(buffer, planned_flush, infractions, events).consumed;
 
         num_flush = consumed;
         remaining -= octets_seen + num_flush;
@@ -456,7 +465,8 @@ ScanResult HttpBodyOldCutter::cut(const uint8_t* buffer, uint32_t length,
 
     if (octets_seen + length < flow_target)
     {
-        const auto [accelerate, consumed] = analyze_body(buffer, length, infractions, events);
+        const auto flush_ctx = analyze_body(buffer, length, infractions, events);
+        const auto consumed = flush_ctx.consumed;
 
         if ( consumed < length )
         {
@@ -466,13 +476,16 @@ ScanResult HttpBodyOldCutter::cut(const uint8_t* buffer, uint32_t length,
 
         // Not enough data yet to create a message section
         octets_seen += length;
-        return accelerate ? SCAN_NOT_FOUND_ACCELERATE : SCAN_NOT_FOUND;
+        if ( flush_ctx.is_none() )
+            return SCAN_NOT_FOUND;
+
+        return flush_ctx.is_publish() ? SCAN_NOT_FOUND_PARTIAL_PUBLISH : SCAN_NOT_FOUND_ACCELERATE;
     }
     else if (stretch && (octets_seen + length <= flow_target + MAX_SECTION_STRETCH))
     {
         // Cut the section at the end of this TCP segment to avoid splitting a packet
         const uint32_t planned_flush = length;
-        const auto [_, consumed] = analyze_body(buffer, planned_flush, infractions, events);
+        const auto consumed = analyze_body(buffer, planned_flush, infractions, events).consumed;
 
         num_flush = consumed;
 
@@ -483,7 +496,7 @@ ScanResult HttpBodyOldCutter::cut(const uint8_t* buffer, uint32_t length,
         // Cut the section at the target length. Either stretching is not allowed or the end of
         // the segment is too far away.
         const uint32_t planned_flush = flow_target - octets_seen;
-        const auto [_, consumed] = analyze_body(buffer, planned_flush, infractions, events);
+        const auto consumed = analyze_body(buffer, planned_flush, infractions, events).consumed;
 
         num_flush = consumed;
 
@@ -508,6 +521,7 @@ ScanResult HttpBodyChunkCutter::cut(const uint8_t* buffer, uint32_t length,
     const uint32_t adjusted_target = stretch ? MAX_SECTION_STRETCH + flow_target : flow_target;
 
     bool accelerate_this_packet = false;
+    bool partial_publish_this_packet = false;
 
     for (int32_t k=0; k < static_cast<int32_t>(length); k++)
     {
@@ -698,9 +712,12 @@ ScanResult HttpBodyChunkCutter::cut(const uint8_t* buffer, uint32_t length,
 
             if ( accelerated_blocking or !discard_mode )
             {
-                const auto [accelerate, consumed] = analyze_body(buffer + k, skip_amount,
-                    infractions, events);
-                accelerate_this_packet = accelerate or accelerate_this_packet;
+                const auto flush_ctx = analyze_body(buffer + k, skip_amount, infractions, events);
+                const auto consumed = flush_ctx.consumed;
+                if ( flush_ctx.is_publish() )
+                    partial_publish_this_packet = true;
+                else if ( flush_ctx.is_accelerate() )
+                    accelerate_this_packet = true;
 
                 if ( consumed < skip_amount and !discard_mode )
                 {
@@ -788,9 +805,12 @@ ScanResult HttpBodyChunkCutter::cut(const uint8_t* buffer, uint32_t length,
             skip_amount = (skip_amount <= adjusted_target-data_seen) ? skip_amount :
                 adjusted_target-data_seen;
 
-            const auto [accelerate, consumed] = analyze_body(buffer + k,
-                skip_amount, infractions, events);
-            accelerate_this_packet = accelerate or accelerate_this_packet;
+            const auto flush_ctx = analyze_body(buffer + k, skip_amount, infractions, events);
+            const auto consumed = flush_ctx.consumed;
+            if ( flush_ctx.is_publish() )
+                partial_publish_this_packet = true;
+            else if ( flush_ctx.is_accelerate() )
+                accelerate_this_packet = true;
 
             if ( consumed < skip_amount )
             {
@@ -827,10 +847,13 @@ ScanResult HttpBodyChunkCutter::cut(const uint8_t* buffer, uint32_t length,
 
     octets_seen += length;
 
-    if (accelerate_this_packet || (zero_chunk && data_seen))
-        return SCAN_NOT_FOUND_ACCELERATE;
+    if ( zero_chunk && data_seen )
+        accelerate_this_packet = true;
 
-    return SCAN_NOT_FOUND;
+    if ( !accelerate_this_packet && !partial_publish_this_packet )
+        return SCAN_NOT_FOUND;
+
+    return accelerate_this_packet ? SCAN_NOT_FOUND_ACCELERATE : SCAN_NOT_FOUND_PARTIAL_PUBLISH;
 }
 
 ScanResult HttpBodyHXCutter::cut(const uint8_t* buffer, uint32_t length, HttpInfractions* infractions,
@@ -870,7 +893,8 @@ ScanResult HttpBodyHXCutter::cut(const uint8_t* buffer, uint32_t length, HttpInf
         if (octets_seen + length < flow_target)
         {
             // Not enough data yet to create a message section
-            const auto [accelerate, consumed] = analyze_body(buffer, length, infractions, events);
+            const auto flush_ctx = analyze_body(buffer, length, infractions, events);
+            const auto consumed = flush_ctx.consumed;
 
             if ( consumed < length )
             {
@@ -881,7 +905,10 @@ ScanResult HttpBodyHXCutter::cut(const uint8_t* buffer, uint32_t length, HttpInf
 
             octets_seen += length;
             total_octets_scanned += length;
-            return accelerate ? SCAN_NOT_FOUND_ACCELERATE : SCAN_NOT_FOUND;
+            if ( flush_ctx.is_none() )
+                return SCAN_NOT_FOUND;
+
+            return flush_ctx.is_publish() ? SCAN_NOT_FOUND_PARTIAL_PUBLISH : SCAN_NOT_FOUND_ACCELERATE;
         }
         else
         {
@@ -891,7 +918,7 @@ ScanResult HttpBodyHXCutter::cut(const uint8_t* buffer, uint32_t length, HttpInf
             else
                 planned_flush = flow_target - octets_seen;
 
-            const auto [_, consumed] = analyze_body(buffer, planned_flush, infractions, events);
+            const auto consumed = analyze_body(buffer, planned_flush, infractions, events).consumed;
 
             num_flush = consumed;
             total_octets_scanned += num_flush;
@@ -932,10 +959,10 @@ ScanResult HttpBodyHXCutter::cut(const uint8_t* buffer, uint32_t length, HttpInf
 // requires script detection. Exactly what we are looking for is encapsulated in dangerous().
 //
 // Return value FlushContext contains:
-//   accelerate: true indicates a match and enables the packet that completes the matching sequence
-//               to be sent for partial inspection.
 //   consumed: how many input bytes the decompressor actually processed. When less than the
 //             input length the decompressor buffer is full and the caller should flush early.
+//   decision: NONE when no early action is needed, ACCELERATE for detect-driven partial
+//             inspection, PUBLISH for publish-only partial inspection on SSE boundaries.
 //
 // Any attempt to optimize this code should be mindful that once you skip any part of the message
 // body, dangerous() loses the ability to unzip subsequent data.
@@ -947,18 +974,92 @@ HttpBodyCutter::FlushContext HttpBodyCutter::analyze_body(const uint8_t* data, u
     {
         const auto [_, consumed] = decompress(data, length, infractions, events);
         assert(consumed <= length);
-        return { false, consumed };
+
+        if ( (sse_state != SSE_DISABLED) &&
+            (session_data->compress[source_id] == nullptr) && has_sse_boundary(data, consumed) )
+        {
+            return { consumed, FlushContext::PUBLISH };
+        }
+
+        return { consumed, FlushContext::NONE };
     }
 
-    const auto result = dangerous(data, length, infractions, events);
+    auto result = dangerous(data, length, infractions, events);
     assert(result.consumed <= length);
 
-    if ( result.accelerate )
+    if ( result.is_accelerate() )
         HttpModule::increment_peg_counts(PEG_SCRIPT_DETECTION);
 
+    // FIXIT-E blank-line boundary detection currently inspects only the raw response body.
+    // That is sufficient for the current work in progress, but compressed response bodies need
+    // decompression-aware boundary accounting later.
+    if ( result.is_none() && (sse_state != SSE_DISABLED) &&
+        (session_data->compress[source_id] == nullptr) && has_sse_boundary(data, result.consumed) )
+    {
+        result.decision = FlushContext::PUBLISH;
+    }
+
     return result;
 }
 
+bool HttpBodyCutter::has_sse_boundary(const uint8_t* data, uint32_t length)
+{
+    for (uint32_t k = 0; k < length; k++)
+    {
+        switch (sse_state)
+        {
+        case SSE_DISABLED:
+        default:
+            break;
+
+        case SSE_START:
+            if ( (data[k] != '\n') && (data[k] != '\r') )
+                sse_state = SSE_DATA_LINE;
+            break;
+
+        case SSE_DATA_LINE:
+            if (data[k] == '\n')
+                sse_state = SSE_EMPTY_LINE;
+            else if (data[k] == '\r')
+                sse_state = SSE_CR_DATA_LINE;
+            break;
+
+        case SSE_CR_DATA_LINE:
+            if (data[k] == '\n')
+                sse_state = SSE_EMPTY_LINE;
+            else
+                sse_state = (data[k] == '\r') ? SSE_CR_EMPTY_LINE : SSE_DATA_LINE;
+            break;
+
+        case SSE_EMPTY_LINE:
+            if (data[k] == '\n')
+            {
+                sse_state = SSE_START;
+                return true;   // blank-line boundary recognized
+            }
+            if (data[k] == '\r')
+            {
+                sse_state = SSE_CR_EMPTY_LINE;
+                break;
+            }
+            sse_state = SSE_DATA_LINE;
+            break;
+
+        case SSE_CR_EMPTY_LINE:
+            if (data[k] == '\n')
+            {
+                sse_state = SSE_START;
+                return true;   // blank-line boundary recognized
+            }
+
+            sse_state = (data[k] == '\r') ? SSE_CR_EMPTY_LINE : SSE_DATA_LINE;
+            break;
+        }
+    }
+
+    return false;
+}
+
 bool HttpBodyCutter::find_partial(const uint8_t* input_buf, uint32_t input_length, bool end)
 {
     for (uint32_t k = 0; k < input_length; k++)
@@ -990,17 +1091,17 @@ HttpBodyCutter::FlushContext HttpBodyCutter::dangerous(const uint8_t* data, uint
     const auto [decompressed, consumed] = decompress(data, length, infractions, events);
 
     if ( !decompressed )
-        return { true, consumed };
+        return { consumed, FlushContext::ACCELERATE };
 
     auto [input_buf, input_length] = *decompressed;
 
     if ( input_length > string_length )
     {
         if ( partial_match and find_partial(input_buf, input_length, true) )
-            return { true, consumed };
+            return { consumed, FlushContext::ACCELERATE };
 
         if ( finder->search(input_buf, input_length) >= 0 )
-            return { true, consumed };
+            return { consumed, FlushContext::ACCELERATE };
 
         uint32_t delta = input_length - string_length + 1;
         input_buf += delta;
@@ -1008,9 +1109,9 @@ HttpBodyCutter::FlushContext HttpBodyCutter::dangerous(const uint8_t* data, uint
     }
 
     if ( find_partial(input_buf, input_length, false) )
-        return { true, consumed };
+        return { consumed, FlushContext::ACCELERATE };
 
-    return { false, consumed };
+    return { consumed, FlushContext::NONE };
 }
 
 uint8_t HttpZeroNineCutter::match[] = { 'H', 'T', 'T', 'P', '/' };
index 37f4a34749cb3370aea3fdeebceaaabea79054ac..588c15279a71a407fc2b9ec7c3ad5ed8f16911b5 100644 (file)
@@ -128,8 +128,19 @@ public:
 private:
     struct FlushContext
     {
-        bool accelerate = false;
+        enum Decision : uint8_t
+        {
+            ACCELERATE,
+            PUBLISH,
+            NONE,
+        };
+
         uint32_t consumed = 0;
+        Decision decision = NONE;
+
+        bool is_none() const { return decision == NONE; }
+        bool is_publish() const { return decision == PUBLISH; }
+        bool is_accelerate() const { return decision == ACCELERATE; }
     };
 
     struct DecompressOutput
@@ -146,12 +157,24 @@ protected:
 
     const bool accelerated_blocking;
 private:
+    enum SseState : uint8_t
+    {
+        SSE_DISABLED,
+        SSE_START,
+        SSE_DATA_LINE,
+        SSE_CR_DATA_LINE,
+        SSE_EMPTY_LINE,
+        SSE_CR_EMPTY_LINE,
+    };
+
     FlushContext dangerous(const uint8_t* data, uint32_t length,
         HttpInfractions* infractions, HttpEventGen* events);
     bool find_partial(const uint8_t*, uint32_t, bool);
+    bool has_sse_boundary(const uint8_t* data, uint32_t length);
 
     uint8_t partial_match = 0;
     uint8_t string_length = 0;
+    SseState sse_state = SSE_DISABLED;
     ScriptFinder* const finder;
     const uint8_t* match_string = nullptr;
     const uint8_t* match_string_upper = nullptr;
@@ -233,4 +256,3 @@ private:
 };
 
 #endif
-
index 81cffcfb512a0a7f6e0b1067e43906516fe224cb..158986a9d6b9ab92cf5d5e65b6c0386e4c852d5e 100755 (executable)
@@ -70,16 +70,20 @@ enum PEG_COUNT { PEG_FLOW = 0, PEG_SCAN, PEG_REASSEMBLE, PEG_INSPECT, PEG_REQUES
     PEG_GET, PEG_HEAD, PEG_POST, PEG_PUT, PEG_DELETE, PEG_CONNECT, PEG_OPTIONS, PEG_TRACE,
     PEG_OTHER_METHOD, PEG_REQUEST_BODY, PEG_CHUNKED, PEG_URI_NORM, PEG_URI_PATH, PEG_URI_CODING,
     PEG_CONCURRENT_SESSIONS, PEG_MAX_CONCURRENT_SESSIONS, PEG_SCRIPT_DETECTION,
-    PEG_PARTIAL_INSPECT, PEG_EXCESS_PARAMS, PEG_PARAMS, PEG_CUTOVERS, PEG_SSL_SEARCH_ABND_EARLY,
+    PEG_PARTIAL_INSPECT, PEG_PARTIAL_PUBLISH, PEG_EXCESS_PARAMS, PEG_PARAMS, PEG_CUTOVERS,
+    PEG_SSL_SEARCH_ABND_EARLY,
     PEG_PIPELINED_FLOWS, PEG_PIPELINED_REQUESTS, PEG_TOTAL_BYTES, PEG_JS_INLINE, PEG_JS_EXTERNAL,
     PEG_JS_PDF, PEG_SKIP_MIME_ATTACH, PEG_COMPRESSED_GZIP, PEG_COMPRESSED_GZIP_FAILED, PEG_COMPRESSED_DEFLATE,
     PEG_INCORRECT_DEFLATE_HEADER, PEG_COMPRESSED_DEFLATE_FAILED, PEG_COMPRESSED_NOT_SUPPORTED,
     PEG_COMPRESSED_UNKNOWN, PEG_MAX_PUBLISH_DEPTH_HITS, PEG_COUNT_MAX};
 
 // Result of scanning by splitter
-enum ScanResult { SCAN_NOT_FOUND, SCAN_NOT_FOUND_ACCELERATE, SCAN_FOUND, SCAN_FOUND_PIECE,
+enum ScanResult { SCAN_NOT_FOUND, SCAN_NOT_FOUND_ACCELERATE,
+    SCAN_NOT_FOUND_PARTIAL_PUBLISH, SCAN_FOUND, SCAN_FOUND_PIECE,
     SCAN_DISCARD, SCAN_DISCARD_PIECE, SCAN_ABORT };
 
+enum PartialFlushType : uint8_t { PF_NONE, PF_DETECT, PF_PUBLISH };
+
 // State machine for chunk parsing
 enum ChunkState { CHUNK_NEWLINES, CHUNK_ZEROS, CHUNK_LEADING_WS, CHUNK_NUMBER, CHUNK_TRAILING_WS,
     CHUNK_OPTIONS, CHUNK_HCRLF, CHUNK_DATA, CHUNK_DCRLF1, CHUNK_DCRLF2, CHUNK_BAD };
@@ -475,4 +479,3 @@ extern const std::map <HttpEnums::VersionId, const char*> VersionEnumToStr;
 } // end namespace HttpEnums
 
 #endif
-
index 7f951b96f16d049e584bbeb1e5d3aff2f7174b5e..8ee9cd06faa13f575ea7e34ed49811740cc4ce48 100644 (file)
@@ -269,7 +269,7 @@ void HttpFlowData::finish_hx_body(HttpCommon::SourceId source_id, HttpCommon::HX
     assert((hx_body_state[source_id] == HX_BODY_NOT_COMPLETE) ||
         (hx_body_state[source_id] == HX_BODY_LAST_SEG));
     hx_body_state[source_id] = state;
-    partial_flush[source_id] = false;
+    partial_flush[source_id] = HttpEnums::PF_NONE;
     if (clear_partial_buffer)
     {
         // We've already sent all data through detection so no need to reinspect. Just need to
index e4a929abfc0b6b60c707053a72256918ceac4bc4..c9fcff7c0b6988839548d9bc9785c40922910324 100644 (file)
@@ -126,7 +126,7 @@ private:
     int32_t octets_reassembled[2] = { HttpCommon::STAT_NOT_PRESENT, HttpCommon::STAT_NOT_PRESENT };
     int32_t num_head_lines[2] = { HttpCommon::STAT_NOT_PRESENT, HttpCommon::STAT_NOT_PRESENT };
     bool tcp_close[2] = { false, false };
-    bool partial_flush[2] = { false, false };
+    HttpEnums::PartialFlushType partial_flush[2] = { HttpEnums::PF_NONE, HttpEnums::PF_NONE };
     uint64_t last_connect_trans_w_early_traffic = 0;
 
     HttpCompressStream* compress[2] = { nullptr, nullptr };
index 99bfa9b959a0c57dd8b8c98cedf271e4e3bb7e71..8c4237e08ec4eca97e9512b5a58ea3dd0f8c27c8 100755 (executable)
@@ -549,10 +549,22 @@ void HttpInspect::process(const uint8_t* data, const uint16_t dsize, Flow* const
     HttpMsgSection* current_section;
     HttpFlowData* session_data = http_get_flow_data(flow);
 
-    if (!session_data->partial_flush[source_id])
+    switch (session_data->partial_flush[source_id])
+    {
+    case PF_NONE:
         HttpModule::increment_peg_counts(PEG_INSPECT);
-    else
+        break;
+    case PF_DETECT:
         HttpModule::increment_peg_counts(PEG_PARTIAL_INSPECT);
+        break;
+    case PF_PUBLISH:
+        HttpModule::increment_peg_counts(PEG_PARTIAL_PUBLISH);
+        break;
+    default:
+        assert(false);
+        HttpModule::increment_peg_counts(PEG_INSPECT);
+        break;
+    }
 
     switch (session_data->section_type[source_id])
     {
@@ -599,7 +611,7 @@ void HttpInspect::process(const uint8_t* data, const uint16_t dsize, Flow* const
 
     current_section->analyze();
     current_section->gen_events();
-    if (!session_data->partial_flush[source_id])
+    if (session_data->partial_flush[source_id] == PF_NONE)
         current_section->update_flow();
     session_data->section_type[source_id] = SEC__NOT_COMPUTE;
 
@@ -624,7 +636,9 @@ void HttpInspect::process(const uint8_t* data, const uint16_t dsize, Flow* const
         p->set_pdu_section(pdu_section);
     }
 
-    if (current_section->run_detection(p))
+    const bool skip_detection = (session_data->partial_flush[source_id] == PF_PUBLISH);
+
+    if (!skip_detection && current_section->run_detection(p))
     {
 #ifdef REG_TEST
         if (HttpTestManager::use_test_output(HttpTestManager::IN_HTTP))
index 4796a72de3dedd265cd988cc49d2c11c48f7a3a1..adb855079bbdc64723670325f95c2852bc0b17c2 100644 (file)
@@ -416,7 +416,7 @@ void HttpMsgBody::analyze()
 
             delete[] partial_detect_buffer;
 
-            if (!session_data->partial_flush[source_id])
+            if (session_data->partial_flush[source_id] == PF_NONE)
             {
                 bookkeeping_regular_flush(partial_detect_length, partial_detect_buffer,
                     partial_js_detect_length, detect_length);
@@ -438,7 +438,7 @@ void HttpMsgBody::analyze()
         }
     }
     body_octets += msg_text.length();
-    if (!session_data->partial_flush[source_id])
+    if (session_data->partial_flush[source_id] == PF_NONE)
         transaction->add_body_len(source_id, detect_data.length());
     partial_inspected_octets = session_data->partial_flush[source_id] ? msg_text.length() : 0;
 }
index 05903744feba8ee80498e2ffe2fa6b3d34774bcd..a8ef289d3aa93ed728f2bba50f8c16cb415f906f 100755 (executable)
@@ -603,11 +603,18 @@ void HttpMsgHeader::prepare_body()
     int32_t new_depth = http_publish_length_event.get_publish_length();
 
     int32_t should_publish = (int32_t)http_publish_length_event.should_publish_body();
+    // FIXIT-E move STASH_PUBLISH_REQUEST_BODY / STASH_PUBLISH_RESPONSE_BODY to the
+    // transaction object as well; this body-publish setting is negotiated and consumed
+    // entirely within http_inspect and fits per-transaction state better than generic
+    // flow stash.
     if (is_request)
         flow->set_attr(STASH_PUBLISH_REQUEST_BODY, should_publish);
     else
         flow->set_attr(STASH_PUBLISH_RESPONSE_BODY, should_publish);
 
+    if (http_publish_length_event.should_publish_on_sse_event_boundary())
+        transaction->set_publish_on_sse_event_boundary();
+
     if (new_depth > session_data->publish_depth_remaining[source_id])
     {
         session_data->publish_octets[source_id] = 0;
index 9fb5ec30ecbfd7f2846c4bb01c6c6c4b19f9e18c..fa9e6e9319a43af0477f649c2f5822f1112ed80c 100644 (file)
@@ -45,9 +45,9 @@ public:
         uint8_t* data, unsigned len, uint32_t flags, unsigned& copied) override;
     bool finish(snort::Flow* flow) override;
     void prep_partial_flush(snort::Flow* flow, uint32_t num_flush) override
-    { prep_partial_flush(flow, num_flush, 0, 0); }
+    { prep_partial_flush(flow, num_flush, 0, 0, HttpEnums::PF_DETECT); }
     void prep_partial_flush(snort::Flow* flow, uint32_t num_flush, uint32_t num_excess,
-        uint32_t num_head_lines);
+        uint32_t num_head_lines, HttpEnums::PartialFlushType partial_flush_type);
     bool is_paf() override { return true; }
     static StreamSplitter::Status status_value(StreamSplitter::Status ret_val, bool http2 = false);
 
index 308bf3ff78c19be59b59c331f6aed6be7d7f68ab..f4df96b2d30820bab1ec9742700593448d942c0d 100644 (file)
@@ -242,7 +242,7 @@ bool HttpStreamSplitter::finish(Flow* flow)
 }
 
 void HttpStreamSplitter::prep_partial_flush(Flow* flow, uint32_t num_flush,
-    uint32_t num_excess, uint32_t num_head_lines)
+    uint32_t num_excess, uint32_t num_head_lines, PartialFlushType partial_flush_type)
 {
     // cppcheck-suppress unreadVariable
     Profile profile(HttpModule::get_profile_stats());
@@ -267,6 +267,6 @@ void HttpStreamSplitter::prep_partial_flush(Flow* flow, uint32_t num_flush,
         session_data->cutter[source_id]->get_is_broken_chunk(),
         session_data->cutter[source_id]->get_num_good_chunks(),
         session_data->cutter[source_id]->get_octets_seen() - num_flush);
-    session_data->partial_flush[source_id] = true;
+    session_data->partial_flush[source_id] = partial_flush_type;
 }
 
index 296addcc1147569b61b08d204f745f2e666d699d..612c0ad0ff0510c4b4f49ce4a3166faff85bd9de 100644 (file)
@@ -202,6 +202,7 @@ StreamSplitter::Status HttpStreamSplitter::call_cutter(Flow* flow, HttpFlowData*
     {
     case SCAN_NOT_FOUND:
     case SCAN_NOT_FOUND_ACCELERATE:
+    case SCAN_NOT_FOUND_PARTIAL_PUBLISH:
         if (cutter->get_octets_seen() == MAX_OCTETS)
         {
             *session_data->get_infractions(source_id) += INF_ENDLESS_HEADER;
@@ -246,9 +247,11 @@ StreamSplitter::Status HttpStreamSplitter::call_cutter(Flow* flow, HttpFlowData*
             }
         }
 
-        if (cut_result == SCAN_NOT_FOUND_ACCELERATE)
+        if (cut_result == SCAN_NOT_FOUND_ACCELERATE ||
+            cut_result == SCAN_NOT_FOUND_PARTIAL_PUBLISH)
         {
-            prep_partial_flush(flow, length, cutter->get_num_excess(), cutter->get_num_head_lines());
+            prep_partial_flush(flow, length, cutter->get_num_excess(), cutter->get_num_head_lines(),
+                (cut_result == SCAN_NOT_FOUND_ACCELERATE) ? PF_DETECT : PF_PUBLISH);
 #ifdef REG_TEST
             if (!HttpTestManager::use_test_input(HttpTestManager::IN_HTTP))
 #endif
@@ -336,7 +339,7 @@ StreamSplitter::Status HttpStreamSplitter::scan(Flow* flow, const uint8_t* data,
 #endif
 
     SectionType& type = session_data->type_expected[source_id];
-    session_data->partial_flush[source_id] = false;
+    session_data->partial_flush[source_id] = PF_NONE;
 
     if (type == SEC_ABORT)
         return status_value(StreamSplitter::ABORT);
index c2fd031b4d299880204a05e137b0d502e5fe6ac3..608f50c9e30e6758e997e98f4c9e8faa31b0899c 100755 (executable)
@@ -388,6 +388,7 @@ const PegInfo HttpModule::peg_names[PEG_COUNT_MAX+1] =
     { CountType::MAX, "max_concurrent_sessions", "maximum concurrent http sessions" },
     { CountType::SUM, "script_detections", "early inspections of scripts in HTTP responses" },
     { CountType::SUM, "partial_inspections", "early inspections done for script detection" },
+    { CountType::SUM, "partial_publishes", "publish-only partial flushes" },
     { CountType::SUM, "excess_parameters", "repeat parameters exceeding max" },
     { CountType::SUM, "parameters", "HTTP parameters inspected" },
     { CountType::SUM, "connect_tunnel_cutovers", "CONNECT tunnel flow cutovers to wizard" },
index 8fdbdecd868312be1d60a8bcd74552ab49cb9ef9..b68ca73cc87846e8873b893db43a292a8557ccc2 100644 (file)
@@ -60,6 +60,10 @@ public:
 
     void set_one_hundred_response();
     bool final_response() const { return !second_response_expected; }
+    bool should_publish_on_sse_event_boundary() const
+    { return publish_on_sse_event_boundary; }
+    void set_publish_on_sse_event_boundary()
+    { publish_on_sse_event_boundary = true; }
 
     void add_body_len(HttpCommon::SourceId source_id, uint64_t len)
     { body_len[source_id] += len; }
@@ -103,6 +107,8 @@ private:
     HttpMsgSection* archive_hdr_list = nullptr;
     HttpInfractions* infractions[2];
 
+    // FIXIT-E compact these flags into a bitset or packed field if more per-transaction
+    // flags are added; separate bool members are easy to add but waste space.
     bool response_seen = false;
     bool one_hundred_response = false;
     bool second_response_expected = false;
@@ -111,6 +117,7 @@ private:
     // transaction in the fairly rare case where the request and response are received in
     // parallel.
     bool shared_ownership = false;
+    bool publish_on_sse_event_boundary = false;
 
     unsigned pub_id;
     snort::Flow* const flow;
@@ -125,4 +132,3 @@ private:
 };
 
 #endif
-
index 8e98f7eae499c5e9d41f7215cb68a55cc6d21c00..0c23bc21c5879d222ad79c32f98eff37ec04c782 100644 (file)
@@ -138,7 +138,8 @@ const snort::StreamBuffer HttpStreamSplitter::reassemble(snort::Flow*, unsigned,
 }
 
 bool HttpStreamSplitter::finish(snort::Flow*) { return false; }
-void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t) { }
+void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t,
+    HttpEnums::PartialFlushType) { }
 void HttpMsgSection::clear_tmp_buffers() { }
 
 HttpTransaction::~HttpTransaction() = default;
index 3a100d6110114e433f0cb1cad1825892d7041b2c..d13edb9b70b53e97241b071a1d6c82a288592166 100644 (file)
@@ -119,7 +119,8 @@ const snort::StreamBuffer HttpStreamSplitter::reassemble(snort::Flow*, unsigned,
     return buf;
 }
 bool HttpStreamSplitter::finish(snort::Flow*) { return false; }
-void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t) {}
+void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t,
+    HttpEnums::PartialFlushType) {}
 
 // HttpMsgSection stubs (http_msg_section.cc not in SOURCES)
 HttpMsgSection::HttpMsgSection(const uint8_t* buffer, const uint16_t buf_size,
index 8e9f29228e4d943f79527c5dcc94ab3fca228e98..e8ab651dde984fe53d2049a3ff14738de0d7b1d7 100644 (file)
@@ -120,7 +120,8 @@ const snort::StreamBuffer HttpStreamSplitter::reassemble(snort::Flow*, unsigned,
     return buf;
 }
 bool HttpStreamSplitter::finish(snort::Flow*) { return false; }
-void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t) { }
+void HttpStreamSplitter::prep_partial_flush(snort::Flow*, uint32_t, uint32_t, uint32_t,
+    HttpEnums::PartialFlushType) { }
 void HttpMsgSection::clear_tmp_buffers() { }
 
 THREAD_LOCAL PegCount HttpModule::peg_counts[PEG_COUNT_MAX] = { };
index 3a3160b4c26a2a06bfe4840adeb9c71523431f7e..0106582a593508028fb96cd9e2fd7acf426abe92 100644 (file)
@@ -51,7 +51,8 @@ public:
         bool partial_flush, uint32_t num_excess)
     {
         assert(flow_data!=nullptr);
-        flow_data->partial_flush[source_id] = partial_flush;
+        flow_data->partial_flush[source_id] = partial_flush ? HttpEnums::PF_DETECT :
+            HttpEnums::PF_NONE;
         flow_data->num_excess[source_id] = num_excess;
     }
 };