Bug 3310: regression: %<pt translates as %<p

author Amos Jeffries <squid3@treenet.co.nz>

Thu, 25 Aug 2011 12:32:02 +0000 (00:32 +1200)

committer Amos Jeffries <squid3@treenet.co.nz>

Thu, 25 Aug 2011 12:32:02 +0000 (00:32 +1200)
author Amos Jeffries <squid3@treenet.co.nz>
Thu, 25 Aug 2011 12:32:02 +0000 (00:32 +1200)
committer Amos Jeffries <squid3@treenet.co.nz>
Thu, 25 Aug 2011 12:32:02 +0000 (00:32 +1200)
diff --git a/src/format/Format.cc b/src/format/Format.cc

index b9fd4c16e38d6c56507dca8ac834d021f3b38db9..8da961ef2b57d3b0fca6aa56a9b8a9c2bc29f3a0 100644 (file)
--- a/src/format/Format.cc
+++ b/src/format/Format.cc
@@ -226,12 +226,7 @@ Format::Format::dump(StoreEntry * entry, const char *name)
                  if (arg)
                      storeAppendPrintf(entry, "{%s}", arg);
  
-                for (struct TokenTableEntry *te = TokenTable; te->config != NULL; te++) {
-                    if (te->token_type == type) {
-                        storeAppendPrintf(entry, "%s", te->config);
-                        break;
-                    }
-                }
+                storeAppendPrintf(entry, "%s", t->label);
  
                  if (t->space)
                      entry->append(" ", 1);
diff --git a/src/format/Tokens.cc b/src/format/Tokens.cc

index 59a04c001e64b9a558f7755d05b9ab064e316022..5e39d9c0679fe68bad1068635211f29b782afe17 100644 (file)
--- a/src/format/Tokens.cc
+++ b/src/format/Tokens.cc
@@ -30,17 +30,36 @@ const char *Format::log_tags[] = {
      "LOG_TYPE_MAX"
  };
  
-struct Format::TokenTableEntry Format::TokenTable[] = {
+// Due to token overlaps between 1 and 2 letter tokens (Bug 3310)
+// We split the token table into sets determined by the token length
+namespace Format {
+
+/// 1-char tokens.
+static struct TokenTableEntry TokenTable1C[] = {
  
      {">a", LFT_CLIENT_IP_ADDRESS},
      {">p", LFT_CLIENT_PORT},
      {">A", LFT_CLIENT_FQDN},
-    {">eui", LFT_CLIENT_EUI},
  
      {"<a", LFT_SERVER_IP_ADDRESS},
      {"<p", LFT_SERVER_PORT},
      {"<A", LFT_SERVER_FQDN_OR_PEER_NAME},
  
+    {">h", LFT_REQUEST_HEADER},
+    {">h", LFT_REQUEST_ALL_HEADERS},
+    {"<h", LFT_REPLY_HEADER},
+    {"<h", LFT_REPLY_ALL_HEADERS},
+
+    {">v", LFT_REQUEST_VERSION_OLD_2X},
+
+    {"%", LFT_PERCENT},
+
+    {NULL, LFT_NONE}           /* this must be last */
+};
+
+/// 2-char tokens
+static struct TokenTableEntry TokenTable2C[] = {
+
      {">la", LFT_CLIENT_LOCAL_IP},
      {"la", LFT_CLIENT_LOCAL_IP_OLD_31},
      {">lp", LFT_CLIENT_LOCAL_PORT},
@@ -64,10 +83,6 @@ struct Format::TokenTableEntry Format::TokenTable[] = {
  
      {">ha", LFT_ADAPTED_REQUEST_HEADER},
      {">ha", LFT_ADAPTED_REQUEST_ALL_HEADERS},
-    {">h", LFT_REQUEST_HEADER},
-    {">h", LFT_REQUEST_ALL_HEADERS},
-    {"<h", LFT_REPLY_HEADER},
-    {"<h", LFT_REPLY_ALL_HEADERS},
  
      {"un", LFT_USER_NAME},
      {"ul", LFT_USER_LOGIN},
@@ -83,8 +98,6 @@ struct Format::TokenTableEntry Format::TokenTable[] = {
      {"<bs", LFT_HTTP_BODY_BYTES_READ},
  
      {"Ss", LFT_SQUID_STATUS},
-    { "err_code", LFT_SQUID_ERROR },
-    { "err_detail", LFT_SQUID_ERROR_DETAIL },
      {"Sh", LFT_SQUID_HIERARCHY},
  
      {"mt", LFT_MIME_TYPE},
@@ -99,7 +112,6 @@ struct Format::TokenTableEntry Format::TokenTable[] = {
      {"ru", LFT_REQUEST_URI},   /* doesn't include the query-string */
      {"rp", LFT_REQUEST_URLPATH_OLD_31},
      /* { "rq", LFT_REQUEST_QUERY }, * /     / * the query-string, INCLUDING the leading ? */
-    {">v", LFT_REQUEST_VERSION_OLD_2X},
      {"rv", LFT_REQUEST_VERSION},
  
      {"<rm", LFT_SERVER_REQ_METHOD},
@@ -127,15 +139,22 @@ struct Format::TokenTableEntry Format::TokenTable[] = {
      {"ea", LFT_EXT_LOG},
      {"sn", LFT_SEQUENCE_NUMBER},
  
-    {"%", LFT_PERCENT},
+    {NULL, LFT_NONE}           /* this must be last */
+};
  
  #if USE_ADAPTATION
+/// Adaptation (adapt::) tokens
+static struct TokenTableEntry TokenTableAdapt[] = {
      {"adapt::all_trs", LTF_ADAPTATION_ALL_XACT_TIMES},
      {"adapt::sum_trs", LTF_ADAPTATION_SUM_XACT_TIMES},
      {"adapt::<last_h", LFT_ADAPTATION_LAST_HEADER},
+    {NULL, LFT_NONE}           /* this must be last */
+};
  #endif
  
  #if ICAP_CLIENT
+/// ICAP (icap::) tokens
+static struct TokenTableEntry TokenTableIcap[] = {
      {"icap::tt", LFT_ICAP_TOTAL_TIME},
      {"icap::<last_h", LFT_ADAPTATION_LAST_HEADER}, // deprecated
  
@@ -154,11 +173,37 @@ struct Format::TokenTableEntry Format::TokenTable[] = {
      {"icap::tio",  LFT_ICAP_IO_TIME},
      {"icap::to",  LFT_ICAP_OUTCOME},
      {"icap::Hs",  LFT_ICAP_STATUS_CODE},
+
+    {NULL, LFT_NONE}           /* this must be last */
+};
  #endif
  
+/// Miscellaneous >2 byte tokens
+static struct TokenTableEntry TokenTableMisc[] = {
+    {">eui", LFT_CLIENT_EUI},
+    { "err_code", LFT_SQUID_ERROR },
+    { "err_detail", LFT_SQUID_ERROR_DETAIL },
      {NULL, LFT_NONE}           /* this must be last */
  };
  
+} // namespace Format
+
+/// Scans a token table to see if the next token exists there
+/// returns a pointer to next unparsed byte and updates type member if found
+char *
+Format::Token::scanForToken(const struct TokenTableEntry *table, char *cur)
+{
+    for (const struct TokenTableEntry *lte = table; lte->config != NULL; lte++) {
+        if (strncmp(lte->config, cur, strlen(lte->config)) == 0) {
+            type = lte->token_type;
+            label = lte->config;
+            debugs(46, 7, HERE << "Found token '" << label << "'");
+            return cur + strlen(lte->config);
+        }
+    }
+    return cur;
+}
+
  /* parses a single token. Returns the token length in characters,
   * and fills in the lt item with the token information.
   * def is for sure null-terminated
@@ -168,7 +213,6 @@ Format::Token::parse(char *def, Quoting *quoting)
  {
      char *cur = def;
  
-    struct TokenTableEntry *lte;
      int l;
  
      l = strcspn(cur, "%");
@@ -275,28 +319,52 @@ Format::Token::parse(char *def, Quoting *quoting)
              cur++;
      }
  
-    // For upward compatibility, assume "http::" prefix as default prefix
-    // for all log access formating codes, except those starting
-    // from "icap::", "adapt::" and "%"
-    if (strncmp(cur,"http::", 6) == 0 &&
-            strncmp(cur+6, "icap::", 6) != 0  &&
-            strncmp(cur+6, "adapt::", 12) != 0 && *(cur+6) != '%' ) {
-        cur += 6;
-    }
-
      type = LFT_NONE;
  
-    for (lte = TokenTable; lte->config != NULL; lte++) {
-        if (strncmp(lte->config, cur, strlen(lte->config)) == 0) {
-            type = lte->token_type;
-            cur += strlen(lte->config);
-            break;
+    // Scan each token namespace
+    if (strncmp(cur, "icap::", 6) == 0) {
+#if ICAP_CLIENT
+        cur += 6;
+        debugs(46, 5, HERE << "scan for icap:: token");
+        cur = scanForToken(TokenTableIcap, cur);
+#else
+        debugs(46, DBG_IMPORTANT, "ERROR: Format uses icap:: token. ICAP disabled!");
+#endif
+    } else if (strncmp(cur, "adapt::", 7) == 0) {
+#if USE_ADAPTATION
+        cur += 7;
+        debugs(46, 5, HERE << "scan for adapt:: token");
+        cur = scanForToken(TokenTableAdapt, cur);
+#else
+        debugs(46, DBG_IMPORTANT, "ERROR: Format uses adapt:: token. Adaptation disabled!");
+#endif
+    } else {
+        // For upward compatibility, assume "http::" prefix as default prefix
+        // for all log access formating codes, except those starting with a
+        // "%" or a known namespace. (ie "icap::", "adapt::")
+        if (strncmp(cur,"http::", 6) == 0 && *(cur+6) != '%' )
+            cur += 6;
+
+        // NP: scan the sets of tokens in decreasing size to guarantee no
+        //     mistakes made with overlapping names. (Bug 3310)
+
+        // Scan for various long tokens
+        debugs(46, 5, HERE << "scan for possible Misc token");
+        cur = scanForToken(TokenTableMisc, cur);
+        // scan for 2-char tokens
+        if (type == LFT_NONE) {
+        debugs(46, 5, HERE << "scan for possible 2C token");
+            cur = scanForToken(TokenTable2C, cur);
+        }
+        // finally scan for 1-char tokens.
+        if (type == LFT_NONE) {
+            debugs(46, 5, HERE << "scan for possible 1C token");
+            cur = scanForToken(TokenTable1C, cur);
          }
      }
  
      if (type == LFT_NONE) {
-        fatalf("Can't parse configuration token: '%s'\n",
-               def);
+        fatalf("Can't parse configuration token: '%s'\n", def);
      }
  
      if (*cur == ' ') {
@@ -467,6 +535,7 @@ done:
  
  Format::Token::~Token()
  {
+    label = NULL; // drop reference to global static.
      safe_free(data.string);
      while (next) {
          Token *tokens = next;
diff --git a/src/format/Tokens.h b/src/format/Tokens.h

index d79552c8e47cc0bcd355e517653dc3d55e6b7617..a609718e5bd2bcde5e91604258b78299b00042c9 100644 (file)
--- a/src/format/Tokens.h
+++ b/src/format/Tokens.h
@@ -174,11 +174,18 @@ enum Quoting {
      LOG_QUOTE_RAW
  };
  
+struct TokenTableEntry {
+    const char *config;
+    ByteCode_t token_type;
+    int options;
+};
+
  // XXX: inherit from linked list
  class Token
  {
  public:
      Token() : type(LFT_NONE),
+            label(NULL),
              width(0),
              precision(0),
              quote(LOG_QUOTE_NONE),
@@ -197,6 +204,7 @@ public:
      int parse(char *def, enum Quoting *quote);
  
      ByteCode_t type;
+    const char *label;
      union {
          char *string;
  
@@ -215,16 +223,12 @@ public:
      unsigned int zero:1;
      int divisor;
      Token *next;       /* todo: move from linked list to array */
-};
  
-struct TokenTableEntry {
-    const char *config;
-    ByteCode_t token_type;
-    int options;
+private:
+    char *scanForToken(const struct TokenTableEntry *table, char *cur);
  };
  
  extern const char *log_tags[];
-extern struct TokenTableEntry TokenTable[];
  
  } // namespace Format
author	Amos Jeffries <squid3@treenet.co.nz>
	Thu, 25 Aug 2011 12:32:02 +0000 (00:32 +1200)
committer	Amos Jeffries <squid3@treenet.co.nz>
	Thu, 25 Aug 2011 12:32:02 +0000 (00:32 +1200)
src/format/Format.cc		patch \| blob \| blame \| history
src/format/Tokens.cc		patch \| blob \| blame \| history
src/format/Tokens.h		patch \| blob \| blame \| history