Fix incremental JSON parser numeric token reassembly across chunks.

author Andrew Dunstan <andrew@dunslane.net>
Thu, 9 Apr 2026 11:57:07 +0000 (07:57 -0400)

committer Andrew Dunstan <andrew@dunslane.net>
Fri, 10 Apr 2026 11:13:08 +0000 (07:13 -0400)
diff --git a/src/common/jsonapi.c b/src/common/jsonapi.c

index 1145d93945f3ac49a5ca82a37a69335921287b8c..12e40f2d564fda0b5c4695e0804815bd746dad77 100644 (file)
--- a/src/common/jsonapi.c
+++ b/src/common/jsonapi.c
@@ -1670,9 +1670,31 @@ json_lex(JsonLexContext *lex)
  
                         if (c == '-' || (c >= '0' && c <= '9'))
                         {
-                               /* for numbers look for possible numeric continuations */
-
+                               /*
+                                * Accumulate numeric continuations, respecting JSON number
+                                * grammar: -? int [frac] [exp]
+                                *
+                                * We must track what parts of the number we've already seen
+                                * so we don't over-consume.  '.' is valid only once and not
+                                * after 'e'/'E'; 'e'/'E' is valid only once; '+'/'-' are
+                                * valid only immediately after 'e'/'E'.
+                                */
                                 bool            numend = false;
+                               bool            seen_dot = false;
+                               bool            seen_exp = false;
+                               char            prev;
+
+                               /* Scan existing partial token for state */
+                               for (int j = 0; j < ptok->len; j++)
+                               {
+                                       char            pc = ptok->data[j];
+
+                                       if (pc == '.')
+                                               seen_dot = true;
+                                       else if (pc == 'e' || pc == 'E')
+                                               seen_exp = true;
+                               }
+                               prev = ptok->data[ptok->len - 1];
  
                                 for (size_t i = 0; i < lex->input_length && !numend; i++)
                                 {
@@ -1682,8 +1704,35 @@ json_lex(JsonLexContext *lex)
                                         {
                                                 case '+':
                                                 case '-':
+                                                       if (prev != 'e' && prev != 'E')
+                                                       {
+                                                               numend = true;
+                                                               break;
+                                                       }
+                                                       jsonapi_appendStringInfoCharMacro(ptok, cc);
+                                                       added++;
+                                                       break;
+                                               case '.':
+                                                       if (seen_dot || seen_exp)
+                                                       {
+                                                               numend = true;
+                                                               break;
+                                                       }
+                                                       seen_dot = true;
+                                                       jsonapi_appendStringInfoCharMacro(ptok, cc);
+                                                       added++;
+                                                       break;
                                                 case 'e':
                                                 case 'E':
+                                                       if (seen_exp)
+                                                       {
+                                                               numend = true;
+                                                               break;
+                                                       }
+                                                       seen_exp = true;
+                                                       jsonapi_appendStringInfoCharMacro(ptok, cc);
+                                                       added++;
+                                                       break;
                                                 case '0':
                                                 case '1':
                                                 case '2':
@@ -1694,14 +1743,14 @@ json_lex(JsonLexContext *lex)
                                                 case '7':
                                                 case '8':
                                                 case '9':
-                                                       {
-                                                               jsonapi_appendStringInfoCharMacro(ptok, cc);
-                                                               added++;
-                                                       }
+                                                       jsonapi_appendStringInfoCharMacro(ptok, cc);
+                                                       added++;
                                                         break;
                                                 default:
                                                         numend = true;
                                         }
+                                       if (!numend)
+                                               prev = cc;
                                 }
                         }
author	Andrew Dunstan <andrew@dunslane.net>
	Thu, 9 Apr 2026 11:57:07 +0000 (07:57 -0400)
committer	Andrew Dunstan <andrew@dunslane.net>
	Fri, 10 Apr 2026 11:13:08 +0000 (07:13 -0400)