]> git.ipfire.org Git - thirdparty/binutils-gdb.git/blob - gdb/xml-support.c
08524f85309dc8af7ab2d3f74f1929d28984194f
[thirdparty/binutils-gdb.git] / gdb / xml-support.c
1 /* Helper routines for parsing XML using Expat.
2
3 Copyright (C) 2006-2025 Free Software Foundation, Inc.
4
5 This file is part of GDB.
6
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
11
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with this program. If not, see <http://www.gnu.org/licenses/>. */
19
20 #include "cli/cli-cmds.h"
21 #include "xml-builtin.h"
22 #include "xml-support.h"
23 #include "gdbsupport/filestuff.h"
24 #include "gdbsupport/gdb-safe-ctype.h"
25 #include <vector>
26 #include <string>
27
/* Set when XML parser debugging output is wanted.  Checked by
   gdb_xml_debug and by the unknown-attribute scan in
   gdb_xml_parser::start_element; its address is handed to the "xml"
   set/show command registered at the end of this file.  */
static bool debug_xml = false;
30
31 /* The contents of this file are only useful if XML support is
32 available. */
33 #ifdef HAVE_LIBEXPAT
34
35 #include "gdb_expat.h"
36
/* The maximum depth of <xi:include> nesting.  No need to be miserly,
   we just want to avoid running out of stack on loops.  An include
   depth greater than this value is reported as a parse error by
   xinclude_start_include.  */
#define MAX_XINCLUDE_DEPTH 30
40
41 /* Simplified XML parser infrastructure. */
42
43 /* A parsing level -- used to keep track of the current element
44 nesting. */
45 struct scope_level
46 {
47 explicit scope_level (const gdb_xml_element *elements_ = NULL)
48 : elements (elements_),
49 element (NULL),
50 seen (0)
51 {}
52
53 /* Elements we allow at this level. */
54 const struct gdb_xml_element *elements;
55
56 /* The element which we are within. */
57 const struct gdb_xml_element *element;
58
59 /* Mask of which elements we've seen at this level (used for
60 optional and repeatable checking). */
61 unsigned int seen;
62
63 /* Body text accumulation. */
64 std::string body;
65 };
66
67 /* The parser itself, and our additional state. */
68 struct gdb_xml_parser
69 {
70 gdb_xml_parser (const char *name,
71 const gdb_xml_element *elements,
72 void *user_data);
73 ~gdb_xml_parser();
74
75 /* Associate DTD_NAME, which must be the name of a compiled-in DTD,
76 with the parser. */
77 void use_dtd (const char *dtd_name);
78
79 /* Return the name of the expected / default DTD, if specified. */
80 const char *dtd_name ()
81 { return m_dtd_name; }
82
83 /* Invoke the parser on BUFFER. BUFFER is the data to parse, which
84 should be NUL-terminated.
85
86 The return value is 0 for success or -1 for error. It may throw,
87 but only if something unexpected goes wrong during parsing; parse
88 errors will be caught, warned about, and reported as failure. */
89 int parse (const char *buffer);
90
91 /* Issue a debugging message. */
92 void vdebug (const char *format, va_list ap)
93 ATTRIBUTE_PRINTF (2, 0);
94
95 /* Issue an error message, and stop parsing. */
96 [[noreturn]] void verror (const char *format, va_list ap)
97 ATTRIBUTE_PRINTF (2, 0);
98
99 void body_text (const XML_Char *text, int length);
100 void start_element (const XML_Char *name, const XML_Char **attrs);
101 void end_element (const XML_Char *name);
102
103 /* Return the name of this parser. */
104 const char *name ()
105 { return m_name; }
106
107 /* Return the user's callback data, for handlers. */
108 void *user_data ()
109 { return m_user_data; };
110
111 /* Are we the special <xi:include> parser? */
112 void set_is_xinclude (bool is_xinclude)
113 { m_is_xinclude = is_xinclude; }
114
115 /* A thrown error, if any. */
116 void set_error (gdb_exception &&error)
117 {
118 m_error = std::move (error);
119 #ifdef HAVE_XML_STOPPARSER
120 XML_StopParser (m_expat_parser, XML_FALSE);
121 #endif
122 }
123
124 /* Return the underlying expat parser. */
125 XML_Parser expat_parser ()
126 { return m_expat_parser; }
127
128 private:
129 /* The underlying expat parser. */
130 XML_Parser m_expat_parser;
131
132 /* Name of this parser. */
133 const char *m_name;
134
135 /* The user's callback data, for handlers. */
136 void *m_user_data;
137
138 /* Scoping stack. */
139 std::vector<scope_level> m_scopes;
140
141 /* A thrown error, if any. */
142 struct gdb_exception m_error;
143
144 /* The line of the thrown error, or 0. */
145 int m_last_line;
146
147 /* The name of the expected / default DTD, if specified. */
148 const char *m_dtd_name;
149
150 /* Are we the special <xi:include> parser? */
151 bool m_is_xinclude;
152 };
153
154 /* Process some body text. We accumulate the text for later use; it's
155 wrong to do anything with it immediately, because a single block of
156 text might be broken up into multiple calls to this function. */
157
158 void
159 gdb_xml_parser::body_text (const XML_Char *text, int length)
160 {
161 if (m_error.reason < 0)
162 return;
163
164 scope_level &scope = m_scopes.back ();
165 scope.body.append (text, length);
166 }
167
168 static void
169 gdb_xml_body_text (void *data, const XML_Char *text, int length)
170 {
171 struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data;
172
173 parser->body_text (text, length);
174 }
175
176 /* Issue a debugging message from one of PARSER's handlers. */
177
178 void
179 gdb_xml_parser::vdebug (const char *format, va_list ap)
180 {
181 int line = XML_GetCurrentLineNumber (m_expat_parser);
182
183 std::string message = string_vprintf (format, ap);
184 if (line)
185 gdb_printf (gdb_stderr, "%s (line %d): %s\n",
186 m_name, line, message.c_str ());
187 else
188 gdb_printf (gdb_stderr, "%s: %s\n",
189 m_name, message.c_str ());
190 }
191
192 void
193 gdb_xml_debug (struct gdb_xml_parser *parser, const char *format, ...)
194 {
195 if (!debug_xml)
196 return;
197
198 va_list ap;
199 va_start (ap, format);
200 parser->vdebug (format, ap);
201 va_end (ap);
202 }
203
204 /* Issue an error message from one of PARSER's handlers, and stop
205 parsing. */
206
207 void
208 gdb_xml_parser::verror (const char *format, va_list ap)
209 {
210 int line = XML_GetCurrentLineNumber (m_expat_parser);
211
212 m_last_line = line;
213 throw_verror (XML_PARSE_ERROR, format, ap);
214 }
215
216 void
217 gdb_xml_error (struct gdb_xml_parser *parser, const char *format, ...)
218 {
219 va_list ap;
220 va_start (ap, format);
221 parser->verror (format, ap);
222 va_end (ap);
223 }
224
225 /* Find the attribute named NAME in the set of parsed attributes
226 ATTRIBUTES. Returns NULL if not found. */
227
228 struct gdb_xml_value *
229 xml_find_attribute (std::vector<gdb_xml_value> &attributes,
230 const char *name)
231 {
232 for (gdb_xml_value &value : attributes)
233 if (strcmp (value.name, name) == 0)
234 return &value;
235
236 return NULL;
237 }
238
239 /* Handle the start of an element. NAME is the element, and ATTRS are
240 the names and values of this element's attributes. */
241
242 void
243 gdb_xml_parser::start_element (const XML_Char *name,
244 const XML_Char **attrs)
245 {
246 if (m_error.reason < 0)
247 return;
248
249 const struct gdb_xml_element *element;
250 const struct gdb_xml_attribute *attribute;
251 unsigned int seen;
252
253 /* Push an error scope. If we return or throw an exception before
254 filling this in, it will tell us to ignore children of this
255 element. Note we don't take a reference to the element yet
256 because further below we'll process the element which may recurse
257 back here and push more elements to the vector. When the
258 recursion unrolls all such elements will have been popped back
259 already, but if one of those pushes reallocates the vector,
260 previous element references will be invalidated. */
261 m_scopes.emplace_back ();
262
263 /* Get a reference to the current scope. */
264 scope_level &scope = m_scopes[m_scopes.size () - 2];
265
266 gdb_xml_debug (this, _("Entering element <%s>"), name);
267
268 /* Find this element in the list of the current scope's allowed
269 children. Record that we've seen it. */
270
271 seen = 1;
272 for (element = scope.elements; element && element->name;
273 element++, seen <<= 1)
274 if (strcmp (element->name, name) == 0)
275 break;
276
277 if (element == NULL || element->name == NULL)
278 {
279 /* If we're working on XInclude, <xi:include> can be the child
280 of absolutely anything. Copy the previous scope's element
281 list into the new scope even if there was no match. */
282 if (m_is_xinclude)
283 {
284 XML_DefaultCurrent (m_expat_parser);
285
286 scope_level &unknown_scope = m_scopes.back ();
287 unknown_scope.elements = scope.elements;
288 return;
289 }
290
291 gdb_xml_debug (this, _("Element <%s> unknown"), name);
292 return;
293 }
294
295 if (!(element->flags & GDB_XML_EF_REPEATABLE) && (seen & scope.seen))
296 gdb_xml_error (this, _("Element <%s> only expected once"), name);
297
298 scope.seen |= seen;
299
300 std::vector<gdb_xml_value> attributes;
301
302 for (attribute = element->attributes;
303 attribute != NULL && attribute->name != NULL;
304 attribute++)
305 {
306 const char *val = NULL;
307 const XML_Char **p;
308 void *parsed_value;
309
310 for (p = attrs; *p != NULL; p += 2)
311 if (!strcmp (attribute->name, p[0]))
312 {
313 val = p[1];
314 break;
315 }
316
317 if (*p != NULL && val == NULL)
318 {
319 gdb_xml_debug (this, _("Attribute \"%s\" missing a value"),
320 attribute->name);
321 continue;
322 }
323
324 if (*p == NULL && !(attribute->flags & GDB_XML_AF_OPTIONAL))
325 {
326 gdb_xml_error (this, _("Required attribute \"%s\" of "
327 "<%s> not specified"),
328 attribute->name, element->name);
329 continue;
330 }
331
332 if (*p == NULL)
333 continue;
334
335 gdb_xml_debug (this, _("Parsing attribute %s=\"%s\""),
336 attribute->name, val);
337
338 if (attribute->handler)
339 parsed_value = attribute->handler (this, attribute, val);
340 else
341 parsed_value = xstrdup (val);
342
343 attributes.emplace_back (attribute->name, parsed_value);
344 }
345
346 /* Check for unrecognized attributes. */
347 if (debug_xml)
348 {
349 const XML_Char **p;
350
351 for (p = attrs; *p != NULL; p += 2)
352 {
353 for (attribute = element->attributes;
354 attribute != NULL && attribute->name != NULL;
355 attribute++)
356 if (strcmp (attribute->name, *p) == 0)
357 break;
358
359 if (attribute == NULL || attribute->name == NULL)
360 gdb_xml_debug (this, _("Ignoring unknown attribute %s"), *p);
361 }
362 }
363
364 /* Call the element handler if there is one. */
365 if (element->start_handler)
366 element->start_handler (this, element, m_user_data, attributes);
367
368 /* Fill in a new scope level. Note that we must delay getting a
369 back reference till here because above we might have recursed,
370 which may have reallocated the vector which invalidates
371 iterators/pointers/references. */
372 scope_level &new_scope = m_scopes.back ();
373 new_scope.element = element;
374 new_scope.elements = element->children;
375 }
376
377 /* Wrapper for gdb_xml_start_element, to prevent throwing exceptions
378 through expat. */
379
380 static void
381 gdb_xml_start_element_wrapper (void *data, const XML_Char *name,
382 const XML_Char **attrs)
383 {
384 struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data;
385
386 try
387 {
388 parser->start_element (name, attrs);
389 }
390 catch (gdb_exception &ex)
391 {
392 parser->set_error (std::move (ex));
393 }
394 }
395
396 /* Handle the end of an element. NAME is the current element. */
397
398 void
399 gdb_xml_parser::end_element (const XML_Char *name)
400 {
401 if (m_error.reason < 0)
402 return;
403
404 struct scope_level *scope = &m_scopes.back ();
405 const struct gdb_xml_element *element;
406 unsigned int seen;
407
408 gdb_xml_debug (this, _("Leaving element <%s>"), name);
409
410 for (element = scope->elements, seen = 1;
411 element != NULL && element->name != NULL;
412 element++, seen <<= 1)
413 if ((scope->seen & seen) == 0
414 && (element->flags & GDB_XML_EF_OPTIONAL) == 0)
415 gdb_xml_error (this, _("Required element <%s> is missing"),
416 element->name);
417
418 /* Call the element processor. */
419 if (scope->element != NULL && scope->element->end_handler)
420 {
421 const char *body;
422
423 if (scope->body.empty ())
424 body = "";
425 else
426 {
427 int length;
428
429 length = scope->body.size ();
430 body = scope->body.c_str ();
431
432 /* Strip leading and trailing whitespace. */
433 while (length > 0 && ISSPACE (body[length - 1]))
434 length--;
435 scope->body.erase (length);
436 while (*body && ISSPACE (*body))
437 body++;
438 }
439
440 scope->element->end_handler (this, scope->element,
441 m_user_data, body);
442 }
443 else if (scope->element == NULL)
444 XML_DefaultCurrent (m_expat_parser);
445
446 /* Pop the scope level. */
447 m_scopes.pop_back ();
448 }
449
450 /* Wrapper for gdb_xml_end_element, to prevent throwing exceptions
451 through expat. */
452
453 static void
454 gdb_xml_end_element_wrapper (void *data, const XML_Char *name)
455 {
456 struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data;
457
458 try
459 {
460 parser->end_element (name);
461 }
462 catch (gdb_exception &ex)
463 {
464 parser->set_error (std::move (ex));
465 }
466 }
467
/* Free a parser and all its associated state.  The expat parser
   created by the constructor is released explicitly here.  */

gdb_xml_parser::~gdb_xml_parser ()
{
  XML_ParserFree (m_expat_parser);
}
474
475 /* Initialize a parser. */
476
477 gdb_xml_parser::gdb_xml_parser (const char *name,
478 const gdb_xml_element *elements,
479 void *user_data)
480 : m_name (name),
481 m_user_data (user_data),
482 m_last_line (0),
483 m_dtd_name (NULL),
484 m_is_xinclude (false)
485 {
486 m_expat_parser = XML_ParserCreateNS (NULL, '!');
487 if (m_expat_parser == NULL)
488 malloc_failure (0);
489
490 XML_SetUserData (m_expat_parser, this);
491
492 /* Set the callbacks. */
493 XML_SetElementHandler (m_expat_parser, gdb_xml_start_element_wrapper,
494 gdb_xml_end_element_wrapper);
495 XML_SetCharacterDataHandler (m_expat_parser, gdb_xml_body_text);
496
497 /* Initialize the outer scope. */
498 m_scopes.emplace_back (elements);
499 }
500
501 /* External entity handler. The only external entities we support
502 are those compiled into GDB (we do not fetch entities from the
503 target). */
504
505 static int XMLCALL
506 gdb_xml_fetch_external_entity (XML_Parser expat_parser,
507 const XML_Char *context,
508 const XML_Char *base,
509 const XML_Char *systemId,
510 const XML_Char *publicId)
511 {
512 XML_Parser entity_parser;
513 const char *text;
514 enum XML_Status status;
515
516 if (systemId == NULL)
517 {
518 gdb_xml_parser *parser
519 = (gdb_xml_parser *) XML_GetUserData (expat_parser);
520
521 text = fetch_xml_builtin (parser->dtd_name ());
522 if (text == NULL)
523 internal_error (_("could not locate built-in DTD %s"),
524 parser->dtd_name ());
525 }
526 else
527 {
528 text = fetch_xml_builtin (systemId);
529 if (text == NULL)
530 return XML_STATUS_ERROR;
531 }
532
533 entity_parser = XML_ExternalEntityParserCreate (expat_parser,
534 context, NULL);
535
536 /* Don't use our handlers for the contents of the DTD. Just let expat
537 process it. */
538 XML_SetElementHandler (entity_parser, NULL, NULL);
539 XML_SetDoctypeDeclHandler (entity_parser, NULL, NULL);
540 XML_SetXmlDeclHandler (entity_parser, NULL);
541 XML_SetDefaultHandler (entity_parser, NULL);
542 XML_SetUserData (entity_parser, NULL);
543
544 status = XML_Parse (entity_parser, text, strlen (text), 1);
545
546 XML_ParserFree (entity_parser);
547 return status;
548 }
549
550 void
551 gdb_xml_parser::use_dtd (const char *dtd_name)
552 {
553 enum XML_Error err;
554
555 m_dtd_name = dtd_name;
556
557 XML_SetParamEntityParsing (m_expat_parser,
558 XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE);
559 XML_SetExternalEntityRefHandler (m_expat_parser,
560 gdb_xml_fetch_external_entity);
561
562 /* Even if no DTD is provided, use the built-in DTD anyway. */
563 err = XML_UseForeignDTD (m_expat_parser, XML_TRUE);
564 if (err != XML_ERROR_NONE)
565 internal_error (_("XML_UseForeignDTD failed: %s"),
566 XML_ErrorString (err));
567 }
568
569 /* Invoke PARSER on BUFFER. BUFFER is the data to parse, which
570 should be NUL-terminated.
571
572 The return value is 0 for success or -1 for error. It may throw,
573 but only if something unexpected goes wrong during parsing; parse
574 errors will be caught, warned about, and reported as failure. */
575
576 int
577 gdb_xml_parser::parse (const char *buffer)
578 {
579 enum XML_Status status;
580 const char *error_string;
581
582 gdb_xml_debug (this, _("Starting:\n%s"), buffer);
583
584 status = XML_Parse (m_expat_parser, buffer, strlen (buffer), 1);
585
586 if (status == XML_STATUS_OK && m_error.reason == 0)
587 return 0;
588
589 if (m_error.reason == RETURN_ERROR
590 && m_error.error == XML_PARSE_ERROR)
591 {
592 gdb_assert (m_error.message != NULL);
593 error_string = m_error.what ();
594 }
595 else if (status == XML_STATUS_ERROR)
596 {
597 enum XML_Error err = XML_GetErrorCode (m_expat_parser);
598
599 error_string = XML_ErrorString (err);
600 }
601 else
602 {
603 gdb_assert (m_error.reason < 0);
604 throw_exception (std::move (m_error));
605 }
606
607 if (m_last_line != 0)
608 warning (_("while parsing %s (at line %d): %s"), m_name,
609 m_last_line, error_string);
610 else
611 warning (_("while parsing %s: %s"), m_name, error_string);
612
613 return -1;
614 }
615
616 int
617 gdb_xml_parse_quick (const char *name, const char *dtd_name,
618 const struct gdb_xml_element *elements,
619 const char *document, void *user_data)
620 {
621 gdb_xml_parser parser (name, elements, user_data);
622 if (dtd_name != NULL)
623 parser.use_dtd (dtd_name);
624 return parser.parse (document);
625 }
626
627 /* Parse a field VALSTR that we expect to contain an integer value.
628 The integer is returned in *VALP. The string is parsed with an
629 equivalent to strtoul.
630
631 Returns 0 for success, -1 for error. */
632
633 static int
634 xml_parse_unsigned_integer (const char *valstr, ULONGEST *valp)
635 {
636 const char *endptr;
637 ULONGEST result;
638
639 if (*valstr == '\0')
640 return -1;
641
642 result = strtoulst (valstr, &endptr, 0);
643 if (*endptr != '\0')
644 return -1;
645
646 *valp = result;
647 return 0;
648 }
649
650 /* Parse an integer string into a ULONGEST and return it, or call
651 gdb_xml_error if it could not be parsed. */
652
653 ULONGEST
654 gdb_xml_parse_ulongest (struct gdb_xml_parser *parser, const char *value)
655 {
656 ULONGEST result;
657
658 if (xml_parse_unsigned_integer (value, &result) != 0)
659 gdb_xml_error (parser, _("Can't convert \"%s\" to an integer"), value);
660
661 return result;
662 }
663
664 /* Parse an integer attribute into a ULONGEST. */
665
666 void *
667 gdb_xml_parse_attr_ulongest (struct gdb_xml_parser *parser,
668 const struct gdb_xml_attribute *attribute,
669 const char *value)
670 {
671 ULONGEST result;
672 void *ret;
673
674 if (xml_parse_unsigned_integer (value, &result) != 0)
675 gdb_xml_error (parser, _("Can't convert %s=\"%s\" to an integer"),
676 attribute->name, value);
677
678 ret = XNEW (ULONGEST);
679 memcpy (ret, &result, sizeof (result));
680 return ret;
681 }
682
683 /* A handler_data for yes/no boolean values. */
684
685 const struct gdb_xml_enum gdb_xml_enums_boolean[] = {
686 { "yes", 1 },
687 { "no", 0 },
688 { NULL, 0 }
689 };
690
691 /* Map NAME to VALUE. A struct gdb_xml_enum * should be saved as the
692 value of handler_data when using gdb_xml_parse_attr_enum to parse a
693 fixed list of possible strings. The list is terminated by an entry
694 with NAME == NULL. */
695
696 void *
697 gdb_xml_parse_attr_enum (struct gdb_xml_parser *parser,
698 const struct gdb_xml_attribute *attribute,
699 const char *value)
700 {
701 const struct gdb_xml_enum *enums
702 = (const struct gdb_xml_enum *) attribute->handler_data;
703 void *ret;
704
705 for (enums = (const struct gdb_xml_enum *) attribute->handler_data;
706 enums->name != NULL; enums++)
707 if (strcasecmp (enums->name, value) == 0)
708 break;
709
710 if (enums->name == NULL)
711 gdb_xml_error (parser, _("Unknown attribute value %s=\"%s\""),
712 attribute->name, value);
713
714 ret = xmalloc (sizeof (enums->value));
715 memcpy (ret, &enums->value, sizeof (enums->value));
716 return ret;
717 }
718 \f
719
720 /* XInclude processing. This is done as a separate step from actually
721 parsing the document, so that we can produce a single combined XML
722 document - e.g. to hand to a front end or to simplify comparing two
723 documents. We make extensive use of XML_DefaultCurrent, to pass
724 input text directly into the output without reformatting or
725 requoting it.
726
727 We output the DOCTYPE declaration for the first document unchanged,
728 if present, and discard DOCTYPEs from included documents. Only the
729 one we pass through here is used when we feed the result back to
730 expat. The XInclude standard explicitly does not discuss
731 validation of the result; we choose to apply the same DTD applied
732 to the outermost document.
733
734 We can not simply include the external DTD subset in the document
735 as an internal subset, because <!IGNORE> and <!INCLUDE> are valid
736 only in external subsets. But if we do not pass the DTD into the
737 output at all, default values will not be filled in.
738
739 We don't pass through any <?xml> declaration because we generate
740 UTF-8, not whatever the input encoding was. */
741
742 struct xinclude_parsing_data
743 {
744 xinclude_parsing_data (std::string &output_,
745 xml_fetch_another fetcher_,
746 int include_depth_)
747 : output (output_),
748 skip_depth (0),
749 include_depth (include_depth_),
750 fetcher (fetcher_)
751 {}
752
753 /* Where the output goes. */
754 std::string &output;
755
756 /* A count indicating whether we are in an element whose
757 children should not be copied to the output, and if so,
758 how deep we are nested. This is used for anything inside
759 an xi:include, and for the DTD. */
760 int skip_depth;
761
762 /* The number of <xi:include> elements currently being processed,
763 to detect loops. */
764 int include_depth;
765
766 /* A function to call to obtain additional features, and its
767 baton. */
768 xml_fetch_another fetcher;
769 };
770
771 static void
772 xinclude_start_include (struct gdb_xml_parser *parser,
773 const struct gdb_xml_element *element,
774 void *user_data,
775 std::vector<gdb_xml_value> &attributes)
776 {
777 struct xinclude_parsing_data *data
778 = (struct xinclude_parsing_data *) user_data;
779 char *href = (char *) xml_find_attribute (attributes, "href")->value.get ();
780
781 gdb_xml_debug (parser, _("Processing XInclude of \"%s\""), href);
782
783 if (data->include_depth > MAX_XINCLUDE_DEPTH)
784 gdb_xml_error (parser, _("Maximum XInclude depth (%d) exceeded"),
785 MAX_XINCLUDE_DEPTH);
786
787 std::optional<gdb::char_vector> text = data->fetcher (href);
788 if (!text)
789 gdb_xml_error (parser, _("Could not load XML document \"%s\""), href);
790
791 if (!xml_process_xincludes (data->output, parser->name (),
792 text->data (), data->fetcher,
793 data->include_depth + 1))
794 gdb_xml_error (parser, _("Parsing \"%s\" failed"), href);
795
796 data->skip_depth++;
797 }
798
799 static void
800 xinclude_end_include (struct gdb_xml_parser *parser,
801 const struct gdb_xml_element *element,
802 void *user_data, const char *body_text)
803 {
804 struct xinclude_parsing_data *data
805 = (struct xinclude_parsing_data *) user_data;
806
807 data->skip_depth--;
808 }
809
810 static void XMLCALL
811 xml_xinclude_default (void *data_, const XML_Char *s, int len)
812 {
813 struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data_;
814 xinclude_parsing_data *data = (xinclude_parsing_data *) parser->user_data ();
815
816 /* If we are inside of e.g. xi:include or the DTD, don't save this
817 string. */
818 if (data->skip_depth)
819 return;
820
821 /* Otherwise just add it to the end of the document we're building
822 up. */
823 data->output.append (s, len);
824 }
825
826 static void XMLCALL
827 xml_xinclude_start_doctype (void *data_, const XML_Char *doctypeName,
828 const XML_Char *sysid, const XML_Char *pubid,
829 int has_internal_subset)
830 {
831 struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data_;
832 xinclude_parsing_data *data = (xinclude_parsing_data *) parser->user_data ();
833
834 /* Don't print out the doctype, or the contents of the DTD internal
835 subset, if any. */
836 data->skip_depth++;
837 }
838
839 static void XMLCALL
840 xml_xinclude_end_doctype (void *data_)
841 {
842 struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data_;
843 xinclude_parsing_data *data = (xinclude_parsing_data *) parser->user_data ();
844
845 data->skip_depth--;
846 }
847
/* Expat XML-declaration handler used during XInclude processing.
   All arguments are ignored.  */

static void XMLCALL
xml_xinclude_xml_decl (void *data_, const XML_Char *version,
                       const XML_Char *encoding, int standalone)
{
  /* Do nothing - this function prevents the default handler from
     being called, thus suppressing the XML declaration from the
     output.  */
}
856
857 const struct gdb_xml_attribute xinclude_attributes[] = {
858 { "href", GDB_XML_AF_NONE, NULL, NULL },
859 { NULL, GDB_XML_AF_NONE, NULL, NULL }
860 };
861
862 const struct gdb_xml_element xinclude_elements[] = {
863 { "http://www.w3.org/2001/XInclude!include", xinclude_attributes, NULL,
864 GDB_XML_EF_OPTIONAL | GDB_XML_EF_REPEATABLE,
865 xinclude_start_include, xinclude_end_include },
866 { NULL, NULL, NULL, GDB_XML_EF_NONE, NULL, NULL }
867 };
868
869 /* The main entry point for <xi:include> processing. */
870
871 bool
872 xml_process_xincludes (std::string &result,
873 const char *name, const char *text,
874 xml_fetch_another fetcher, int depth)
875 {
876 xinclude_parsing_data data (result, fetcher, depth);
877
878 gdb_xml_parser parser (name, xinclude_elements, &data);
879 parser.set_is_xinclude (true);
880
881 XML_SetCharacterDataHandler (parser.expat_parser (), NULL);
882 XML_SetDefaultHandler (parser.expat_parser (), xml_xinclude_default);
883
884 /* Always discard the XML version declarations; the only important
885 thing this provides is encoding, and our result will have been
886 converted to UTF-8. */
887 XML_SetXmlDeclHandler (parser.expat_parser (), xml_xinclude_xml_decl);
888
889 if (depth > 0)
890 /* Discard the doctype for included documents. */
891 XML_SetDoctypeDeclHandler (parser.expat_parser (),
892 xml_xinclude_start_doctype,
893 xml_xinclude_end_doctype);
894
895 parser.use_dtd ("xinclude.dtd");
896
897 if (parser.parse (text) == 0)
898 {
899 if (depth == 0)
900 gdb_xml_debug (&parser, _("XInclude processing succeeded."));
901 return true;
902 }
903
904 return false;
905 }
906 #endif /* HAVE_LIBEXPAT */
907 \f
908
909 /* Return an XML document which was compiled into GDB, from
910 the given FILENAME, or NULL if the file was not compiled in. */
911
912 const char *
913 fetch_xml_builtin (const char *filename)
914 {
915 const char *const (*p)[2];
916
917 for (p = xml_builtin; (*p)[0]; p++)
918 if (strcmp ((*p)[0], filename) == 0)
919 return (*p)[1];
920
921 return NULL;
922 }
923
924 /* A to_xfer_partial helper function which reads XML files which were
925 compiled into GDB. The target may call this function from its own
926 to_xfer_partial handler, after converting object and annex to the
927 appropriate filename. */
928
929 LONGEST
930 xml_builtin_xfer_partial (const char *filename,
931 gdb_byte *readbuf, const gdb_byte *writebuf,
932 ULONGEST offset, LONGEST len)
933 {
934 const char *buf;
935 LONGEST len_avail;
936
937 gdb_assert (readbuf != NULL && writebuf == NULL);
938 gdb_assert (filename != NULL);
939
940 buf = fetch_xml_builtin (filename);
941 if (buf == NULL)
942 return -1;
943
944 len_avail = strlen (buf);
945 if (offset >= len_avail)
946 return 0;
947
948 if (len > len_avail - offset)
949 len = len_avail - offset;
950 memcpy (readbuf, buf + offset, len);
951 return len;
952 }
953 \f
954
/* Show callback for the XML debugging setting registered at the end
   of this file.  Prints VALUE, the setting's current value as a
   string, to FILE.  FROM_TTY and C are unused.  */

static void
show_debug_xml (struct ui_file *file, int from_tty,
                struct cmd_list_element *c, const char *value)
{
  gdb_printf (file, _("XML debugging is %s.\n"), value);
}
961
962 std::optional<gdb::char_vector>
963 xml_fetch_content_from_file (const char *filename, const char *dirname)
964 {
965 gdb_file_up file;
966
967 if (dirname != nullptr && *dirname != '\0')
968 {
969 gdb::unique_xmalloc_ptr<char> fullname
970 (concat (dirname, "/", filename, (char *) NULL));
971
972 file = gdb_fopen_cloexec (fullname.get (), FOPEN_RB);
973 }
974 else
975 file = gdb_fopen_cloexec (filename, FOPEN_RB);
976
977 if (file == NULL)
978 return {};
979
980 /* Read in the whole file. */
981
982 size_t len;
983
984 if (fseek (file.get (), 0, SEEK_END) == -1)
985 perror_with_name (_("seek to end of file"));
986 len = ftell (file.get ());
987 rewind (file.get ());
988
989 gdb::char_vector text (len + 1);
990
991 if (fread (text.data (), 1, len, file.get ()) != len
992 || ferror (file.get ()))
993 {
994 warning (_("Read error from \"%s\""), filename);
995 return {};
996 }
997
998 text.back () = '\0';
999 return text;
1000 }
1001
/* Initialization for this file: register the boolean "xml" setting,
   backed by debug_xml, on the set-debug and show-debug command
   lists.  */

INIT_GDB_FILE (xml_support)
{
  add_setshow_boolean_cmd ("xml", class_maintenance, &debug_xml,
                           _("Set XML parser debugging."),
                           _("Show XML parser debugging."),
                           _("When set, debugging messages for XML parsers "
                             "are displayed."),
                           NULL, show_debug_xml,
                           &setdebuglist, &showdebuglist);
}