xref: /netbsd-src/external/gpl3/gdb/dist/gdb/xml-support.c (revision 9689912e6b171cbda866ec33f15ae94a04e2c02d)
1 /* Helper routines for parsing XML using Expat.
2 
3    Copyright (C) 2006-2024 Free Software Foundation, Inc.
4 
5    This file is part of GDB.
6 
7    This program is free software; you can redistribute it and/or modify
8    it under the terms of the GNU General Public License as published by
9    the Free Software Foundation; either version 3 of the License, or
10    (at your option) any later version.
11 
12    This program is distributed in the hope that it will be useful,
13    but WITHOUT ANY WARRANTY; without even the implied warranty of
14    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15    GNU General Public License for more details.
16 
17    You should have received a copy of the GNU General Public License
18    along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
19 
20 #include "cli/cli-cmds.h"
21 #include "xml-builtin.h"
22 #include "xml-support.h"
23 #include "gdbsupport/filestuff.h"
24 #include "gdbsupport/gdb-safe-ctype.h"
25 #include <vector>
26 #include <string>
27 
28 /* Debugging flag.  */
29 static bool debug_xml;
30 
31 /* The contents of this file are only useful if XML support is
32    available.  */
33 #ifdef HAVE_LIBEXPAT
34 
35 #include "gdb_expat.h"
36 
37 /* The maximum depth of <xi:include> nesting.  No need to be miserly,
38    we just want to avoid running out of stack on loops.  */
39 #define MAX_XINCLUDE_DEPTH 30
40 
41 /* Simplified XML parser infrastructure.  */
42 
43 /* A parsing level -- used to keep track of the current element
44    nesting.  */
45 struct scope_level
46 {
47   explicit scope_level (const gdb_xml_element *elements_ = NULL)
48     : elements (elements_),
49       element (NULL),
50       seen (0)
51   {}
52 
53   /* Elements we allow at this level.  */
54   const struct gdb_xml_element *elements;
55 
56   /* The element which we are within.  */
57   const struct gdb_xml_element *element;
58 
59   /* Mask of which elements we've seen at this level (used for
60      optional and repeatable checking).  */
61   unsigned int seen;
62 
63   /* Body text accumulation.  */
64   std::string body;
65 };
66 
67 /* The parser itself, and our additional state.  */
68 struct gdb_xml_parser
69 {
70   gdb_xml_parser (const char *name,
71 		  const gdb_xml_element *elements,
72 		  void *user_data);
73   ~gdb_xml_parser();
74 
75   /* Associate DTD_NAME, which must be the name of a compiled-in DTD,
76      with the parser.  */
77   void use_dtd (const char *dtd_name);
78 
79   /* Return the name of the expected / default DTD, if specified.  */
80   const char *dtd_name ()
81   { return m_dtd_name; }
82 
83   /* Invoke the parser on BUFFER.  BUFFER is the data to parse, which
84      should be NUL-terminated.
85 
86      The return value is 0 for success or -1 for error.  It may throw,
87      but only if something unexpected goes wrong during parsing; parse
88      errors will be caught, warned about, and reported as failure.  */
89   int parse (const char *buffer);
90 
91   /* Issue a debugging message.  */
92   void vdebug (const char *format, va_list ap)
93     ATTRIBUTE_PRINTF (2, 0);
94 
95   /* Issue an error message, and stop parsing.  */
96   void verror (const char *format, va_list ap)
97     ATTRIBUTE_NORETURN ATTRIBUTE_PRINTF (2, 0);
98 
99   void body_text (const XML_Char *text, int length);
100   void start_element (const XML_Char *name, const XML_Char **attrs);
101   void end_element (const XML_Char *name);
102 
103   /* Return the name of this parser.  */
104   const char *name ()
105   { return m_name; }
106 
107   /* Return the user's callback data, for handlers.  */
108   void *user_data ()
109   { return m_user_data; };
110 
111   /* Are we the special <xi:include> parser?  */
112   void set_is_xinclude (bool is_xinclude)
113   { m_is_xinclude = is_xinclude; }
114 
115   /* A thrown error, if any.  */
116   void set_error (gdb_exception &&error)
117   {
118     m_error = std::move (error);
119 #ifdef HAVE_XML_STOPPARSER
120     XML_StopParser (m_expat_parser, XML_FALSE);
121 #endif
122   }
123 
124   /* Return the underlying expat parser.  */
125   XML_Parser expat_parser ()
126   { return m_expat_parser; }
127 
128 private:
129   /* The underlying expat parser.  */
130   XML_Parser m_expat_parser;
131 
132   /* Name of this parser.  */
133   const char *m_name;
134 
135   /* The user's callback data, for handlers.  */
136   void *m_user_data;
137 
138   /* Scoping stack.  */
139   std::vector<scope_level> m_scopes;
140 
141 /* A thrown error, if any.  */
142   struct gdb_exception m_error;
143 
144   /* The line of the thrown error, or 0.  */
145   int m_last_line;
146 
147   /* The name of the expected / default DTD, if specified.  */
148   const char *m_dtd_name;
149 
150   /* Are we the special <xi:include> parser?  */
151   bool m_is_xinclude;
152 };
153 
154 /* Process some body text.  We accumulate the text for later use; it's
155    wrong to do anything with it immediately, because a single block of
156    text might be broken up into multiple calls to this function.  */
157 
158 void
159 gdb_xml_parser::body_text (const XML_Char *text, int length)
160 {
161   if (m_error.reason < 0)
162     return;
163 
164   scope_level &scope = m_scopes.back ();
165   scope.body.append (text, length);
166 }
167 
168 static void
169 gdb_xml_body_text (void *data, const XML_Char *text, int length)
170 {
171   struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data;
172 
173   parser->body_text (text, length);
174 }
175 
176 /* Issue a debugging message from one of PARSER's handlers.  */
177 
178 void
179 gdb_xml_parser::vdebug (const char *format, va_list ap)
180 {
181   int line = XML_GetCurrentLineNumber (m_expat_parser);
182 
183   std::string message = string_vprintf (format, ap);
184   if (line)
185     gdb_printf (gdb_stderr, "%s (line %d): %s\n",
186 		m_name, line, message.c_str ());
187   else
188     gdb_printf (gdb_stderr, "%s: %s\n",
189 		m_name, message.c_str ());
190 }
191 
192 void
193 gdb_xml_debug (struct gdb_xml_parser *parser, const char *format, ...)
194 {
195   if (!debug_xml)
196     return;
197 
198   va_list ap;
199   va_start (ap, format);
200   parser->vdebug (format, ap);
201   va_end (ap);
202 }
203 
204 /* Issue an error message from one of PARSER's handlers, and stop
205    parsing.  */
206 
207 void
208 gdb_xml_parser::verror (const char *format, va_list ap)
209 {
210   int line = XML_GetCurrentLineNumber (m_expat_parser);
211 
212   m_last_line = line;
213   throw_verror (XML_PARSE_ERROR, format, ap);
214 }
215 
216 void
217 gdb_xml_error (struct gdb_xml_parser *parser, const char *format, ...)
218 {
219   va_list ap;
220   va_start (ap, format);
221   parser->verror (format, ap);
222   va_end (ap);
223 }
224 
225 /* Find the attribute named NAME in the set of parsed attributes
226    ATTRIBUTES.  Returns NULL if not found.  */
227 
228 struct gdb_xml_value *
229 xml_find_attribute (std::vector<gdb_xml_value> &attributes,
230 		    const char *name)
231 {
232   for (gdb_xml_value &value : attributes)
233     if (strcmp (value.name, name) == 0)
234       return &value;
235 
236   return NULL;
237 }
238 
239 /* Handle the start of an element.  NAME is the element, and ATTRS are
240    the names and values of this element's attributes.  */
241 
242 void
243 gdb_xml_parser::start_element (const XML_Char *name,
244 			       const XML_Char **attrs)
245 {
246   if (m_error.reason < 0)
247     return;
248 
249   const struct gdb_xml_element *element;
250   const struct gdb_xml_attribute *attribute;
251   unsigned int seen;
252 
253   /* Push an error scope.  If we return or throw an exception before
254      filling this in, it will tell us to ignore children of this
255      element.  Note we don't take a reference to the element yet
256      because further below we'll process the element which may recurse
257      back here and push more elements to the vector.  When the
258      recursion unrolls all such elements will have been popped back
259      already, but if one of those pushes reallocates the vector,
260      previous element references will be invalidated.  */
261   m_scopes.emplace_back ();
262 
263   /* Get a reference to the current scope.  */
264   scope_level &scope = m_scopes[m_scopes.size () - 2];
265 
266   gdb_xml_debug (this, _("Entering element <%s>"), name);
267 
268   /* Find this element in the list of the current scope's allowed
269      children.  Record that we've seen it.  */
270 
271   seen = 1;
272   for (element = scope.elements; element && element->name;
273        element++, seen <<= 1)
274     if (strcmp (element->name, name) == 0)
275       break;
276 
277   if (element == NULL || element->name == NULL)
278     {
279       /* If we're working on XInclude, <xi:include> can be the child
280 	 of absolutely anything.  Copy the previous scope's element
281 	 list into the new scope even if there was no match.  */
282       if (m_is_xinclude)
283 	{
284 	  XML_DefaultCurrent (m_expat_parser);
285 
286 	  scope_level &unknown_scope = m_scopes.back ();
287 	  unknown_scope.elements = scope.elements;
288 	  return;
289 	}
290 
291       gdb_xml_debug (this, _("Element <%s> unknown"), name);
292       return;
293     }
294 
295   if (!(element->flags & GDB_XML_EF_REPEATABLE) && (seen & scope.seen))
296     gdb_xml_error (this, _("Element <%s> only expected once"), name);
297 
298   scope.seen |= seen;
299 
300   std::vector<gdb_xml_value> attributes;
301 
302   for (attribute = element->attributes;
303        attribute != NULL && attribute->name != NULL;
304        attribute++)
305     {
306       const char *val = NULL;
307       const XML_Char **p;
308       void *parsed_value;
309 
310       for (p = attrs; *p != NULL; p += 2)
311 	if (!strcmp (attribute->name, p[0]))
312 	  {
313 	    val = p[1];
314 	    break;
315 	  }
316 
317       if (*p != NULL && val == NULL)
318 	{
319 	  gdb_xml_debug (this, _("Attribute \"%s\" missing a value"),
320 			 attribute->name);
321 	  continue;
322 	}
323 
324       if (*p == NULL && !(attribute->flags & GDB_XML_AF_OPTIONAL))
325 	{
326 	  gdb_xml_error (this, _("Required attribute \"%s\" of "
327 				   "<%s> not specified"),
328 			 attribute->name, element->name);
329 	  continue;
330 	}
331 
332       if (*p == NULL)
333 	continue;
334 
335       gdb_xml_debug (this, _("Parsing attribute %s=\"%s\""),
336 		     attribute->name, val);
337 
338       if (attribute->handler)
339 	parsed_value = attribute->handler (this, attribute, val);
340       else
341 	parsed_value = xstrdup (val);
342 
343       attributes.emplace_back (attribute->name, parsed_value);
344     }
345 
346   /* Check for unrecognized attributes.  */
347   if (debug_xml)
348     {
349       const XML_Char **p;
350 
351       for (p = attrs; *p != NULL; p += 2)
352 	{
353 	  for (attribute = element->attributes;
354 	       attribute != NULL && attribute->name != NULL;
355 	       attribute++)
356 	    if (strcmp (attribute->name, *p) == 0)
357 	      break;
358 
359 	  if (attribute == NULL || attribute->name == NULL)
360 	    gdb_xml_debug (this, _("Ignoring unknown attribute %s"), *p);
361 	}
362     }
363 
364   /* Call the element handler if there is one.  */
365   if (element->start_handler)
366     element->start_handler (this, element, m_user_data, attributes);
367 
368   /* Fill in a new scope level.  Note that we must delay getting a
369      back reference till here because above we might have recursed,
370      which may have reallocated the vector which invalidates
371      iterators/pointers/references.  */
372   scope_level &new_scope = m_scopes.back ();
373   new_scope.element = element;
374   new_scope.elements = element->children;
375 }
376 
377 /* Wrapper for gdb_xml_start_element, to prevent throwing exceptions
378    through expat.  */
379 
380 static void
381 gdb_xml_start_element_wrapper (void *data, const XML_Char *name,
382 			       const XML_Char **attrs)
383 {
384   struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data;
385 
386   try
387     {
388       parser->start_element (name, attrs);
389     }
390   catch (gdb_exception &ex)
391     {
392       parser->set_error (std::move (ex));
393     }
394 }
395 
396 /* Handle the end of an element.  NAME is the current element.  */
397 
398 void
399 gdb_xml_parser::end_element (const XML_Char *name)
400 {
401   if (m_error.reason < 0)
402     return;
403 
404   struct scope_level *scope = &m_scopes.back ();
405   const struct gdb_xml_element *element;
406   unsigned int seen;
407 
408   gdb_xml_debug (this, _("Leaving element <%s>"), name);
409 
410   for (element = scope->elements, seen = 1;
411        element != NULL && element->name != NULL;
412        element++, seen <<= 1)
413     if ((scope->seen & seen) == 0
414 	&& (element->flags & GDB_XML_EF_OPTIONAL) == 0)
415       gdb_xml_error (this, _("Required element <%s> is missing"),
416 		     element->name);
417 
418   /* Call the element processor.  */
419   if (scope->element != NULL && scope->element->end_handler)
420     {
421       const char *body;
422 
423       if (scope->body.empty ())
424 	body = "";
425       else
426 	{
427 	  int length;
428 
429 	  length = scope->body.size ();
430 	  body = scope->body.c_str ();
431 
432 	  /* Strip leading and trailing whitespace.  */
433 	  while (length > 0 && ISSPACE (body[length - 1]))
434 	    length--;
435 	  scope->body.erase (length);
436 	  while (*body && ISSPACE (*body))
437 	    body++;
438 	}
439 
440       scope->element->end_handler (this, scope->element,
441 				   m_user_data, body);
442     }
443   else if (scope->element == NULL)
444     XML_DefaultCurrent (m_expat_parser);
445 
446   /* Pop the scope level.  */
447   m_scopes.pop_back ();
448 }
449 
450 /* Wrapper for gdb_xml_end_element, to prevent throwing exceptions
451    through expat.  */
452 
453 static void
454 gdb_xml_end_element_wrapper (void *data, const XML_Char *name)
455 {
456   struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data;
457 
458   try
459     {
460       parser->end_element (name);
461     }
462   catch (gdb_exception &ex)
463     {
464       parser->set_error (std::move (ex));
465     }
466 }
467 
468 /* Free a parser and all its associated state.  */
469 
470 gdb_xml_parser::~gdb_xml_parser ()
471 {
472   XML_ParserFree (m_expat_parser);
473 }
474 
475 /* Initialize a parser.  */
476 
477 gdb_xml_parser::gdb_xml_parser (const char *name,
478 				const gdb_xml_element *elements,
479 				void *user_data)
480   : m_name (name),
481     m_user_data (user_data),
482     m_last_line (0),
483     m_dtd_name (NULL),
484     m_is_xinclude (false)
485 {
486   m_expat_parser = XML_ParserCreateNS (NULL, '!');
487   if (m_expat_parser == NULL)
488     malloc_failure (0);
489 
490   XML_SetUserData (m_expat_parser, this);
491 
492   /* Set the callbacks.  */
493   XML_SetElementHandler (m_expat_parser, gdb_xml_start_element_wrapper,
494 			 gdb_xml_end_element_wrapper);
495   XML_SetCharacterDataHandler (m_expat_parser, gdb_xml_body_text);
496 
497   /* Initialize the outer scope.  */
498   m_scopes.emplace_back (elements);
499 }
500 
501 /* External entity handler.  The only external entities we support
502    are those compiled into GDB (we do not fetch entities from the
503    target).  */
504 
505 static int XMLCALL
506 gdb_xml_fetch_external_entity (XML_Parser expat_parser,
507 			       const XML_Char *context,
508 			       const XML_Char *base,
509 			       const XML_Char *systemId,
510 			       const XML_Char *publicId)
511 {
512   XML_Parser entity_parser;
513   const char *text;
514   enum XML_Status status;
515 
516   if (systemId == NULL)
517     {
518       gdb_xml_parser *parser
519 	= (gdb_xml_parser *) XML_GetUserData (expat_parser);
520 
521       text = fetch_xml_builtin (parser->dtd_name ());
522       if (text == NULL)
523 	internal_error (_("could not locate built-in DTD %s"),
524 			parser->dtd_name ());
525     }
526   else
527     {
528       text = fetch_xml_builtin (systemId);
529       if (text == NULL)
530 	return XML_STATUS_ERROR;
531     }
532 
533   entity_parser = XML_ExternalEntityParserCreate (expat_parser,
534 						  context, NULL);
535 
536   /* Don't use our handlers for the contents of the DTD.  Just let expat
537      process it.  */
538   XML_SetElementHandler (entity_parser, NULL, NULL);
539   XML_SetDoctypeDeclHandler (entity_parser, NULL, NULL);
540   XML_SetXmlDeclHandler (entity_parser, NULL);
541   XML_SetDefaultHandler (entity_parser, NULL);
542   XML_SetUserData (entity_parser, NULL);
543 
544   status = XML_Parse (entity_parser, text, strlen (text), 1);
545 
546   XML_ParserFree (entity_parser);
547   return status;
548 }
549 
550 void
551 gdb_xml_parser::use_dtd (const char *dtd_name)
552 {
553   enum XML_Error err;
554 
555   m_dtd_name = dtd_name;
556 
557   XML_SetParamEntityParsing (m_expat_parser,
558 			     XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE);
559   XML_SetExternalEntityRefHandler (m_expat_parser,
560 				   gdb_xml_fetch_external_entity);
561 
562   /* Even if no DTD is provided, use the built-in DTD anyway.  */
563   err = XML_UseForeignDTD (m_expat_parser, XML_TRUE);
564   if (err != XML_ERROR_NONE)
565     internal_error (_("XML_UseForeignDTD failed: %s"),
566 		    XML_ErrorString (err));
567 }
568 
569 /* Invoke PARSER on BUFFER.  BUFFER is the data to parse, which
570    should be NUL-terminated.
571 
572    The return value is 0 for success or -1 for error.  It may throw,
573    but only if something unexpected goes wrong during parsing; parse
574    errors will be caught, warned about, and reported as failure.  */
575 
576 int
577 gdb_xml_parser::parse (const char *buffer)
578 {
579   enum XML_Status status;
580   const char *error_string;
581 
582   gdb_xml_debug (this, _("Starting:\n%s"), buffer);
583 
584   status = XML_Parse (m_expat_parser, buffer, strlen (buffer), 1);
585 
586   if (status == XML_STATUS_OK && m_error.reason == 0)
587     return 0;
588 
589   if (m_error.reason == RETURN_ERROR
590       && m_error.error == XML_PARSE_ERROR)
591     {
592       gdb_assert (m_error.message != NULL);
593       error_string = m_error.what ();
594     }
595   else if (status == XML_STATUS_ERROR)
596     {
597       enum XML_Error err = XML_GetErrorCode (m_expat_parser);
598 
599       error_string = XML_ErrorString (err);
600     }
601   else
602     {
603       gdb_assert (m_error.reason < 0);
604       throw_exception (std::move (m_error));
605     }
606 
607   if (m_last_line != 0)
608     warning (_("while parsing %s (at line %d): %s"), m_name,
609 	     m_last_line, error_string);
610   else
611     warning (_("while parsing %s: %s"), m_name, error_string);
612 
613   return -1;
614 }
615 
616 int
617 gdb_xml_parse_quick (const char *name, const char *dtd_name,
618 		     const struct gdb_xml_element *elements,
619 		     const char *document, void *user_data)
620 {
621   gdb_xml_parser parser (name, elements, user_data);
622   if (dtd_name != NULL)
623     parser.use_dtd (dtd_name);
624   return parser.parse (document);
625 }
626 
627 /* Parse a field VALSTR that we expect to contain an integer value.
628    The integer is returned in *VALP.  The string is parsed with an
629    equivalent to strtoul.
630 
631    Returns 0 for success, -1 for error.  */
632 
633 static int
634 xml_parse_unsigned_integer (const char *valstr, ULONGEST *valp)
635 {
636   const char *endptr;
637   ULONGEST result;
638 
639   if (*valstr == '\0')
640     return -1;
641 
642   result = strtoulst (valstr, &endptr, 0);
643   if (*endptr != '\0')
644     return -1;
645 
646   *valp = result;
647   return 0;
648 }
649 
650 /* Parse an integer string into a ULONGEST and return it, or call
651    gdb_xml_error if it could not be parsed.  */
652 
653 ULONGEST
654 gdb_xml_parse_ulongest (struct gdb_xml_parser *parser, const char *value)
655 {
656   ULONGEST result;
657 
658   if (xml_parse_unsigned_integer (value, &result) != 0)
659     gdb_xml_error (parser, _("Can't convert \"%s\" to an integer"), value);
660 
661   return result;
662 }
663 
664 /* Parse an integer attribute into a ULONGEST.  */
665 
666 void *
667 gdb_xml_parse_attr_ulongest (struct gdb_xml_parser *parser,
668 			     const struct gdb_xml_attribute *attribute,
669 			     const char *value)
670 {
671   ULONGEST result;
672   void *ret;
673 
674   if (xml_parse_unsigned_integer (value, &result) != 0)
675     gdb_xml_error (parser, _("Can't convert %s=\"%s\" to an integer"),
676 		   attribute->name, value);
677 
678   ret = XNEW (ULONGEST);
679   memcpy (ret, &result, sizeof (result));
680   return ret;
681 }
682 
683 /* A handler_data for yes/no boolean values.  */
684 
685 const struct gdb_xml_enum gdb_xml_enums_boolean[] = {
686   { "yes", 1 },
687   { "no", 0 },
688   { NULL, 0 }
689 };
690 
691 /* Map NAME to VALUE.  A struct gdb_xml_enum * should be saved as the
692    value of handler_data when using gdb_xml_parse_attr_enum to parse a
693    fixed list of possible strings.  The list is terminated by an entry
694    with NAME == NULL.  */
695 
696 void *
697 gdb_xml_parse_attr_enum (struct gdb_xml_parser *parser,
698 			 const struct gdb_xml_attribute *attribute,
699 			 const char *value)
700 {
701   const struct gdb_xml_enum *enums
702     = (const struct gdb_xml_enum *) attribute->handler_data;
703   void *ret;
704 
705   for (enums = (const struct gdb_xml_enum *) attribute->handler_data;
706        enums->name != NULL; enums++)
707     if (strcasecmp (enums->name, value) == 0)
708       break;
709 
710   if (enums->name == NULL)
711     gdb_xml_error (parser, _("Unknown attribute value %s=\"%s\""),
712 		 attribute->name, value);
713 
714   ret = xmalloc (sizeof (enums->value));
715   memcpy (ret, &enums->value, sizeof (enums->value));
716   return ret;
717 }
718 
719 
720 /* XInclude processing.  This is done as a separate step from actually
721    parsing the document, so that we can produce a single combined XML
722    document - e.g. to hand to a front end or to simplify comparing two
723    documents.  We make extensive use of XML_DefaultCurrent, to pass
724    input text directly into the output without reformatting or
725    requoting it.
726 
727    We output the DOCTYPE declaration for the first document unchanged,
728    if present, and discard DOCTYPEs from included documents.  Only the
729    one we pass through here is used when we feed the result back to
730    expat.  The XInclude standard explicitly does not discuss
731    validation of the result; we choose to apply the same DTD applied
732    to the outermost document.
733 
734    We can not simply include the external DTD subset in the document
735    as an internal subset, because <!IGNORE> and <!INCLUDE> are valid
736    only in external subsets.  But if we do not pass the DTD into the
737    output at all, default values will not be filled in.
738 
739    We don't pass through any <?xml> declaration because we generate
740    UTF-8, not whatever the input encoding was.  */
741 
742 struct xinclude_parsing_data
743 {
744   xinclude_parsing_data (std::string &output_,
745 			 xml_fetch_another fetcher_,
746 			 int include_depth_)
747     : output (output_),
748       skip_depth (0),
749       include_depth (include_depth_),
750       fetcher (fetcher_)
751   {}
752 
753   /* Where the output goes.  */
754   std::string &output;
755 
756   /* A count indicating whether we are in an element whose
757      children should not be copied to the output, and if so,
758      how deep we are nested.  This is used for anything inside
759      an xi:include, and for the DTD.  */
760   int skip_depth;
761 
762   /* The number of <xi:include> elements currently being processed,
763      to detect loops.  */
764   int include_depth;
765 
766   /* A function to call to obtain additional features, and its
767      baton.  */
768   xml_fetch_another fetcher;
769 };
770 
771 static void
772 xinclude_start_include (struct gdb_xml_parser *parser,
773 			const struct gdb_xml_element *element,
774 			void *user_data,
775 			std::vector<gdb_xml_value> &attributes)
776 {
777   struct xinclude_parsing_data *data
778     = (struct xinclude_parsing_data *) user_data;
779   char *href = (char *) xml_find_attribute (attributes, "href")->value.get ();
780 
781   gdb_xml_debug (parser, _("Processing XInclude of \"%s\""), href);
782 
783   if (data->include_depth > MAX_XINCLUDE_DEPTH)
784     gdb_xml_error (parser, _("Maximum XInclude depth (%d) exceeded"),
785 		   MAX_XINCLUDE_DEPTH);
786 
787   std::optional<gdb::char_vector> text = data->fetcher (href);
788   if (!text)
789     gdb_xml_error (parser, _("Could not load XML document \"%s\""), href);
790 
791   if (!xml_process_xincludes (data->output, parser->name (),
792 			      text->data (), data->fetcher,
793 			      data->include_depth + 1))
794     gdb_xml_error (parser, _("Parsing \"%s\" failed"), href);
795 
796   data->skip_depth++;
797 }
798 
799 static void
800 xinclude_end_include (struct gdb_xml_parser *parser,
801 		      const struct gdb_xml_element *element,
802 		      void *user_data, const char *body_text)
803 {
804   struct xinclude_parsing_data *data
805     = (struct xinclude_parsing_data *) user_data;
806 
807   data->skip_depth--;
808 }
809 
810 static void XMLCALL
811 xml_xinclude_default (void *data_, const XML_Char *s, int len)
812 {
813   struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data_;
814   xinclude_parsing_data *data = (xinclude_parsing_data *) parser->user_data ();
815 
816   /* If we are inside of e.g. xi:include or the DTD, don't save this
817      string.  */
818   if (data->skip_depth)
819     return;
820 
821   /* Otherwise just add it to the end of the document we're building
822      up.  */
823   data->output.append (s, len);
824 }
825 
826 static void XMLCALL
827 xml_xinclude_start_doctype (void *data_, const XML_Char *doctypeName,
828 			    const XML_Char *sysid, const XML_Char *pubid,
829 			    int has_internal_subset)
830 {
831   struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data_;
832   xinclude_parsing_data *data = (xinclude_parsing_data *) parser->user_data ();
833 
834   /* Don't print out the doctype, or the contents of the DTD internal
835      subset, if any.  */
836   data->skip_depth++;
837 }
838 
839 static void XMLCALL
840 xml_xinclude_end_doctype (void *data_)
841 {
842   struct gdb_xml_parser *parser = (struct gdb_xml_parser *) data_;
843   xinclude_parsing_data *data = (xinclude_parsing_data *) parser->user_data ();
844 
845   data->skip_depth--;
846 }
847 
848 static void XMLCALL
849 xml_xinclude_xml_decl (void *data_, const XML_Char *version,
850 		       const XML_Char *encoding, int standalone)
851 {
852   /* Do nothing - this function prevents the default handler from
853      being called, thus suppressing the XML declaration from the
854      output.  */
855 }
856 
857 const struct gdb_xml_attribute xinclude_attributes[] = {
858   { "href", GDB_XML_AF_NONE, NULL, NULL },
859   { NULL, GDB_XML_AF_NONE, NULL, NULL }
860 };
861 
862 const struct gdb_xml_element xinclude_elements[] = {
863   { "http://www.w3.org/2001/XInclude!include", xinclude_attributes, NULL,
864     GDB_XML_EF_OPTIONAL | GDB_XML_EF_REPEATABLE,
865     xinclude_start_include, xinclude_end_include },
866   { NULL, NULL, NULL, GDB_XML_EF_NONE, NULL, NULL }
867 };
868 
869 /* The main entry point for <xi:include> processing.  */
870 
871 bool
872 xml_process_xincludes (std::string &result,
873 		       const char *name, const char *text,
874 		       xml_fetch_another fetcher, int depth)
875 {
876   xinclude_parsing_data data (result, fetcher, depth);
877 
878   gdb_xml_parser parser (name, xinclude_elements, &data);
879   parser.set_is_xinclude (true);
880 
881   XML_SetCharacterDataHandler (parser.expat_parser (), NULL);
882   XML_SetDefaultHandler (parser.expat_parser (), xml_xinclude_default);
883 
884   /* Always discard the XML version declarations; the only important
885      thing this provides is encoding, and our result will have been
886      converted to UTF-8.  */
887   XML_SetXmlDeclHandler (parser.expat_parser (), xml_xinclude_xml_decl);
888 
889   if (depth > 0)
890     /* Discard the doctype for included documents.  */
891     XML_SetDoctypeDeclHandler (parser.expat_parser (),
892 			       xml_xinclude_start_doctype,
893 			       xml_xinclude_end_doctype);
894 
895   parser.use_dtd ("xinclude.dtd");
896 
897   if (parser.parse (text) == 0)
898     {
899       if (depth == 0)
900 	gdb_xml_debug (&parser, _("XInclude processing succeeded."));
901       return true;
902     }
903 
904   return false;
905 }
906 #endif /* HAVE_LIBEXPAT */
907 
908 
909 /* Return an XML document which was compiled into GDB, from
910    the given FILENAME, or NULL if the file was not compiled in.  */
911 
912 const char *
913 fetch_xml_builtin (const char *filename)
914 {
915   const char *const (*p)[2];
916 
917   for (p = xml_builtin; (*p)[0]; p++)
918     if (strcmp ((*p)[0], filename) == 0)
919       return (*p)[1];
920 
921   return NULL;
922 }
923 
924 /* A to_xfer_partial helper function which reads XML files which were
925    compiled into GDB.  The target may call this function from its own
926    to_xfer_partial handler, after converting object and annex to the
927    appropriate filename.  */
928 
929 LONGEST
930 xml_builtin_xfer_partial (const char *filename,
931 			  gdb_byte *readbuf, const gdb_byte *writebuf,
932 			  ULONGEST offset, LONGEST len)
933 {
934   const char *buf;
935   LONGEST len_avail;
936 
937   gdb_assert (readbuf != NULL && writebuf == NULL);
938   gdb_assert (filename != NULL);
939 
940   buf = fetch_xml_builtin (filename);
941   if (buf == NULL)
942     return -1;
943 
944   len_avail = strlen (buf);
945   if (offset >= len_avail)
946     return 0;
947 
948   if (len > len_avail - offset)
949     len = len_avail - offset;
950   memcpy (readbuf, buf + offset, len);
951   return len;
952 }
953 
954 
955 static void
956 show_debug_xml (struct ui_file *file, int from_tty,
957 		struct cmd_list_element *c, const char *value)
958 {
959   gdb_printf (file, _("XML debugging is %s.\n"), value);
960 }
961 
962 std::optional<gdb::char_vector>
963 xml_fetch_content_from_file (const char *filename, const char *dirname)
964 {
965   gdb_file_up file;
966 
967   if (dirname != nullptr && *dirname != '\0')
968     {
969       gdb::unique_xmalloc_ptr<char> fullname
970 	(concat (dirname, "/", filename, (char *) NULL));
971 
972       file = gdb_fopen_cloexec (fullname.get (), FOPEN_RB);
973     }
974   else
975     file = gdb_fopen_cloexec (filename, FOPEN_RB);
976 
977   if (file == NULL)
978     return {};
979 
980   /* Read in the whole file.  */
981 
982   size_t len;
983 
984   if (fseek (file.get (), 0, SEEK_END) == -1)
985     perror_with_name (_("seek to end of file"));
986   len = ftell (file.get ());
987   rewind (file.get ());
988 
989   gdb::char_vector text (len + 1);
990 
991   if (fread (text.data (), 1, len, file.get ()) != len
992       || ferror (file.get ()))
993     {
994       warning (_("Read error from \"%s\""), filename);
995       return {};
996     }
997 
998   text.back () = '\0';
999   return text;
1000 }
1001 
1002 void _initialize_xml_support ();
1003 void _initialize_xml_support ();
1004 void
1005 _initialize_xml_support ()
1006 {
1007   add_setshow_boolean_cmd ("xml", class_maintenance, &debug_xml,
1008 			   _("Set XML parser debugging."),
1009 			   _("Show XML parser debugging."),
1010 			   _("When set, debugging messages for XML parsers "
1011 			     "are displayed."),
1012 			   NULL, show_debug_xml,
1013 			   &setdebuglist, &showdebuglist);
1014 }
1015