123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356 |
- /* Copyright 2000-2005 The Apache Software Foundation or its licensors, as
- * applicable.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- /**
- * @file apr_xml.h
- * @brief APR-UTIL XML Library
- */
- #ifndef APR_XML_H
- #define APR_XML_H
- /**
- * @defgroup APR_Util_XML XML
- * @ingroup APR_Util
- * @{
- */
- #include "apr_pools.h"
- #include "apr_tables.h"
- #include "apr_file_io.h"
- #include "apu.h"
- #if APR_CHARSET_EBCDIC
- #include "apr_xlate.h"
- #endif
- #ifdef __cplusplus
- extern "C" {
- #endif
- /**
- * @package Apache XML library
- */
- /* -------------------------------------------------------------------- */
- /* ### these will need to move at some point to a more logical spot */
- /** @see apr_text */
- typedef struct apr_text apr_text;
- /** Structure to keep a linked list of pieces of text */
- struct apr_text {
- /** The current piece of text */
- const char *text;
- /** a pointer to the next piece of text */
- struct apr_text *next;
- };
- /** @see apr_text_header */
- typedef struct apr_text_header apr_text_header;
- /** A list of pieces of text */
- struct apr_text_header {
- /** The first piece of text in the list */
- apr_text *first;
- /** The last piece of text in the list */
- apr_text *last;
- };
- /**
- * Append a piece of text to the end of a list
- * @param p The pool to allocate out of
- * @param hdr The text header to append to
- * @param text The new text to append
- */
- APU_DECLARE(void) apr_text_append(apr_pool_t *p, apr_text_header *hdr,
- const char *text);
- /* --------------------------------------------------------------------
- **
- ** XML PARSING
- */
- /*
- ** Qualified namespace values
- **
- ** APR_XML_NS_DAV_ID
- ** We always insert the "DAV:" namespace URI at the head of the
- ** namespace array. This means that it will always be at ID==0,
- ** making it much easier to test for.
- **
- ** APR_XML_NS_NONE
- ** This special ID is used for two situations:
- **
- ** 1) The namespace prefix begins with "xml" (and we do not know
- ** what it means). Namespace prefixes with "xml" (any case) as
- ** their first three characters are reserved by the XML Namespaces
- ** specification for future use. mod_dav will pass these through
- ** unchanged. When this identifier is used, the prefix is LEFT in
- ** the element/attribute name. Downstream processing should not
- ** prepend another prefix.
- **
- ** 2) The element/attribute does not have a namespace.
- **
- ** a) No prefix was used, and a default namespace has not been
- ** defined.
- ** b) No prefix was used, and the default namespace was specified
- ** to mean "no namespace". This is done with a namespace
- ** declaration of: xmlns=""
- ** (this declaration is typically used to override a previous
- ** specification for the default namespace)
- **
- ** In these cases, we need to record that the elem/attr has no
- ** namespace so that we will not attempt to prepend a prefix.
- ** All namespaces that are used will have a prefix assigned to
- ** them -- mod_dav will never set or use the default namespace
- ** when generating XML. This means that "no prefix" will always
- ** mean "no namespace".
- **
- ** In both cases, the XML generation will avoid prepending a prefix.
- ** For the first case, this means the original prefix/name will be
- ** inserted into the output stream. For the latter case, it means
- ** the name will have no prefix, and since we never define a default
- ** namespace, this means it will have no namespace.
- **
- ** Note: currently, mod_dav understands the "xmlns" prefix and the
- ** "xml:lang" attribute. These are handled specially (they aren't
- ** left within the XML tree), so the APR_XML_NS_NONE value won't ever
- ** really apply to these values.
- */
- #define APR_XML_NS_DAV_ID 0 /**< namespace ID for "DAV:" */
- #define APR_XML_NS_NONE -10 /**< no namespace for this elem/attr */
- #define APR_XML_NS_ERROR_BASE -100 /**< used only during processing */
- /** Is this namespace an error? */
- #define APR_XML_NS_IS_ERROR(e) ((e) <= APR_XML_NS_ERROR_BASE)
- /** @see apr_xml_attr */
- typedef struct apr_xml_attr apr_xml_attr;
- /** @see apr_xml_elem */
- typedef struct apr_xml_elem apr_xml_elem;
- /** @see apr_xml_doc */
- typedef struct apr_xml_doc apr_xml_doc;
- /** apr_xml_attr: holds a parsed XML attribute */
- struct apr_xml_attr {
- /** attribute name */
- const char *name;
- /** index into namespace array */
- int ns;
- /** attribute value */
- const char *value;
- /** next attribute */
- struct apr_xml_attr *next;
- };
- /** apr_xml_elem: holds a parsed XML element */
- struct apr_xml_elem {
- /** element name */
- const char *name;
- /** index into namespace array */
- int ns;
- /** xml:lang for attrs/contents */
- const char *lang;
- /** cdata right after start tag */
- apr_text_header first_cdata;
- /** cdata after MY end tag */
- apr_text_header following_cdata;
- /** parent element */
- struct apr_xml_elem *parent;
- /** next (sibling) element */
- struct apr_xml_elem *next;
- /** first child element */
- struct apr_xml_elem *first_child;
- /** first attribute */
- struct apr_xml_attr *attr;
- /* used only during parsing */
- /** last child element */
- struct apr_xml_elem *last_child;
- /** namespaces scoped by this elem */
- struct apr_xml_ns_scope *ns_scope;
- /* used by modules during request processing */
- /** Place for modules to store private data */
- void *priv;
- };
- /** Is this XML element empty? */
- #define APR_XML_ELEM_IS_EMPTY(e) ((e)->first_child == NULL && \
- (e)->first_cdata.first == NULL)
- /** apr_xml_doc: holds a parsed XML document */
- struct apr_xml_doc {
- /** root element */
- apr_xml_elem *root;
- /** array of namespaces used */
- apr_array_header_t *namespaces;
- };
- /** Opaque XML parser structure */
- typedef struct apr_xml_parser apr_xml_parser;
- /**
- * Create an XML parser
- * @param pool The pool for allocating the parser and the parse results.
- * @return The new parser.
- */
- APU_DECLARE(apr_xml_parser *) apr_xml_parser_create(apr_pool_t *pool);
- /**
- * Parse a File, producing a xml_doc
- * @param p The pool for allocating the parse results.
- * @param parser A pointer to *parser (needed so calling function can get
- * errors), will be set to NULL on successfull completion.
- * @param ppdoc A pointer to *apr_xml_doc (which has the parsed results in it)
- * @param xmlfd A file to read from.
- * @param buffer_length Buffer length which would be suitable
- * @return Any errors found during parsing.
- */
- APU_DECLARE(apr_status_t) apr_xml_parse_file(apr_pool_t *p,
- apr_xml_parser **parser,
- apr_xml_doc **ppdoc,
- apr_file_t *xmlfd,
- apr_size_t buffer_length);
- /**
- * Feed input into the parser
- * @param parser The XML parser for parsing this data.
- * @param data The data to parse.
- * @param len The length of the data.
- * @return Any errors found during parsing.
- * @remark Use apr_xml_parser_geterror() to get more error information.
- */
- APU_DECLARE(apr_status_t) apr_xml_parser_feed(apr_xml_parser *parser,
- const char *data,
- apr_size_t len);
- /**
- * Terminate the parsing and return the result
- * @param parser The XML parser for parsing this data.
- * @param pdoc The resulting parse information. May be NULL to simply
- * terminate the parsing without fetching the info.
- * @return Any errors found during the final stage of parsing.
- * @remark Use apr_xml_parser_geterror() to get more error information.
- */
- APU_DECLARE(apr_status_t) apr_xml_parser_done(apr_xml_parser *parser,
- apr_xml_doc **pdoc);
- /**
- * Fetch additional error information from the parser.
- * @param parser The XML parser to query for errors.
- * @param errbuf A buffer for storing error text.
- * @param errbufsize The length of the error text buffer.
- * @return The error buffer
- */
- APU_DECLARE(char *) apr_xml_parser_geterror(apr_xml_parser *parser,
- char *errbuf,
- apr_size_t errbufsize);
- /**
- * Converts an XML element tree to flat text
- * @param p The pool to allocate out of
- * @param elem The XML element to convert
- * @param style How to covert the XML. One of:
- * <PRE>
- * APR_XML_X2T_FULL start tag, contents, end tag
- * APR_XML_X2T_INNER contents only
- * APR_XML_X2T_LANG_INNER xml:lang + inner contents
- * APR_XML_X2T_FULL_NS_LANG FULL + ns defns + xml:lang
- * </PRE>
- * @param namespaces The namespace of the current XML element
- * @param ns_map Namespace mapping
- * @param pbuf Buffer to put the converted text into
- * @param psize Size of the converted text
- */
- APU_DECLARE(void) apr_xml_to_text(apr_pool_t *p, const apr_xml_elem *elem,
- int style, apr_array_header_t *namespaces,
- int *ns_map, const char **pbuf,
- apr_size_t *psize);
- /* style argument values: */
- #define APR_XML_X2T_FULL 0 /**< start tag, contents, end tag */
- #define APR_XML_X2T_INNER 1 /**< contents only */
- #define APR_XML_X2T_LANG_INNER 2 /**< xml:lang + inner contents */
- #define APR_XML_X2T_FULL_NS_LANG 3 /**< FULL + ns defns + xml:lang */
- /**
- * empty XML element
- * @param p The pool to allocate out of
- * @param elem The XML element to empty
- * @return the string that was stored in the XML element
- */
- APU_DECLARE(const char *) apr_xml_empty_elem(apr_pool_t *p,
- const apr_xml_elem *elem);
- /**
- * quote an XML string
- * Replace '<', '>', and '&' with '<', '>', and '&'.
- * @param p The pool to allocate out of
- * @param s The string to quote
- * @param quotes If quotes is true, then replace '"' with '"'.
- * @return The quoted string
- * @note If the string does not contain special characters, it is not
- * duplicated into the pool and the original string is returned.
- */
- APU_DECLARE(const char *) apr_xml_quote_string(apr_pool_t *p, const char *s,
- int quotes);
- /**
- * Quote an XML element
- * @param p The pool to allocate out of
- * @param elem The element to quote
- */
- APU_DECLARE(void) apr_xml_quote_elem(apr_pool_t *p, apr_xml_elem *elem);
- /* manage an array of unique URIs: apr_xml_insert_uri() and APR_XML_URI_ITEM() */
- /**
- * return the URI's (existing) index, or insert it and return a new index
- * @param uri_array array to insert into
- * @param uri The uri to insert
- * @return int The uri's index
- */
- APU_DECLARE(int) apr_xml_insert_uri(apr_array_header_t *uri_array,
- const char *uri);
- /** Get the URI item for this XML element */
- #define APR_XML_GET_URI_ITEM(ary, i) (((const char * const *)(ary)->elts)[i])
- #if APR_CHARSET_EBCDIC
- /**
- * Convert parsed tree in EBCDIC
- * @param p The pool to allocate out of
- * @param pdoc The apr_xml_doc to convert.
- * @param xlate The translation handle to use.
- * @return Any errors found during conversion.
- */
- APU_DECLARE(apr_status_t) apr_xml_parser_convert_doc(apr_pool_t *p,
- apr_xml_doc *pdoc,
- apr_xlate_t *convset);
- #endif
- #ifdef __cplusplus
- }
- #endif
- /** @} */
- #endif /* APR_XML_H */
|