diff options
-rw-r--r-- | configure.in | 2 | ||||
-rw-r--r-- | doc/APIchunk12.html | 1 | ||||
-rw-r--r-- | doc/APIchunk13.html | 1 | ||||
-rw-r--r-- | doc/APIchunk18.html | 1 | ||||
-rw-r--r-- | doc/APIchunk20.html | 2 | ||||
-rw-r--r-- | doc/APIchunk22.html | 1 | ||||
-rw-r--r-- | doc/APIchunk26.html | 1 | ||||
-rw-r--r-- | doc/APIchunk28.html | 1 | ||||
-rw-r--r-- | doc/APIchunk4.html | 1 | ||||
-rw-r--r-- | doc/APIfiles.html | 1 | ||||
-rw-r--r-- | doc/APIsymbols.html | 1 | ||||
-rw-r--r-- | doc/devhelp/libxml2-HTMLparser.html | 3 | ||||
-rw-r--r-- | doc/devhelp/libxml2-tree.html | 8 | ||||
-rw-r--r-- | doc/devhelp/libxml2.devhelp | 1 | ||||
-rw-r--r-- | doc/html/libxml-HTMLparser.html | 3 | ||||
-rw-r--r-- | doc/html/libxml-tree.html | 8 | ||||
-rw-r--r-- | doc/libxml2-api.xml | 12 | ||||
-rw-r--r-- | doc/libxml2-refs.xml | 22 | ||||
-rwxr-xr-x | python/setup.py | 2 |
19 files changed, 57 insertions, 15 deletions
diff --git a/configure.in b/configure.in index 26f54676..17c11cde 100644 --- a/configure.in +++ b/configure.in @@ -6,7 +6,7 @@ AC_CANONICAL_HOST LIBXML_MAJOR_VERSION=2 LIBXML_MINOR_VERSION=7 -LIBXML_MICRO_VERSION=6 +LIBXML_MICRO_VERSION=7 LIBXML_MICRO_VERSION_SUFFIX= LIBXML_VERSION=$LIBXML_MAJOR_VERSION.$LIBXML_MINOR_VERSION.$LIBXML_MICRO_VERSION$LIBXML_MICRO_VERSION_SUFFIX LIBXML_VERSION_INFO=`expr $LIBXML_MAJOR_VERSION + $LIBXML_MINOR_VERSION`:$LIBXML_MICRO_VERSION:$LIBXML_MINOR_VERSION diff --git a/doc/APIchunk12.html b/doc/APIchunk12.html index d95f37d7..13c1702c 100644 --- a/doc/APIchunk12.html +++ b/doc/APIchunk12.html @@ -395,6 +395,7 @@ A:link, A:visited, A:active { text-decoration: underline } </dd><dt>comparisons</dt><dd><a href="html/libxml-xmlreader.html#xmlTextReaderConstString">xmlTextReaderConstString</a><br /> <a href="html/libxml-xpathInternals.html#xmlXPathSubstringFunction">xmlXPathSubstringFunction</a><br /> </dd><dt>compatibility</dt><dd><a href="html/libxml-xmlversion.html#LIBXML_LEGACY_ENABLED">LIBXML_LEGACY_ENABLED</a><br /> +<a href="html/libxml-HTMLparser.html#htmlParseElement">htmlParseElement</a><br /> <a href="html/libxml-tree.html#xmlChildrenNode">xmlChildrenNode</a><br /> <a href="html/libxml-parserInternals.html#xmlCopyChar">xmlCopyChar</a><br /> <a href="html/libxml-entities.html#xmlEncodeEntities">xmlEncodeEntities</a><br /> diff --git a/doc/APIchunk13.html b/doc/APIchunk13.html index d1390ebe..d693461b 100644 --- a/doc/APIchunk13.html +++ b/doc/APIchunk13.html @@ -504,6 +504,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-tree.html#xmlDocGetRootElement">xmlDocGetRootElement</a><br /> <a href="html/libxml-tree.html#xmlDocSetRootElement">xmlDocSetRootElement</a><br /> <a href="html/libxml-xmlwriter.html#xmlNewTextWriterTree">xmlNewTextWriterTree</a><br /> +<a href="html/libxml-tree.html#xmlNodeGetBase">xmlNodeGetBase</a><br /> </dd><dt>docs</dt><dd><a href="html/libxml-uri.html#xmlBuildRelativeURI">xmlBuildRelativeURI</a><br /> </dd><dt>doctypedecl</dt><dd><a href="html/libxml-parserInternals.html#xmlParseDocTypeDecl">xmlParseDocTypeDecl</a><br /> <a href="html/libxml-parser.html#xmlParseDocument">xmlParseDocument</a><br /> diff --git a/doc/APIchunk18.html b/doc/APIchunk18.html index d9444ad7..41fad5e5 100644 --- a/doc/APIchunk18.html +++ b/doc/APIchunk18.html @@ -73,6 +73,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-xpath.html#_xmlXPathContext">_xmlXPathContext</a><br /> <a href="html/libxml-HTMLparser.html#htmlAutoCloseTag">htmlAutoCloseTag</a><br /> <a href="html/libxml-HTMLparser.html#htmlIsAutoClosed">htmlIsAutoClosed</a><br /> +<a href="html/libxml-HTMLparser.html#htmlParseElement">htmlParseElement</a><br /> <a href="html/libxml-parser.html#xmlKeepBlanksDefault">xmlKeepBlanksDefault</a><br /> <a href="html/libxml-xpath.html#xmlXPathOrderDocElems">xmlXPathOrderDocElems</a><br /> </dd><dt>keyword</dt><dd><a href="html/libxml-parserInternals.html#xmlParseDefaultDecl">xmlParseDefaultDecl</a><br /> diff --git a/doc/APIchunk20.html b/doc/APIchunk20.html index 9c4ed36c..f39da0e6 100644 --- a/doc/APIchunk20.html +++ b/doc/APIchunk20.html @@ -166,6 +166,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-valid.html#xmlValidGetValidElements">xmlValidGetValidElements</a><br /> </dd><dt>node-set?</dt><dd><a href="html/libxml-xpathInternals.html#xmlXPathLocalNameFunction">xmlXPathLocalNameFunction</a><br /> <a href="html/libxml-xpathInternals.html#xmlXPathNamespaceURIFunction">xmlXPathNamespaceURIFunction</a><br /> +</dd><dt>nodeInfos</dt><dd><a href="html/libxml-parser.html#_xmlParserCtxt">_xmlParserCtxt</a><br /> </dd><dt>nodelist</dt><dd><a href="html/libxml-parser.html#xmlParseBalancedChunkMemoryRecover">xmlParseBalancedChunkMemoryRecover</a><br /> </dd><dt>nodes1</dt><dd><a href="html/libxml-xpathInternals.html#xmlXPathDifference">xmlXPathDifference</a><br /> </dd><dt>nodes2</dt><dd><a href="html/libxml-xpathInternals.html#xmlXPathDifference">xmlXPathDifference</a><br /> @@ -197,6 +198,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-c14n.html#xmlC14NExecute">xmlC14NExecute</a><br /> </dd><dt>non-normative</dt><dd><a href="html/libxml-encoding.html#xmlDetectCharEncoding">xmlDetectCharEncoding</a><br /> </dd><dt>non-null</dt><dd><a href="html/libxml-debugXML.html#xmlShellPrintNode">xmlShellPrintNode</a><br /> +</dd><dt>non-recursive</dt><dd><a href="html/libxml-parser.html#_xmlParserCtxt">_xmlParserCtxt</a><br /> </dd><dt>non-stateless</dt><dd><a href="html/libxml-encoding.html#xmlCharEncOutFunc">xmlCharEncOutFunc</a><br /> </dd><dt>non-validating</dt><dd><a href="html/libxml-parserInternals.html#xmlParseAttValue">xmlParseAttValue</a><br /> <a href="html/libxml-parserInternals.html#xmlParseEntityRef">xmlParseEntityRef</a><br /> diff --git a/doc/APIchunk22.html b/doc/APIchunk22.html index 7a647dd0..f95bac08 100644 --- a/doc/APIchunk22.html +++ b/doc/APIchunk22.html @@ -343,6 +343,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-entities.html#_xmlEntity">_xmlEntity</a><br /> <a href="html/libxml-tree.html#_xmlNode">_xmlNode</a><br /> <a href="html/libxml-HTMLparser.html#htmlHandleOmittedElem">htmlHandleOmittedElem</a><br /> +<a href="html/libxml-HTMLparser.html#htmlParseElement">htmlParseElement</a><br /> <a href="html/libxml-tree.html#xmlAddPrevSibling">xmlAddPrevSibling</a><br /> <a href="html/libxml-catalog.html#xmlCatalogSetDebug">xmlCatalogSetDebug</a><br /> <a href="html/libxml-catalog.html#xmlCatalogSetDefaultPrefer">xmlCatalogSetDefaultPrefer</a><br /> diff --git a/doc/APIchunk26.html b/doc/APIchunk26.html index a99c7084..26e410c9 100644 --- a/doc/APIchunk26.html +++ b/doc/APIchunk26.html @@ -270,6 +270,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-schemasInternals.html#XML_SCHEMAS_TYPE_VARIETY_LIST">XML_SCHEMAS_TYPE_VARIETY_LIST</a><br /> <a href="html/libxml-schemasInternals.html#XML_SCHEMAS_TYPE_VARIETY_UNION">XML_SCHEMAS_TYPE_VARIETY_UNION</a><br /> </dd><dt>various</dt><dd><a href="html/libxml-tree.html#_xmlDOMWrapCtxt">_xmlDOMWrapCtxt</a><br /> +</dd><dt>versions</dt><dd><a href="html/libxml-HTMLparser.html#htmlParseElement">htmlParseElement</a><br /> </dd><dt>very</dt><dd><a href="html/libxml-HTMLparser.html#_htmlElemDesc">_htmlElemDesc</a><br /> <a href="html/libxml-parser.html#_xmlParserInput">_xmlParserInput</a><br /> <a href="html/libxml-encoding.html#xmlCharEncFirstLine">xmlCharEncFirstLine</a><br /> diff --git a/doc/APIchunk28.html b/doc/APIchunk28.html index b2a9f11e..af942daa 100644 --- a/doc/APIchunk28.html +++ b/doc/APIchunk28.html @@ -147,7 +147,6 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-xmlwriter.html#xmlNewTextWriterDoc">xmlNewTextWriterDoc</a><br /> <a href="html/libxml-xmlwriter.html#xmlNewTextWriterTree">xmlNewTextWriterTree</a><br /> <a href="html/libxml-xmlreader.html#xmlTextReaderCurrentDoc">xmlTextReaderCurrentDoc</a><br /> -</dd><dt>xmlDocumentGetBase</dt><dd><a href="html/libxml-tree.html#xmlNodeGetBase">xmlNodeGetBase</a><br /> </dd><dt>xmlDtdPtr</dt><dd><a href="html/libxml-tree.html#xmlCopyDtd">xmlCopyDtd</a><br /> <a href="html/libxml-parser.html#xmlIOParseDTD">xmlIOParseDTD</a><br /> <a href="html/libxml-parser.html#xmlParseDTD">xmlParseDTD</a><br /> diff --git a/doc/APIchunk4.html b/doc/APIchunk4.html index 395dbfc3..9a2222f9 100644 --- a/doc/APIchunk4.html +++ b/doc/APIchunk4.html @@ -263,6 +263,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-tree.html#xmlNodeListGetRawString">xmlNodeListGetRawString</a><br /> <a href="html/libxml-tree.html#xmlNodeListGetString">xmlNodeListGetString</a><br /> <a href="html/libxml-xpathInternals.html#xmlXPathNewNodeSet">xmlXPathNewNodeSet</a><br /> +</dd><dt>NodeInfo</dt><dd><a href="html/libxml-parser.html#_xmlParserCtxt">_xmlParserCtxt</a><br /> </dd><dt>NodeList</dt><dd><a href="html/libxml-xpath.html#xmlXPathNodeSetGetLength">xmlXPathNodeSetGetLength</a><br /> <a href="html/libxml-xpath.html#xmlXPathNodeSetItem">xmlXPathNodeSetItem</a><br /> </dd><dt>NodePtr</dt><dd><a href="html/libxml-xpathInternals.html#xmlXPathNewNodeSet">xmlXPathNewNodeSet</a><br /> diff --git a/doc/APIfiles.html b/doc/APIfiles.html index 22b7bea5..33ac7f9d 100644 --- a/doc/APIfiles.html +++ b/doc/APIfiles.html @@ -30,6 +30,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-HTMLparser.html#HTML_PARSE_COMPACT">HTML_PARSE_COMPACT</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NOBLANKS">HTML_PARSE_NOBLANKS</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NOERROR">HTML_PARSE_NOERROR</a><br /> +<a href="html/libxml-HTMLparser.html#HTML_PARSE_NOIMPLIED">HTML_PARSE_NOIMPLIED</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NONET">HTML_PARSE_NONET</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NOWARNING">HTML_PARSE_NOWARNING</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_PEDANTIC">HTML_PARSE_PEDANTIC</a><br /> diff --git a/doc/APIsymbols.html b/doc/APIsymbols.html index e2d4d0dd..d8784396 100644 --- a/doc/APIsymbols.html +++ b/doc/APIsymbols.html @@ -28,6 +28,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="html/libxml-HTMLparser.html#HTML_PARSE_COMPACT">HTML_PARSE_COMPACT</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NOBLANKS">HTML_PARSE_NOBLANKS</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NOERROR">HTML_PARSE_NOERROR</a><br /> +<a href="html/libxml-HTMLparser.html#HTML_PARSE_NOIMPLIED">HTML_PARSE_NOIMPLIED</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NONET">HTML_PARSE_NONET</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_NOWARNING">HTML_PARSE_NOWARNING</a><br /> <a href="html/libxml-HTMLparser.html#HTML_PARSE_PEDANTIC">HTML_PARSE_PEDANTIC</a><br /> diff --git a/doc/devhelp/libxml2-HTMLparser.html b/doc/devhelp/libxml2-HTMLparser.html index 827da396..1ce01e3f 100644 --- a/doc/devhelp/libxml2-HTMLparser.html +++ b/doc/devhelp/libxml2-HTMLparser.html @@ -189,6 +189,7 @@ int <a href="#htmlCtxtUseOptions">htmlCtxtUseOptions</a> (<a href="libxml2-HTML <a name="HTML_PARSE_PEDANTIC">HTML_PARSE_PEDANTIC</a> = 128 /* pedantic error reporting */ <a name="HTML_PARSE_NOBLANKS">HTML_PARSE_NOBLANKS</a> = 256 /* remove blank nodes */ <a name="HTML_PARSE_NONET">HTML_PARSE_NONET</a> = 2048 /* Forbid network access */ + <a name="HTML_PARSE_NOIMPLIED">HTML_PARSE_NOIMPLIED</a> = 8192 /* Do not add implied html/body... elements */ <a name="HTML_PARSE_COMPACT">HTML_PARSE_COMPACT</a> = 65536 /* compact small text nodes */ }; </pre><p/> @@ -321,7 +322,7 @@ int <a href="#htmlCtxtUseOptions">htmlCtxtUseOptions</a> (<a href="libxml2-HTML <div class="variablelist"><table border="0"><col align="left"/><tbody><tr><td><span class="term"><i><tt>ctxt</tt></i>:</span></td><td>an HTML parser context</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>0, -1 in case of error. the parser context is augmented as a result of the parsing.</td></tr></tbody></table></div></div> <hr/> <div class="refsect2" lang="en"><h3><a name="htmlParseElement"/>htmlParseElement ()</h3><pre class="programlisting">void htmlParseElement (<a href="libxml2-HTMLparser.html#htmlParserCtxtPtr">htmlParserCtxtPtr</a> ctxt)<br/> -</pre><p>parse an HTML element, this is highly recursive [39] element ::= EmptyElemTag | STag content ETag [41] Attribute ::= Name Eq AttValue</p> +</pre><p>parse an HTML element, this is highly recursive this is kept for compatibility with previous code versions [39] element ::= EmptyElemTag | STag content ETag [41] Attribute ::= Name Eq AttValue</p> <div class="variablelist"><table border="0"><col align="left"/><tbody><tr><td><span class="term"><i><tt>ctxt</tt></i>:</span></td><td>an HTML parser context</td></tr></tbody></table></div></div> <hr/> <div class="refsect2" lang="en"><h3><a name="htmlParseEntityRef"/>htmlParseEntityRef ()</h3><pre class="programlisting">const <a href="libxml2-HTMLparser.html#htmlEntityDesc">htmlEntityDesc</a> * htmlParseEntityRef (<a href="libxml2-HTMLparser.html#htmlParserCtxtPtr">htmlParserCtxtPtr</a> ctxt, <br/> const <a href="libxml2-xmlstring.html#xmlChar">xmlChar</a> ** str)<br/> diff --git a/doc/devhelp/libxml2-tree.html b/doc/devhelp/libxml2-tree.html index c3702036..2c254a32 100644 --- a/doc/devhelp/libxml2-tree.html +++ b/doc/devhelp/libxml2-tree.html @@ -781,7 +781,11 @@ void <a href="#xmlFreeNsList">xmlFreeNsList</a> (<a href="libxml2-tree.html#xm <a href="libxml2-xmlerror.html#xmlError">xmlError</a> lastError <a href="libxml2-parser.html#xmlParserMode">xmlParserMode</a> parseMode : the parser mode unsigned long nbentities : number of entities references - unsigned long sizeentities : size of parsed entities + unsigned long sizeentities : size of parsed entities for use by HTML non-recursive parser + <a href="libxml2-parser.html#xmlParserNodeInfo">xmlParserNodeInfo</a> * nodeInfo : Current NodeInfo + int nodeInfoNr : Depth of the parsing stack + int nodeInfoMax : Max depth of the parsing stack + <a href="libxml2-parser.html#xmlParserNodeInfo">xmlParserNodeInfo</a> * nodeInfoTab : array of nodeInfos } xmlParserCtxt; </pre><p/> </div> @@ -1349,7 +1353,7 @@ void <a href="#xmlFreeNsList">xmlFreeNsList</a> (<a href="libxml2-tree.html#xm <div class="variablelist"><table border="0"><col align="left"/><tbody><tr><td><span class="term"><i><tt>buf</tt></i>:</span></td><td>the XML buffer output</td></tr><tr><td><span class="term"><i><tt>doc</tt></i>:</span></td><td>the document</td></tr><tr><td><span class="term"><i><tt>cur</tt></i>:</span></td><td>the current node</td></tr><tr><td><span class="term"><i><tt>level</tt></i>:</span></td><td>the imbrication level for indenting</td></tr><tr><td><span class="term"><i><tt>format</tt></i>:</span></td><td>is formatting allowed</td></tr><tr><td><span class="term"><i><tt>encoding</tt></i>:</span></td><td>an optional encoding string</td></tr></tbody></table></div></div> <hr/> <div class="refsect2" lang="en"><h3><a name="xmlNodeGetBase"/>xmlNodeGetBase ()</h3><pre class="programlisting"><a href="libxml2-xmlstring.html#xmlChar">xmlChar</a> * xmlNodeGetBase (<a href="libxml2-tree.html#xmlDocPtr">xmlDocPtr</a> doc, <br/> <a href="libxml2-tree.html#xmlNodePtr">xmlNodePtr</a> cur)<br/> -</pre><p>Searches for the BASE URL. The code should work on both XML and HTML document even if base mechanisms are completely different. It returns the base as defined in RFC 2396 sections 5.1.1. Base URI within Document Content and 5.1.2. Base URI from the Encapsulating Entity However it does not return the document base (5.1.3), use xmlDocumentGetBase() for this</p> +</pre><p>Searches for the BASE URL. The code should work on both XML and HTML document even if base mechanisms are completely different. It returns the base as defined in RFC 2396 sections 5.1.1. Base URI within Document Content and 5.1.2. Base URI from the Encapsulating Entity However it does not return the document base (5.1.3), use doc->URL in this case</p> <div class="variablelist"><table border="0"><col align="left"/><tbody><tr><td><span class="term"><i><tt>doc</tt></i>:</span></td><td>the document the node pertains to</td></tr><tr><td><span class="term"><i><tt>cur</tt></i>:</span></td><td>the node being checked</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>a pointer to the base URL, or NULL if not found It's up to the caller to free the memory with xmlFree().</td></tr></tbody></table></div></div> <hr/> <div class="refsect2" lang="en"><h3><a name="xmlNodeGetContent"/>xmlNodeGetContent ()</h3><pre class="programlisting"><a href="libxml2-xmlstring.html#xmlChar">xmlChar</a> * xmlNodeGetContent (<a href="libxml2-tree.html#xmlNodePtr">xmlNodePtr</a> cur)<br/> diff --git a/doc/devhelp/libxml2.devhelp b/doc/devhelp/libxml2.devhelp index 81529794..3e632b62 100644 --- a/doc/devhelp/libxml2.devhelp +++ b/doc/devhelp/libxml2.devhelp @@ -306,6 +306,7 @@ <function name="HTML_PARSE_COMPACT" link="libxml2-HTMLparser.html#HTML_PARSE_COMPACT"/> <function name="HTML_PARSE_NOBLANKS" link="libxml2-HTMLparser.html#HTML_PARSE_NOBLANKS"/> <function name="HTML_PARSE_NOERROR" link="libxml2-HTMLparser.html#HTML_PARSE_NOERROR"/> + <function name="HTML_PARSE_NOIMPLIED" link="libxml2-HTMLparser.html#HTML_PARSE_NOIMPLIED"/> <function name="HTML_PARSE_NONET" link="libxml2-HTMLparser.html#HTML_PARSE_NONET"/> <function name="HTML_PARSE_NOWARNING" link="libxml2-HTMLparser.html#HTML_PARSE_NOWARNING"/> <function name="HTML_PARSE_PEDANTIC" link="libxml2-HTMLparser.html#HTML_PARSE_PEDANTIC"/> diff --git a/doc/html/libxml-HTMLparser.html b/doc/html/libxml-HTMLparser.html index 0bc7dbd5..09c959b6 100644 --- a/doc/html/libxml-HTMLparser.html +++ b/doc/html/libxml-HTMLparser.html @@ -93,6 +93,7 @@ A:link, A:visited, A:active { text-decoration: underline } <a name="HTML_PARSE_PEDANTIC" id="HTML_PARSE_PEDANTIC">HTML_PARSE_PEDANTIC</a> = 128 : pedantic error reporting <a name="HTML_PARSE_NOBLANKS" id="HTML_PARSE_NOBLANKS">HTML_PARSE_NOBLANKS</a> = 256 : remove blank nodes <a name="HTML_PARSE_NONET" id="HTML_PARSE_NONET">HTML_PARSE_NONET</a> = 2048 : Forbid network access + <a name="HTML_PARSE_NOIMPLIED" id="HTML_PARSE_NOIMPLIED">HTML_PARSE_NOIMPLIED</a> = 8192 : Do not add implied html/body... elements <a name="HTML_PARSE_COMPACT" id="HTML_PARSE_COMPACT">HTML_PARSE_COMPACT</a> = 65536 : compact small text nodes } </pre><h3>Enum <a name="htmlStatus" id="htmlStatus">htmlStatus</a></h3><pre class="programlisting">Enum htmlStatus { @@ -157,7 +158,7 @@ A:link, A:visited, A:active { text-decoration: underline } <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>cur</tt></i>:</span></td><td>a pointer to an array of <a href="libxml-xmlstring.html#xmlChar">xmlChar</a></td></tr><tr><td><span class="term"><i><tt>encoding</tt></i>:</span></td><td>a free form C string describing the HTML document encoding, or NULL</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>the resulting document tree</td></tr></tbody></table></div><h3><a name="htmlParseDocument" id="htmlParseDocument"></a>Function: htmlParseDocument</h3><pre class="programlisting">int htmlParseDocument (<a href="libxml-HTMLparser.html#htmlParserCtxtPtr">htmlParserCtxtPtr</a> ctxt)<br /> </pre><p>parse an HTML document (and build a tree if using the standard SAX interface).</p> <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>ctxt</tt></i>:</span></td><td>an HTML parser context</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>0, -1 in case of error. the parser context is augmented as a result of the parsing.</td></tr></tbody></table></div><h3><a name="htmlParseElement" id="htmlParseElement"></a>Function: htmlParseElement</h3><pre class="programlisting">void htmlParseElement (<a href="libxml-HTMLparser.html#htmlParserCtxtPtr">htmlParserCtxtPtr</a> ctxt)<br /> -</pre><p>parse an HTML element, this is highly recursive [39] element ::= EmptyElemTag | STag content ETag [41] Attribute ::= Name Eq AttValue</p> +</pre><p>parse an HTML element, this is highly recursive this is kept for compatibility with previous code versions [39] element ::= EmptyElemTag | STag content ETag [41] Attribute ::= Name Eq AttValue</p> <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>ctxt</tt></i>:</span></td><td>an HTML parser context</td></tr></tbody></table></div><h3><a name="htmlParseEntityRef" id="htmlParseEntityRef"></a>Function: htmlParseEntityRef</h3><pre class="programlisting">const <a href="libxml-HTMLparser.html#htmlEntityDesc">htmlEntityDesc</a> * htmlParseEntityRef (<a href="libxml-HTMLparser.html#htmlParserCtxtPtr">htmlParserCtxtPtr</a> ctxt, <br /> const <a href="libxml-xmlstring.html#xmlChar">xmlChar</a> ** str)<br /> </pre><p>parse an HTML ENTITY references [68] EntityRef ::= '&' Name ';'</p> <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>ctxt</tt></i>:</span></td><td>an HTML parser context</td></tr><tr><td><span class="term"><i><tt>str</tt></i>:</span></td><td>location to store the entity name</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>the associated <a href="libxml-HTMLparser.html#htmlEntityDescPtr">htmlEntityDescPtr</a> if found, or NULL otherwise, if non-NULL *str will have to be freed by the caller.</td></tr></tbody></table></div><h3><a name="htmlParseFile" id="htmlParseFile"></a>Function: htmlParseFile</h3><pre class="programlisting"><a href="libxml-HTMLparser.html#htmlDocPtr">htmlDocPtr</a> htmlParseFile (const char * filename, <br /> const char * encoding)<br /> diff --git a/doc/html/libxml-tree.html b/doc/html/libxml-tree.html index 6f916056..50cc4471 100644 --- a/doc/html/libxml-tree.html +++ b/doc/html/libxml-tree.html @@ -563,7 +563,11 @@ A:link, A:visited, A:active { text-decoration: underline } <a href="libxml-xmlerror.html#xmlError">xmlError</a> lastError <a href="libxml-parser.html#xmlParserMode">xmlParserMode</a> parseMode : the parser mode unsigned long nbentities : number of entities references - unsigned long sizeentities : size of parsed entities + unsigned long sizeentities : size of parsed entities for use by HTML + <a href="libxml-parser.html#xmlParserNodeInfo">xmlParserNodeInfo</a> * nodeInfo : Current NodeInfo + int nodeInfoNr : Depth of the parsing stack + int nodeInfoMax : Max depth of the parsing stack + <a href="libxml-parser.html#xmlParserNodeInfo">xmlParserNodeInfo</a> * nodeInfoTab : array of nodeInfos }</pre><h3><a name="xmlParserInput" id="xmlParserInput">Structure xmlParserInput</a></h3><pre class="programlisting">Structure xmlParserInput<br />struct _xmlParserInput { <a href="libxml-tree.html#xmlParserInputBufferPtr">xmlParserInputBufferPtr</a> buf : UTF-8 encoded buffer const char * filename : The file analyzed, if any @@ -860,7 +864,7 @@ A:link, A:visited, A:active { text-decoration: underline } <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>buf</tt></i>:</span></td><td>the XML buffer output</td></tr><tr><td><span class="term"><i><tt>doc</tt></i>:</span></td><td>the document</td></tr><tr><td><span class="term"><i><tt>cur</tt></i>:</span></td><td>the current node</td></tr><tr><td><span class="term"><i><tt>level</tt></i>:</span></td><td>the imbrication level for indenting</td></tr><tr><td><span class="term"><i><tt>format</tt></i>:</span></td><td>is formatting allowed</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>the number of bytes written to the buffer or -1 in case of error</td></tr></tbody></table></div><h3><a name="xmlNodeDumpOutput" id="xmlNodeDumpOutput"></a>Function: xmlNodeDumpOutput</h3><pre class="programlisting">void xmlNodeDumpOutput (<a href="libxml-tree.html#xmlOutputBufferPtr">xmlOutputBufferPtr</a> buf, <br /> <a href="libxml-tree.html#xmlDocPtr">xmlDocPtr</a> doc, <br /> <a href="libxml-tree.html#xmlNodePtr">xmlNodePtr</a> cur, <br /> int level, <br /> int format, <br /> const char * encoding)<br /> </pre><p>Dump an XML node, recursive behaviour, children are printed too. Note that @format = 1 provide node indenting only if <a href="libxml-globals.html#xmlIndentTreeOutput">xmlIndentTreeOutput</a> = 1 or xmlKeepBlanksDefault(0) was called</p> <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>buf</tt></i>:</span></td><td>the XML buffer output</td></tr><tr><td><span class="term"><i><tt>doc</tt></i>:</span></td><td>the document</td></tr><tr><td><span class="term"><i><tt>cur</tt></i>:</span></td><td>the current node</td></tr><tr><td><span class="term"><i><tt>level</tt></i>:</span></td><td>the imbrication level for indenting</td></tr><tr><td><span class="term"><i><tt>format</tt></i>:</span></td><td>is formatting allowed</td></tr><tr><td><span class="term"><i><tt>encoding</tt></i>:</span></td><td>an optional encoding string</td></tr></tbody></table></div><h3><a name="xmlNodeGetBase" id="xmlNodeGetBase"></a>Function: xmlNodeGetBase</h3><pre class="programlisting"><a href="libxml-xmlstring.html#xmlChar">xmlChar</a> * xmlNodeGetBase (<a href="libxml-tree.html#xmlDocPtr">xmlDocPtr</a> doc, <br /> <a href="libxml-tree.html#xmlNodePtr">xmlNodePtr</a> cur)<br /> -</pre><p>Searches for the BASE URL. The code should work on both XML and HTML document even if base mechanisms are completely different. It returns the base as defined in RFC 2396 sections 5.1.1. Base URI within Document Content and 5.1.2. Base URI from the Encapsulating Entity However it does not return the document base (5.1.3), use xmlDocumentGetBase() for this</p> +</pre><p>Searches for the BASE URL. The code should work on both XML and HTML document even if base mechanisms are completely different. It returns the base as defined in RFC 2396 sections 5.1.1. Base URI within Document Content and 5.1.2. Base URI from the Encapsulating Entity However it does not return the document base (5.1.3), use doc->URL in this case</p> <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>doc</tt></i>:</span></td><td>the document the node pertains to</td></tr><tr><td><span class="term"><i><tt>cur</tt></i>:</span></td><td>the node being checked</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>a pointer to the base URL, or NULL if not found It's up to the caller to free the memory with xmlFree().</td></tr></tbody></table></div><h3><a name="xmlNodeGetContent" id="xmlNodeGetContent"></a>Function: xmlNodeGetContent</h3><pre class="programlisting"><a href="libxml-xmlstring.html#xmlChar">xmlChar</a> * xmlNodeGetContent (<a href="libxml-tree.html#xmlNodePtr">xmlNodePtr</a> cur)<br /> </pre><p>Read the value of a node, this can be either the text carried directly by this node if it's a TEXT node or the aggregate string of the values carried by this node child's (TEXT and ENTITY_REF). Entity references are substituted.</p> <div class="variablelist"><table border="0"><col align="left" /><tbody><tr><td><span class="term"><i><tt>cur</tt></i>:</span></td><td>the node being read</td></tr><tr><td><span class="term"><i><tt>Returns</tt></i>:</span></td><td>a new #xmlChar * or NULL if no content is available. It's up to the caller to free the memory with xmlFree().</td></tr></tbody></table></div><h3><a name="xmlNodeGetLang" id="xmlNodeGetLang"></a>Function: xmlNodeGetLang</h3><pre class="programlisting"><a href="libxml-xmlstring.html#xmlChar">xmlChar</a> * xmlNodeGetLang (<a href="libxml-tree.html#xmlNodePtr">xmlNodePtr</a> cur)<br /> diff --git a/doc/libxml2-api.xml b/doc/libxml2-api.xml index 5cf19cb9..046be3d5 100644 --- a/doc/libxml2-api.xml +++ b/doc/libxml2-api.xml @@ -42,6 +42,7 @@ <exports symbol='HTML_DEPRECATED' type='enum'/> <exports symbol='HTML_PARSE_PEDANTIC' type='enum'/> <exports symbol='HTML_PARSE_RECOVER' type='enum'/> + <exports symbol='HTML_PARSE_NOIMPLIED' type='enum'/> <exports symbol='HTML_PARSE_NOWARNING' type='enum'/> <exports symbol='htmlParserNodeInfo' type='typedef'/> <exports symbol='htmlParserInput' type='typedef'/> @@ -4593,6 +4594,7 @@ <enum name='HTML_PARSE_COMPACT' file='HTMLparser' value='65536' type='htmlParserOption' info=' compact small text nodes'/> <enum name='HTML_PARSE_NOBLANKS' file='HTMLparser' value='256' type='htmlParserOption' info='remove blank nodes'/> <enum name='HTML_PARSE_NOERROR' file='HTMLparser' value='32' type='htmlParserOption' info='suppress error reports'/> + <enum name='HTML_PARSE_NOIMPLIED' file='HTMLparser' value='8192' type='htmlParserOption' info='Do not add implied html/body... elements'/> <enum name='HTML_PARSE_NONET' file='HTMLparser' value='2048' type='htmlParserOption' info='Forbid network access'/> <enum name='HTML_PARSE_NOWARNING' file='HTMLparser' value='64' type='htmlParserOption' info='suppress warning reports'/> <enum name='HTML_PARSE_PEDANTIC' file='HTMLparser' value='128' type='htmlParserOption' info='pedantic error reporting'/> @@ -6339,7 +6341,11 @@ actually an xmlCharEncoding'/> <field name='lastError' type='xmlError' info=''/> <field name='parseMode' type='xmlParserMode' info=' the parser mode'/> <field name='nbentities' type='unsigned long' info=' number of entities references'/> - <field name='sizeentities' type='unsigned long' info=' size of parsed entities'/> + <field name='sizeentities' type='unsigned long' info=' size of parsed entities for use by HTML non-recursive parser'/> + <field name='nodeInfo' type='xmlParserNodeInfo *' info=' Current NodeInfo'/> + <field name='nodeInfoNr' type='int' info=' Depth of the parsing stack'/> + <field name='nodeInfoMax' type='int' info=' Max depth of the parsing stack'/> + <field name='nodeInfoTab' type='xmlParserNodeInfo *' info=' array of nodeInfos'/> </struct> <typedef name='xmlParserCtxtPtr' file='tree' type='xmlParserCtxt *'/> <typedef name='xmlParserErrors' file='xmlerror' type='enum'/> @@ -7647,7 +7653,7 @@ Could we use @subtypes for this?'/> </function> <function name='htmlParseElement' file='HTMLparser' module='HTMLparser'> <cond>defined(LIBXML_HTML_ENABLED)</cond> - <info>parse an HTML element, this is highly recursive [39] element ::= EmptyElemTag | STag content ETag [41] Attribute ::= Name Eq AttValue</info> + <info>parse an HTML element, this is highly recursive this is kept for compatibility with previous code versions [39] element ::= EmptyElemTag | STag content ETag [41] Attribute ::= Name Eq AttValue</info> <return type='void'/> <arg name='ctxt' type='htmlParserCtxtPtr' info='an HTML parser context'/> </function> @@ -11621,7 +11627,7 @@ Could we use @subtypes for this?'/> <arg name='encoding' type='const char *' info='an optional encoding string'/> </function> <function name='xmlNodeGetBase' file='tree' module='tree'> - <info>Searches for the BASE URL. The code should work on both XML and HTML document even if base mechanisms are completely different. It returns the base as defined in RFC 2396 sections 5.1.1. Base URI within Document Content and 5.1.2. Base URI from the Encapsulating Entity However it does not return the document base (5.1.3), use xmlDocumentGetBase() for this</info> + <info>Searches for the BASE URL. The code should work on both XML and HTML document even if base mechanisms are completely different. It returns the base as defined in RFC 2396 sections 5.1.1. Base URI within Document Content and 5.1.2. Base URI from the Encapsulating Entity However it does not return the document base (5.1.3), use doc->URL in this case</info> <return type='xmlChar *' info='a pointer to the base URL, or NULL if not found It's up to the caller to free the memory with xmlFree().'/> <arg name='doc' type='xmlDocPtr' info='the document the node pertains to'/> <arg name='cur' type='xmlNodePtr' info='the node being checked'/> diff --git a/doc/libxml2-refs.xml b/doc/libxml2-refs.xml index 368c612b..3e26ec75 100644 --- a/doc/libxml2-refs.xml +++ b/doc/libxml2-refs.xml @@ -22,6 +22,7 @@ <reference name='HTML_PARSE_COMPACT' href='html/libxml-HTMLparser.html#HTML_PARSE_COMPACT'/> <reference name='HTML_PARSE_NOBLANKS' href='html/libxml-HTMLparser.html#HTML_PARSE_NOBLANKS'/> <reference name='HTML_PARSE_NOERROR' href='html/libxml-HTMLparser.html#HTML_PARSE_NOERROR'/> + <reference name='HTML_PARSE_NOIMPLIED' href='html/libxml-HTMLparser.html#HTML_PARSE_NOIMPLIED'/> <reference name='HTML_PARSE_NONET' href='html/libxml-HTMLparser.html#HTML_PARSE_NONET'/> <reference name='HTML_PARSE_NOWARNING' href='html/libxml-HTMLparser.html#HTML_PARSE_NOWARNING'/> <reference name='HTML_PARSE_PEDANTIC' href='html/libxml-HTMLparser.html#HTML_PARSE_PEDANTIC'/> @@ -3563,6 +3564,7 @@ <ref name='HTML_PARSE_COMPACT'/> <ref name='HTML_PARSE_NOBLANKS'/> <ref name='HTML_PARSE_NOERROR'/> + <ref name='HTML_PARSE_NOIMPLIED'/> <ref name='HTML_PARSE_NONET'/> <ref name='HTML_PARSE_NOWARNING'/> <ref name='HTML_PARSE_PEDANTIC'/> @@ -10622,6 +10624,7 @@ <ref name='HTML_PARSE_COMPACT'/> <ref name='HTML_PARSE_NOBLANKS'/> <ref name='HTML_PARSE_NOERROR'/> + <ref name='HTML_PARSE_NOIMPLIED'/> <ref name='HTML_PARSE_NONET'/> <ref name='HTML_PARSE_NOWARNING'/> <ref name='HTML_PARSE_PEDANTIC'/> @@ -16575,6 +16578,9 @@ <ref name='xmlNodeListGetString'/> <ref name='xmlXPathNewNodeSet'/> </word> + <word name='NodeInfo'> + <ref name='_xmlParserCtxt'/> + </word> <word name='NodeList'> <ref name='xmlXPathNodeSetGetLength'/> <ref name='xmlXPathNodeSetItem'/> @@ -20305,6 +20311,7 @@ </word> <word name='compatibility'> <ref name='LIBXML_LEGACY_ENABLED'/> + <ref name='htmlParseElement'/> <ref name='xmlChildrenNode'/> <ref name='xmlCopyChar'/> <ref name='xmlEncodeEntities'/> @@ -21655,6 +21662,7 @@ <ref name='xmlDocGetRootElement'/> <ref name='xmlDocSetRootElement'/> <ref name='xmlNewTextWriterTree'/> + <ref name='xmlNodeGetBase'/> </word> <word name='docs'> <ref name='xmlBuildRelativeURI'/> @@ -24225,6 +24233,7 @@ <ref name='_xmlXPathContext'/> <ref name='htmlAutoCloseTag'/> <ref name='htmlIsAutoClosed'/> + <ref name='htmlParseElement'/> <ref name='xmlKeepBlanksDefault'/> <ref name='xmlXPathOrderDocElems'/> </word> @@ -25384,6 +25393,9 @@ <ref name='xmlXPathLocalNameFunction'/> <ref name='xmlXPathNamespaceURIFunction'/> </word> + <word name='nodeInfos'> + <ref name='_xmlParserCtxt'/> + </word> <word name='nodelist'> <ref name='xmlParseBalancedChunkMemoryRecover'/> </word> @@ -25447,6 +25459,9 @@ <word name='non-null'> <ref name='xmlShellPrintNode'/> </word> + <word name='non-recursive'> + <ref name='_xmlParserCtxt'/> + </word> <word name='non-stateless'> <ref name='xmlCharEncOutFunc'/> </word> @@ -26525,6 +26540,7 @@ <ref name='_xmlEntity'/> <ref name='_xmlNode'/> <ref name='htmlHandleOmittedElem'/> + <ref name='htmlParseElement'/> <ref name='xmlAddPrevSibling'/> <ref name='xmlCatalogSetDebug'/> <ref name='xmlCatalogSetDefaultPrefer'/> @@ -29968,6 +29984,9 @@ <word name='various'> <ref name='_xmlDOMWrapCtxt'/> </word> + <word name='versions'> + <ref name='htmlParseElement'/> + </word> <word name='very'> <ref name='_htmlElemDesc'/> <ref name='_xmlParserInput'/> @@ -30613,9 +30632,6 @@ <ref name='xmlNewTextWriterTree'/> <ref name='xmlTextReaderCurrentDoc'/> </word> - <word name='xmlDocumentGetBase'> - <ref name='xmlNodeGetBase'/> - </word> <word name='xmlDtdPtr'> <ref name='xmlCopyDtd'/> <ref name='xmlIOParseDTD'/> diff --git a/python/setup.py b/python/setup.py index f80a66c4..6522a516 100755 --- a/python/setup.py +++ b/python/setup.py @@ -226,7 +226,7 @@ else: setup (name = "libxml2-python", # On *nix, the version number is created from setup.py.in # On windows, it is set by configure.js - version = "2.7.6", + version = "2.7.7", description = descr, author = "Daniel Veillard", author_email = "veillard@redhat.com", |