~ubuntu-branches/ubuntu/saucy/lxml/saucy-updates

« back to all changes in this revision

Viewing changes to src/lxml/parser.pxi

Committer: Package Import Robot
Author(s): Matthias Klose
Date: 2012-10-19 19:02:57 UTC
mfrom: (1.3.9)
Revision ID: package-import@ubuntu.com-20121019190257-ryczr7c7lbgrvi9h

Tags: 3.0.1-0ubuntu1

New upstream version.

files added:
doc/html/api/abc.ABCMeta-class.html

doc/html/api/lxml.cssselect.LxmlHTMLTranslator-class.html

doc/html/api/lxml.cssselect.LxmlTranslator-class.html

doc/html/api/lxml.etree._ElementMatchIterator-class.html

doc/html/api/lxml.includes-module.html

doc/html/api/lxml.includes-pysrc.html

doc/html/api/lxml.tests.common_imports.skipif-class.html

doc/html/api/lxml.tests.test_builder-module.html

doc/html/api/lxml.tests.test_builder-pysrc.html

doc/html/api/lxml.tests.test_builder.BuilderTestCase-class.html

doc/html/api/lxml.tests.test_elementtree._ETreeTestCaseBase-class.html

doc/html/api/lxml.tests.test_etree._XIncludeTestCase-class.html

doc/html/api/lxml.tests.test_io._IOTestCaseBase-class.html

doc/html/api/lxml.tests.test_xslt.ETreeEXSLTTestCase-class.html

doc/html/api/str-class.html

doc/html/api/toc-lxml.includes-module.html

doc/html/api/toc-lxml.tests.test_builder-module.html

doc/html/changes-3.0.1.html

src/lxml/cvarargs.pxd

src/lxml/debug.pxi

src/lxml/html/tests/test_html5parser.py

src/lxml/includes

src/lxml/includes/__init__.py

src/lxml/includes/c14n.pxd

src/lxml/includes/config.pxd

src/lxml/includes/dtdvalid.pxd

src/lxml/includes/etree_defs.h

src/lxml/includes/etreepublic.pxd

src/lxml/includes/htmlparser.pxd

src/lxml/includes/lxml-version.h

src/lxml/includes/relaxng.pxd

src/lxml/includes/schematron.pxd

src/lxml/includes/tree.pxd

src/lxml/includes/uri.pxd

src/lxml/includes/xinclude.pxd

src/lxml/includes/xmlerror.pxd

src/lxml/includes/xmlparser.pxd

src/lxml/includes/xmlschema.pxd

src/lxml/includes/xpath.pxd

src/lxml/includes/xslt.pxd

src/lxml/tests/shakespeare.html

src/lxml/tests/test_builder.py

files removed:
doc/html/api/lxml.cssselect.Attrib-class.html

doc/html/api/lxml.cssselect.Class-class.html

doc/html/api/lxml.cssselect.CombinedSelector-class.html

doc/html/api/lxml.cssselect.Element-class.html

doc/html/api/lxml.cssselect.ExpressionError-class.html

doc/html/api/lxml.cssselect.Function-class.html

doc/html/api/lxml.cssselect.Hash-class.html

doc/html/api/lxml.cssselect.Or-class.html

doc/html/api/lxml.cssselect.Pseudo-class.html

doc/html/api/lxml.cssselect.SelectorSyntaxError-class.html

doc/html/api/lxml.cssselect.String-class.html

doc/html/api/lxml.cssselect.Symbol-class.html

doc/html/api/lxml.cssselect.Token-class.html

doc/html/api/lxml.cssselect.TokenStream-class.html

doc/html/api/lxml.cssselect.XPathExpr-class.html

doc/html/api/lxml.cssselect.XPathExprOr-class.html

doc/html/api/lxml.cssselect._UniToken-class.html

doc/html/api/lxml.etree._AppendOnlyElementProxy-class.html

doc/html/api/lxml.etree._AttribIterator-class.html

doc/html/api/lxml.etree._BaseContext-class.html

doc/html/api/lxml.etree._ClassNamespaceRegistry-class.html

doc/html/api/lxml.etree._ExceptionContext-class.html

doc/html/api/lxml.etree._ExsltRegExp-class.html

doc/html/api/lxml.etree._FileReaderContext-class.html

doc/html/api/lxml.etree._FilelikeWriter-class.html

doc/html/api/lxml.etree._FunctionNamespaceRegistry-class.html

doc/html/api/lxml.etree._InputDocument-class.html

doc/html/api/lxml.etree._IterparseContext-class.html

doc/html/api/lxml.etree._ModifyContentOnlyEntityProxy-class.html

doc/html/api/lxml.etree._ModifyContentOnlyPIProxy-class.html

doc/html/api/lxml.etree._ModifyContentOnlyProxy-class.html

doc/html/api/lxml.etree._NamespaceRegistry-class.html

doc/html/api/lxml.etree._OpaqueDocumentWrapper-class.html

doc/html/api/lxml.etree._OpaqueNodeWrapper-class.html

doc/html/api/lxml.etree._ParserContext-class.html

doc/html/api/lxml.etree._ParserDictionaryContext-class.html

doc/html/api/lxml.etree._ParserSchemaValidationContext-class.html

doc/html/api/lxml.etree._PythonSaxParserTarget-class.html

doc/html/api/lxml.etree._ReadOnlyElementProxy-class.html

doc/html/api/lxml.etree._ReadOnlyEntityProxy-class.html

doc/html/api/lxml.etree._ReadOnlyPIProxy-class.html

doc/html/api/lxml.etree._ReadOnlyProxy-class.html

doc/html/api/lxml.etree._ResolverContext-class.html

doc/html/api/lxml.etree._ResolverRegistry-class.html

doc/html/api/lxml.etree._SaxParserContext-class.html

doc/html/api/lxml.etree._TargetParserContext-class.html

doc/html/api/lxml.etree._TempStore-class.html

doc/html/api/lxml.etree._XPathContext-class.html

doc/html/api/lxml.etree._XPathFunctionNamespaceRegistry-class.html

doc/html/api/lxml.etree._XSLTContext-class.html

doc/html/api/lxml.etree._XSLTQuotedStringParam-class.html

doc/html/api/lxml.etree._XSLTResolverContext-class.html

doc/html/api/lxml.etree.__ContentOnlyElement-class.html

doc/html/api/lxml.include-module.html

doc/html/api/lxml.include-pysrc.html

doc/html/api/lxml.tests.test_elementtree.ETreeTestCaseBase-class.html

doc/html/api/lxml.tests.test_etree.XIncludeTestCase-class.html

doc/html/api/lxml.tests.test_io.IOTestCaseBase-class.html

doc/html/api/toc-lxml.include-module.html

doc/html/changes-2.3.5.html

src/lxml/c14n.pxd

src/lxml/config.pxd

src/lxml/cstd.pxd

src/lxml/dtdvalid.pxd

src/lxml/etree_defs.h

src/lxml/etreepublic.pxd

src/lxml/html/_dictmixin.py

src/lxml/htmlparser.pxd

src/lxml/include

src/lxml/include/__init__.py

src/lxml/relaxng.pxd

src/lxml/schematron.pxd

src/lxml/tests/css_shakespear.html

src/lxml/tests/test_css.txt

src/lxml/tests/test_css_select.txt

src/lxml/tree.pxd

src/lxml/uri.pxd

src/lxml/xinclude.pxd

src/lxml/xmlerror.pxd

src/lxml/xmlparser.pxd

src/lxml/xmlschema.pxd

src/lxml/xpath.pxd

src/lxml/xslt.pxd

files modified:
CHANGES.txt

CREDITS.txt

INSTALL.txt

LICENSES.txt

Makefile

PKG-INFO

README.rst

TODO.txt

buildlibxml.py

debian/changelog

doc/FAQ.txt

doc/api.txt

doc/build.txt

doc/cssselect.txt

doc/extensions.txt

doc/html/FAQ.html

doc/html/api.html

doc/html/api/api-objects.txt

doc/html/api/class-tree.html

doc/html/api/deprecated-index.html

doc/html/api/exceptions.AssertionError-class.html

doc/html/api/help.html

doc/html/api/identifier-index-A.html

doc/html/api/identifier-index-B.html

doc/html/api/identifier-index-C.html

doc/html/api/identifier-index-D.html

doc/html/api/identifier-index-E.html

doc/html/api/identifier-index-F.html

doc/html/api/identifier-index-G.html

doc/html/api/identifier-index-H.html

doc/html/api/identifier-index-I.html

doc/html/api/identifier-index-J.html

doc/html/api/identifier-index-K.html

doc/html/api/identifier-index-L.html

doc/html/api/identifier-index-M.html

doc/html/api/identifier-index-N.html

doc/html/api/identifier-index-O.html

doc/html/api/identifier-index-P.html

doc/html/api/identifier-index-Q.html

doc/html/api/identifier-index-R.html

doc/html/api/identifier-index-S.html

doc/html/api/identifier-index-T.html

doc/html/api/identifier-index-U.html

doc/html/api/identifier-index-V.html

doc/html/api/identifier-index-W.html

doc/html/api/identifier-index-X.html

doc/html/api/identifier-index-Y.html

doc/html/api/identifier-index-Z.html

doc/html/api/identifier-index-_.html

doc/html/api/identifier-index.html

doc/html/api/lxml-module.html

doc/html/api/lxml-pysrc.html

doc/html/api/lxml.ElementInclude-module.html

doc/html/api/lxml.ElementInclude-pysrc.html

doc/html/api/lxml.ElementInclude.FatalIncludeError-class.html

doc/html/api/lxml.builder-module.html

doc/html/api/lxml.builder-pysrc.html

doc/html/api/lxml.builder.ElementMaker-class.html

doc/html/api/lxml.cssselect-module.html

doc/html/api/lxml.cssselect-pysrc.html

doc/html/api/lxml.cssselect.CSSSelector-class.html

doc/html/api/lxml.doctestcompare-module.html

doc/html/api/lxml.doctestcompare-pysrc.html

doc/html/api/lxml.doctestcompare.LHTMLOutputChecker-class.html

doc/html/api/lxml.doctestcompare.LXMLOutputChecker-class.html

doc/html/api/lxml.doctestcompare._RestoreChecker-class.html

doc/html/api/lxml.etree-module.html

doc/html/api/lxml.etree.AncestorsIterator-class.html

doc/html/api/lxml.etree.AttributeBasedElementClassLookup-class.html

doc/html/api/lxml.etree.C14NError-class.html

doc/html/api/lxml.etree.CDATA-class.html

doc/html/api/lxml.etree.CommentBase-class.html

doc/html/api/lxml.etree.CustomElementClassLookup-class.html

doc/html/api/lxml.etree.DTD-class.html

doc/html/api/lxml.etree.DTDError-class.html

doc/html/api/lxml.etree.DTDParseError-class.html

doc/html/api/lxml.etree.DTDValidateError-class.html

doc/html/api/lxml.etree.DocInfo-class.html

doc/html/api/lxml.etree.DocumentInvalid-class.html

doc/html/api/lxml.etree.ETCompatXMLParser-class.html

doc/html/api/lxml.etree.ETXPath-class.html

doc/html/api/lxml.etree.ElementBase-class.html

doc/html/api/lxml.etree.ElementChildIterator-class.html

doc/html/api/lxml.etree.ElementClassLookup-class.html

doc/html/api/lxml.etree.ElementDefaultClassLookup-class.html

doc/html/api/lxml.etree.ElementDepthFirstIterator-class.html

doc/html/api/lxml.etree.ElementNamespaceClassLookup-class.html

doc/html/api/lxml.etree.ElementTextIterator-class.html

doc/html/api/lxml.etree.EntityBase-class.html

doc/html/api/lxml.etree.Error-class.html

doc/html/api/lxml.etree.ErrorDomains-class.html

doc/html/api/lxml.etree.ErrorLevels-class.html

doc/html/api/lxml.etree.ErrorTypes-class.html

doc/html/api/lxml.etree.FallbackElementClassLookup-class.html

doc/html/api/lxml.etree.HTMLParser-class.html

doc/html/api/lxml.etree.LxmlError-class.html

doc/html/api/lxml.etree.LxmlRegistryError-class.html

doc/html/api/lxml.etree.LxmlSyntaxError-class.html

doc/html/api/lxml.etree.NamespaceRegistryError-class.html

doc/html/api/lxml.etree.PIBase-class.html

doc/html/api/lxml.etree.ParseError-class.html

doc/html/api/lxml.etree.ParserBasedElementClassLookup-class.html

doc/html/api/lxml.etree.ParserError-class.html

doc/html/api/lxml.etree.PyErrorLog-class.html

doc/html/api/lxml.etree.PythonElementClassLookup-class.html

doc/html/api/lxml.etree.QName-class.html

doc/html/api/lxml.etree.RelaxNG-class.html

doc/html/api/lxml.etree.RelaxNGError-class.html

doc/html/api/lxml.etree.RelaxNGErrorTypes-class.html

doc/html/api/lxml.etree.RelaxNGParseError-class.html

doc/html/api/lxml.etree.RelaxNGValidateError-class.html

doc/html/api/lxml.etree.Resolver-class.html

doc/html/api/lxml.etree.Schematron-class.html

doc/html/api/lxml.etree.SchematronError-class.html

doc/html/api/lxml.etree.SchematronParseError-class.html

doc/html/api/lxml.etree.SchematronValidateError-class.html

doc/html/api/lxml.etree.SerialisationError-class.html

doc/html/api/lxml.etree.SiblingsIterator-class.html

doc/html/api/lxml.etree.TreeBuilder-class.html

doc/html/api/lxml.etree.XInclude-class.html

doc/html/api/lxml.etree.XIncludeError-class.html

doc/html/api/lxml.etree.XMLParser-class.html

doc/html/api/lxml.etree.XMLSchema-class.html

doc/html/api/lxml.etree.XMLSchemaError-class.html

doc/html/api/lxml.etree.XMLSchemaParseError-class.html

doc/html/api/lxml.etree.XMLSchemaValidateError-class.html

doc/html/api/lxml.etree.XMLSyntaxError-class.html

doc/html/api/lxml.etree.XPath-class.html

doc/html/api/lxml.etree.XPathDocumentEvaluator-class.html

doc/html/api/lxml.etree.XPathElementEvaluator-class.html

doc/html/api/lxml.etree.XPathError-class.html

doc/html/api/lxml.etree.XPathEvalError-class.html

doc/html/api/lxml.etree.XPathFunctionError-class.html

doc/html/api/lxml.etree.XPathResultError-class.html

doc/html/api/lxml.etree.XPathSyntaxError-class.html

doc/html/api/lxml.etree.XSLT-class.html

doc/html/api/lxml.etree.XSLTAccessControl-class.html

doc/html/api/lxml.etree.XSLTApplyError-class.html

doc/html/api/lxml.etree.XSLTError-class.html

doc/html/api/lxml.etree.XSLTExtension-class.html

doc/html/api/lxml.etree.XSLTExtensionError-class.html

doc/html/api/lxml.etree.XSLTParseError-class.html

doc/html/api/lxml.etree.XSLTSaveError-class.html

doc/html/api/lxml.etree._Attrib-class.html

doc/html/api/lxml.etree._BaseErrorLog-class.html

doc/html/api/lxml.etree._BaseParser-class.html

doc/html/api/lxml.etree._Comment-class.html

doc/html/api/lxml.etree._Document-class.html

doc/html/api/lxml.etree._DomainErrorLog-class.html

doc/html/api/lxml.etree._Element-class.html

doc/html/api/lxml.etree._ElementIterator-class.html

doc/html/api/lxml.etree._ElementStringResult-class.html

doc/html/api/lxml.etree._ElementTagMatcher-class.html

doc/html/api/lxml.etree._ElementTree-class.html

doc/html/api/lxml.etree._ElementUnicodeResult-class.html

doc/html/api/lxml.etree._Entity-class.html

doc/html/api/lxml.etree._ErrorLog-class.html

doc/html/api/lxml.etree._FeedParser-class.html

doc/html/api/lxml.etree._IDDict-class.html

doc/html/api/lxml.etree._ListErrorLog-class.html

doc/html/api/lxml.etree._LogEntry-class.html

doc/html/api/lxml.etree._ProcessingInstruction-class.html

doc/html/api/lxml.etree._RotatingErrorLog-class.html

doc/html/api/lxml.etree._SaxParserTarget-class.html

doc/html/api/lxml.etree._TargetParserResult-class.html

doc/html/api/lxml.etree._Validator-class.html

doc/html/api/lxml.etree._XPathEvaluatorBase-class.html

doc/html/api/lxml.etree._XSLTProcessingInstruction-class.html

doc/html/api/lxml.etree._XSLTResultTree-class.html

doc/html/api/lxml.etree.iterparse-class.html

doc/html/api/lxml.etree.iterwalk-class.html

doc/html/api/lxml.html-module.html

doc/html/api/lxml.html-pysrc.html

doc/html/api/lxml.html.CheckboxGroup-class.html

doc/html/api/lxml.html.CheckboxValues-class.html

doc/html/api/lxml.html.ElementSoup-module.html

doc/html/api/lxml.html.ElementSoup-pysrc.html

doc/html/api/lxml.html.FieldsDict-class.html

doc/html/api/lxml.html.FormElement-class.html

doc/html/api/lxml.html.HTMLParser-class.html

doc/html/api/lxml.html.HtmlComment-class.html

doc/html/api/lxml.html.HtmlElement-class.html

doc/html/api/lxml.html.HtmlElementClassLookup-class.html

doc/html/api/lxml.html.HtmlEntity-class.html

doc/html/api/lxml.html.HtmlMixin-class.html

doc/html/api/lxml.html.HtmlProcessingInstruction-class.html

doc/html/api/lxml.html.InputElement-class.html

doc/html/api/lxml.html.InputGetter-class.html

doc/html/api/lxml.html.InputMixin-class.html

doc/html/api/lxml.html.LabelElement-class.html

doc/html/api/lxml.html.MultipleSelectOptions-class.html

doc/html/api/lxml.html.RadioGroup-class.html

doc/html/api/lxml.html.SelectElement-class.html

doc/html/api/lxml.html.TextareaElement-class.html

doc/html/api/lxml.html.XHTMLParser-class.html

doc/html/api/lxml.html._MethodFunc-class.html

doc/html/api/lxml.html.builder-module.html

doc/html/api/lxml.html.builder-pysrc.html

doc/html/api/lxml.html.clean-module.html

doc/html/api/lxml.html.clean-pysrc.html

doc/html/api/lxml.html.clean.Cleaner-class.html

doc/html/api/lxml.html.defs-module.html

doc/html/api/lxml.html.defs-pysrc.html

doc/html/api/lxml.html.diff-module.html

doc/html/api/lxml.html.diff-pysrc.html

doc/html/api/lxml.html.diff.DEL_END-class.html

doc/html/api/lxml.html.diff.DEL_START-class.html

doc/html/api/lxml.html.diff.InsensitiveSequenceMatcher-class.html

doc/html/api/lxml.html.diff.NoDeletes-class.html

doc/html/api/lxml.html.diff.href_token-class.html

doc/html/api/lxml.html.diff.tag_token-class.html

doc/html/api/lxml.html.diff.token-class.html

doc/html/api/lxml.html.formfill-module.html

doc/html/api/lxml.html.formfill-pysrc.html

doc/html/api/lxml.html.formfill.DefaultErrorCreator-class.html

doc/html/api/lxml.html.formfill.FormNotFound-class.html

doc/html/api/lxml.html.html5parser-module.html

doc/html/api/lxml.html.html5parser-pysrc.html

doc/html/api/lxml.html.html5parser.HTMLParser-class.html

doc/html/api/lxml.html.html5parser.XHTMLParser-class.html

doc/html/api/lxml.html.soupparser-module.html

doc/html/api/lxml.html.soupparser-pysrc.html

doc/html/api/lxml.html.usedoctest-module.html

doc/html/api/lxml.html.usedoctest-pysrc.html

doc/html/api/lxml.isoschematron-module.html

doc/html/api/lxml.isoschematron-pysrc.html

doc/html/api/lxml.isoschematron.Schematron-class.html

doc/html/api/lxml.objectify-module.html

doc/html/api/lxml.objectify.BoolElement-class.html

doc/html/api/lxml.objectify.ElementMaker-class.html

doc/html/api/lxml.objectify.FloatElement-class.html

doc/html/api/lxml.objectify.IntElement-class.html

doc/html/api/lxml.objectify.LongElement-class.html

doc/html/api/lxml.objectify.NoneElement-class.html

doc/html/api/lxml.objectify.NumberElement-class.html

doc/html/api/lxml.objectify.ObjectPath-class.html

doc/html/api/lxml.objectify.ObjectifiedDataElement-class.html

doc/html/api/lxml.objectify.ObjectifiedElement-class.html

doc/html/api/lxml.objectify.ObjectifyElementClassLookup-class.html

doc/html/api/lxml.objectify.PyType-class.html

doc/html/api/lxml.objectify.StringElement-class.html

doc/html/api/lxml.objectify._ObjectifyElementMakerCaller-class.html

doc/html/api/lxml.pyclasslookup-module.html

doc/html/api/lxml.pyclasslookup-pysrc.html

doc/html/api/lxml.sax-module.html

doc/html/api/lxml.sax-pysrc.html

doc/html/api/lxml.sax.ElementTreeContentHandler-class.html

doc/html/api/lxml.sax.ElementTreeProducer-class.html

doc/html/api/lxml.sax.SaxError-class.html

doc/html/api/lxml.tests-module.html

doc/html/api/lxml.tests-pysrc.html

doc/html/api/lxml.tests.common_imports-module.html

doc/html/api/lxml.tests.common_imports-pysrc.html

doc/html/api/lxml.tests.common_imports.HelperTestCase-class.html

doc/html/api/lxml.tests.common_imports.LargeFileLike-class.html

doc/html/api/lxml.tests.common_imports.LargeFileLikeUnicode-class.html

doc/html/api/lxml.tests.common_imports.SillyFileLike-class.html

doc/html/api/lxml.tests.test_classlookup-module.html

doc/html/api/lxml.tests.test_classlookup-pysrc.html

doc/html/api/lxml.tests.test_classlookup.ClassLookupTestCase-class.html

doc/html/api/lxml.tests.test_css-module.html

doc/html/api/lxml.tests.test_css-pysrc.html

doc/html/api/lxml.tests.test_css.CSSTestCase-class.html

doc/html/api/lxml.tests.test_dtd-module.html

doc/html/api/lxml.tests.test_dtd-pysrc.html

doc/html/api/lxml.tests.test_dtd.ETreeDtdTestCase-class.html

doc/html/api/lxml.tests.test_elementtree-module.html

doc/html/api/lxml.tests.test_elementtree-pysrc.html

doc/html/api/lxml.tests.test_elementtree.CElementTreeTestCase-class.html

doc/html/api/lxml.tests.test_elementtree.ETreeTestCase-class.html

doc/html/api/lxml.tests.test_elementtree.ElementTreeTestCase-class.html

doc/html/api/lxml.tests.test_errors-module.html

doc/html/api/lxml.tests.test_errors-pysrc.html

doc/html/api/lxml.tests.test_errors.ErrorTestCase-class.html

doc/html/api/lxml.tests.test_etree-module.html

doc/html/api/lxml.tests.test_etree-pysrc.html

doc/html/api/lxml.tests.test_etree.ETreeC14NTestCase-class.html

doc/html/api/lxml.tests.test_etree.ETreeErrorLogTest-class.html

doc/html/api/lxml.tests.test_etree.ETreeOnlyTestCase-class.html

doc/html/api/lxml.tests.test_etree.ETreeWriteTestCase-class.html

doc/html/api/lxml.tests.test_etree.ETreeXIncludeTestCase-class.html

doc/html/api/lxml.tests.test_etree.ElementIncludeTestCase-class.html

doc/html/api/lxml.tests.test_htmlparser-module.html

doc/html/api/lxml.tests.test_htmlparser-pysrc.html

doc/html/api/lxml.tests.test_htmlparser.HtmlParserTestCase-class.html

doc/html/api/lxml.tests.test_io-module.html

doc/html/api/lxml.tests.test_io-pysrc.html

doc/html/api/lxml.tests.test_io.ETreeIOTestCase-class.html

doc/html/api/lxml.tests.test_io.ElementTreeIOTestCase-class.html

doc/html/api/lxml.tests.test_isoschematron-module.html

doc/html/api/lxml.tests.test_isoschematron-pysrc.html

doc/html/api/lxml.tests.test_isoschematron.ETreeISOSchematronTestCase-class.html

doc/html/api/lxml.tests.test_nsclasses-module.html

doc/html/api/lxml.tests.test_nsclasses-pysrc.html

doc/html/api/lxml.tests.test_nsclasses.ETreeNamespaceClassesTestCase-class.html

doc/html/api/lxml.tests.test_nsclasses.ETreeNamespaceClassesTestCase.bluff_class-class.html

doc/html/api/lxml.tests.test_nsclasses.ETreeNamespaceClassesTestCase.default_class-class.html

doc/html/api/lxml.tests.test_nsclasses.ETreeNamespaceClassesTestCase.maeh_class-class.html

doc/html/api/lxml.tests.test_objectify-module.html

doc/html/api/lxml.tests.test_objectify-pysrc.html

doc/html/api/lxml.tests.test_objectify.ObjectifyTestCase-class.html

doc/html/api/lxml.tests.test_pyclasslookup-module.html

doc/html/api/lxml.tests.test_pyclasslookup-pysrc.html

doc/html/api/lxml.tests.test_pyclasslookup.PyClassLookupTestCase-class.html

doc/html/api/lxml.tests.test_relaxng-module.html

doc/html/api/lxml.tests.test_relaxng-pysrc.html

doc/html/api/lxml.tests.test_relaxng.ETreeRelaxNGTestCase-class.html

doc/html/api/lxml.tests.test_sax-module.html

doc/html/api/lxml.tests.test_sax-pysrc.html

doc/html/api/lxml.tests.test_sax.ETreeSaxTestCase-class.html

doc/html/api/lxml.tests.test_schematron-module.html

doc/html/api/lxml.tests.test_schematron-pysrc.html

doc/html/api/lxml.tests.test_schematron.ETreeSchematronTestCase-class.html

doc/html/api/lxml.tests.test_threading-module.html

doc/html/api/lxml.tests.test_threading-pysrc.html

doc/html/api/lxml.tests.test_threading.ThreadPipelineTestCase-class.html

doc/html/api/lxml.tests.test_threading.ThreadPipelineTestCase.ParseAndExtendWorker-class.html

doc/html/api/lxml.tests.test_threading.ThreadPipelineTestCase.ParseWorker-class.html

doc/html/api/lxml.tests.test_threading.ThreadPipelineTestCase.ReverseWorker-class.html

doc/html/api/lxml.tests.test_threading.ThreadPipelineTestCase.RotateWorker-class.html

doc/html/api/lxml.tests.test_threading.ThreadPipelineTestCase.SerialiseWorker-class.html

doc/html/api/lxml.tests.test_threading.ThreadPipelineTestCase.Worker-class.html

doc/html/api/lxml.tests.test_threading.ThreadingTestCase-class.html

doc/html/api/lxml.tests.test_unicode-module.html

doc/html/api/lxml.tests.test_unicode-pysrc.html

doc/html/api/lxml.tests.test_unicode.UnicodeTestCase-class.html

doc/html/api/lxml.tests.test_xmlschema-module.html

doc/html/api/lxml.tests.test_xmlschema-pysrc.html

doc/html/api/lxml.tests.test_xmlschema.ETreeXMLSchemaResolversTestCase-class.html

doc/html/api/lxml.tests.test_xmlschema.ETreeXMLSchemaResolversTestCase.simple_resolver-class.html

doc/html/api/lxml.tests.test_xmlschema.ETreeXMLSchemaTestCase-class.html

doc/html/api/lxml.tests.test_xpathevaluator-module.html

doc/html/api/lxml.tests.test_xpathevaluator-pysrc.html

doc/html/api/lxml.tests.test_xpathevaluator.ETreeETXPathClassTestCase-class.html

doc/html/api/lxml.tests.test_xpathevaluator.ETreeXPathClassTestCase-class.html

doc/html/api/lxml.tests.test_xpathevaluator.ETreeXPathExsltTestCase-class.html

doc/html/api/lxml.tests.test_xpathevaluator.ETreeXPathTestCase-class.html

doc/html/api/lxml.tests.test_xslt-module.html

doc/html/api/lxml.tests.test_xslt-pysrc.html

doc/html/api/lxml.tests.test_xslt.ETreeXSLTExtElementTestCase-class.html

doc/html/api/lxml.tests.test_xslt.ETreeXSLTExtFuncTestCase-class.html

doc/html/api/lxml.tests.test_xslt.ETreeXSLTTestCase-class.html

doc/html/api/lxml.tests.test_xslt.Py3XSLTTestCase-class.html

doc/html/api/lxml.usedoctest-module.html

doc/html/api/lxml.usedoctest-pysrc.html

doc/html/api/module-tree.html

doc/html/api/redirect.html

doc/html/api/toc-everything.html

doc/html/api/toc-lxml.builder-module.html

doc/html/api/toc-lxml.cssselect-module.html

doc/html/api/toc-lxml.etree-module.html

doc/html/api/toc-lxml.html-module.html

doc/html/api/toc-lxml.html.clean-module.html

doc/html/api/toc-lxml.html.diff-module.html

doc/html/api/toc-lxml.html.formfill-module.html

doc/html/api/toc-lxml.html.html5parser-module.html

doc/html/api/toc-lxml.isoschematron-module.html

doc/html/api/toc-lxml.tests.common_imports-module.html

doc/html/api/toc-lxml.tests.test_css-module.html

doc/html/api/toc-lxml.tests.test_elementtree-module.html

doc/html/api/toc-lxml.tests.test_etree-module.html

doc/html/api/toc-lxml.tests.test_htmlparser-module.html

doc/html/api/toc-lxml.tests.test_io-module.html

doc/html/api/toc-lxml.tests.test_unicode-module.html

doc/html/api/toc-lxml.tests.test_xslt-module.html

doc/html/api/toc.html

doc/html/api/xml.etree.ElementTree-module.html

doc/html/api/xml.etree.ElementTree-pysrc.html

doc/html/api/xml.etree.ElementTree.Element-class.html

doc/html/api/xml.etree.ElementTree.ElementTree-class.html

doc/html/api/xml.etree.ElementTree.ParseError-class.html

doc/html/api/xml.etree.ElementTree.QName-class.html

doc/html/api/xml.etree.ElementTree.TreeBuilder-class.html

doc/html/api/xml.etree.ElementTree.XMLParser-class.html

doc/html/api/xml.etree.ElementTree._IterParseIterator-class.html

doc/html/api/xml.etree.ElementTree._SimpleElementPath-class.html

doc/html/build.html

doc/html/capi.html

doc/html/compatibility.html

doc/html/credits.html

doc/html/cssselect.html

doc/html/element_classes.html

doc/html/elementsoup.html

doc/html/extensions.html

doc/html/html5parser.html

doc/html/index.html

doc/html/installation.html

doc/html/intro.html

doc/html/lxml-source-howto.html

doc/html/lxmlhtml.html

doc/html/objectify.html

doc/html/parsing.html

doc/html/performance.html

doc/html/resolvers.html

doc/html/sax.html

doc/html/sitemap.html

doc/html/tutorial.html

doc/html/validation.html

doc/html/xpathxslt.html

doc/main.txt

doc/mkhtml.py

doc/objectify.txt

doc/parsing.txt

doc/tutorial.txt

doc/validation.txt

setup.py

setupinfo.py

src/lxml.egg-info/PKG-INFO

src/lxml.egg-info/SOURCES.txt

src/lxml/__init__.py

src/lxml/_elementpath.py

src/lxml/apihelpers.pxi

src/lxml/builder.py

src/lxml/classlookup.pxi

src/lxml/cleanup.pxi

src/lxml/cssselect.py

src/lxml/docloader.pxi

src/lxml/dtd.pxi

src/lxml/extensions.pxi

src/lxml/html/__init__.py

src/lxml/html/clean.py

src/lxml/html/diff.py

src/lxml/html/formfill.py

src/lxml/html/html5parser.py

src/lxml/html/tests/test_basic.txt

src/lxml/html/tests/test_diff.txt

src/lxml/html/tests/test_forms.txt

src/lxml/isoschematron/__init__.py

src/lxml/iterparse.pxi

src/lxml/lxml.etree.c

src/lxml/lxml.etree.h

src/lxml/lxml.etree.pyx

src/lxml/lxml.etree_api.h

src/lxml/lxml.objectify.c

src/lxml/lxml.objectify.pyx

src/lxml/nsclasses.pxi

src/lxml/objectpath.pxi

src/lxml/parser.pxi

src/lxml/parsertarget.pxi

src/lxml/proxy.pxi

src/lxml/public-api.pxi

src/lxml/python.pxd

src/lxml/readonlytree.pxi

src/lxml/relaxng.pxi

src/lxml/saxparser.pxi

src/lxml/schematron.pxi

src/lxml/serializer.pxi

src/lxml/tests/common_imports.py

src/lxml/tests/test.dtd

src/lxml/tests/test_css.py

src/lxml/tests/test_dtd.py

src/lxml/tests/test_elementtree.py

src/lxml/tests/test_etree.py

src/lxml/tests/test_htmlparser.py

src/lxml/tests/test_io.py

src/lxml/tests/test_objectify.py

src/lxml/tests/test_threading.py

src/lxml/tests/test_unicode.py

src/lxml/tests/test_xslt.py

src/lxml/xinclude.pxi

src/lxml/xmlerror.pxi

src/lxml/xmlid.pxi

src/lxml/xmlschema.pxi

src/lxml/xpath.pxi

src/lxml/xslt.pxi

src/lxml/xsltext.pxi

update-error-constants.py

version.txt

versioninfo.py

Show diffs side-by-side

added added

removed removed

src/lxml/parser.pxi

# Parsers for XML and HTML

cimport xmlparser

cimport htmlparser

from lxml.includes cimport xmlparser

from lxml.includes cimport htmlparser

cdef class _ParserContext(_ResolverContext)

cdef class _SaxParserContext(_ParserContext)

"""

pass

@cython.final

@cython.internal

cdef class _ParserDictionaryContext:

# Global parser context to share the string dictionary.

183

185

__GLOBAL_PARSER_CONTEXT = _ParserDictionaryContext()

184

186

__GLOBAL_PARSER_CONTEXT.initMainParserContext()

185

187

186

cdef int _checkThreadDict(tree.xmlDict* c_dict):

187

u"""Check that c_dict is either the local thread dictionary or the global

188

parent dictionary.

189

"""

190

#if __GLOBAL_PARSER_CONTEXT._c_dict is c_dict:

191

# return 1 # main thread

192

if __GLOBAL_PARSER_CONTEXT._getThreadDict(NULL) is c_dict:

193

return 1 # local thread dict

194

return 0

195

196

188

############################################################

197

189

## support for Python unicode I/O

198

190

############################################################

199

191

200

192

# name of Python unicode encoding as known to libxml2

201

cdef char* _UNICODE_ENCODING = NULL

193

cdef const_char* _UNICODE_ENCODING = NULL

202

194

203

195

cdef int _setupPythonUnicode() except -1:

204

196

u"""Sets _UNICODE_ENCODING to the internal encoding name of Python unicode

208

200

"""

209

201

cdef tree.xmlCharEncodingHandler* enchandler

210

202

cdef Py_ssize_t l

211

cdef char* buffer

212

cdef char* enc

203

cdef const_char* buffer

204

cdef const_char* enc

213

205

utext = python.PyUnicode_DecodeUTF8("<test/>", 7, NULL)

214

206

l = python.PyUnicode_GET_DATA_SIZE(utext)

215

207

buffer = python.PyUnicode_AS_DATA(utext)

234

226

_UNICODE_ENCODING = enc

235

227

return 0

236

228

237

cdef char* _findEncodingName(char* buffer, int size):

229

cdef const_char* _findEncodingName(const_char* buffer, int size):

238

230

u"Work around bug in libxml2: find iconv name of encoding on our own."

239

231

cdef tree.xmlCharEncoding enc

240

enc = tree.xmlDetectCharEncoding(buffer, size)

232

enc = tree.xmlDetectCharEncoding(<const_xmlChar*>buffer, size)

241

233

if enc == tree.XML_CHAR_ENCODING_UTF16LE:

242

234

return "UTF-16LE"

243

235

elif enc == tree.XML_CHAR_ENCODING_UTF16BE:

258

250

## support for file-like objects

259

251

############################################################

260

252

253

@cython.final

254

@cython.internal

261

255

cdef class _FileReaderContext:

262

256

cdef object _filelike

263

257

cdef object _encoding

295

289

close()

296

290

297

291

cdef xmlparser.xmlParserInputBuffer* _createParserInputBuffer(self):

298

cdef cstd.FILE* c_stream

292

cdef stdio.FILE* c_stream

299

293

cdef xmlparser.xmlParserInputBuffer* c_buffer

300

294

c_buffer = xmlparser.xmlAllocParserInputBuffer(0)

301

295

c_stream = python.PyFile_AsFile(self._filelike)

322

316

cdef xmlDoc* _readDoc(self, xmlparser.xmlParserCtxt* ctxt, int options):

323

317

cdef xmlDoc* result

324

318

cdef char* c_encoding

325

cdef cstd.FILE* c_stream

319

cdef stdio.FILE* c_stream

326

320

cdef xmlparser.xmlInputReadCallback c_read_callback

327

321

cdef xmlparser.xmlInputCloseCallback c_close_callback

328

322

cdef void* c_callback_context

368

362

remaining = byte_count - self._bytes_read

369

363

while c_requested > remaining:

370

364

c_start = _cstr(self._bytes) + self._bytes_read

371

cstd.memcpy(c_buffer, c_start, remaining)

365

cstring_h.memcpy(c_buffer, c_start, remaining)

372

366

c_byte_count += remaining

373

367

c_buffer += remaining

374

368

c_requested -= remaining

395

389

396

390

if c_requested > 0:

397

391

c_start = _cstr(self._bytes) + self._bytes_read

398

cstd.memcpy(c_buffer, c_start, c_requested)

392

cstring_h.memcpy(c_buffer, c_start, c_requested)

399

393

c_byte_count += c_requested

400

394

self._bytes_read += c_requested

401

395

return c_byte_count

408

402

return (<_FileReaderContext>ctxt).copyToBuffer(c_buffer, c_size)

409

403

410

404

cdef int _readFileParser(void* ctxt, char* c_buffer, int c_size) nogil:

411

return cstd.fread(c_buffer, 1, c_size, <cstd.FILE*>ctxt)

405

return stdio.fread(c_buffer, 1, c_size, <stdio.FILE*>ctxt)

412

406

413

407

############################################################

414

408

## support for custom document loaders

415

409

############################################################

416

410

417

cdef xmlparser.xmlParserInput* _local_resolver(char* c_url, char* c_pubid,

411

cdef xmlparser.xmlParserInput* _local_resolver(const_char* c_url, const_char* c_pubid,

418

412

xmlparser.xmlParserCtxt* c_context) with gil:

419

413

cdef _ResolverContext context

420

414

cdef xmlparser.xmlParserInput* c_input

438

432

url = None

439

433

else:

440

434

# parsing a related document (DTD etc.) => UTF-8 encoded URL?

441

url = _decodeFilename(c_url)

435

url = _decodeFilename(<const_xmlChar*>c_url)

442

436

if c_pubid is NULL:

443

437

pubid = None

444

438

else:

445

pubid = funicode(c_pubid) # always UTF-8

439

pubid = funicode(<const_xmlChar*>c_pubid) # always UTF-8

446

440

447

441

doc_ref = context._resolvers.resolve(url, pubid, context)

448

442

except:

454

448

data = doc_ref._data_bytes

455

449

c_input = xmlparser.xmlNewInputStream(c_context)

456

450

if c_input is not NULL:

457

c_input.base = _cstr(data)

451

c_input.base = _xcstr(data)

458

452

c_input.length = python.PyBytes_GET_SIZE(data)

459

453

c_input.cur = c_input.base

460

c_input.end = &c_input.base[c_input.length]

454

c_input.end = c_input.base + c_input.length

461

455

elif doc_ref._type == PARSER_DATA_FILENAME:

462

456

data = None

463

457

c_input = xmlparser.xmlNewInputFromFile(

483

477

cdef xmlparser.xmlExternalEntityLoader __DEFAULT_ENTITY_LOADER

484

478

__DEFAULT_ENTITY_LOADER = xmlparser.xmlGetExternalEntityLoader()

485

479

486

xmlparser.xmlSetExternalEntityLoader(_local_resolver)

480

xmlparser.xmlSetExternalEntityLoader(<xmlparser.xmlExternalEntityLoader>_local_resolver)

487

481

488

482

############################################################

489

483

## Parsers

490

484

############################################################

491

485

486

@cython.internal

492

487

cdef class _ParserContext(_ResolverContext):

493

488

cdef _ErrorLog _error_log

494

489

cdef _ParserSchemaValidationContext _validator

538

533

self._lock, python.WAIT_LOCK)

539

534

if result == 0:

540

535

raise ParserError, u"parser locking failed"

541

self._error_log.connect()

536

self._error_log.clear()

537

self._c_ctxt.sax.serror = _receiveParserError

542

538

if self._validator is not None:

543

self._validator.connect(self._c_ctxt)

539

self._validator.connect(self._c_ctxt, self._error_log)

544

540

return 0

545

541

546

542

cdef int cleanup(self) except -1:

548

544

self._validator.disconnect()

549

545

self._resetParserContext()

550

546

self.clear()

551

self._error_log.disconnect()

547

self._c_ctxt.sax.serror = NULL

552

548

if config.ENABLE_THREADING and self._lock is not NULL:

553

549

python.PyThread_release_lock(self._lock)

554

550

return 0

576

572

if c_ctxt is not NULL:

577

573

context._initParserContext(c_ctxt)

578

574

575

cdef void _forwardParserError(xmlparser.xmlParserCtxt* _parser_context, xmlerror.xmlError* error) with gil:

576

(<_ParserContext>_parser_context._private)._error_log._receive(error)

577

578

cdef void _receiveParserError(void* c_context, xmlerror.xmlError* error) nogil:

579

if __DEBUG:

580

if c_context is NULL or (<xmlparser.xmlParserCtxt*>c_context)._private is NULL:

581

_forwardError(NULL, error)

582

else:

583

_forwardParserError(<xmlparser.xmlParserCtxt*>c_context, error)

584

579

585

cdef int _raiseParseError(xmlparser.xmlParserCtxt* ctxt, filename,

580

586

_ErrorLog error_log) except 0:

581

587

if filename is not None and \

618

624

if context._validator is not None and \

619

625

not context._validator.isvalid():

620

626

well_formed = 0 # actually not 'valid', but anyway ...

621

elif recover or (c_ctxt.wellFormed and \

622

c_ctxt.lastError.level < xmlerror.XML_ERR_ERROR):

627

elif recover or (c_ctxt.wellFormed and

628

c_ctxt.lastError.level < xmlerror.XML_ERR_ERROR):

623

629

well_formed = 1

624

630

elif not c_ctxt.replaceEntities and not c_ctxt.validate \

625

631

and context is not None:

652

658

_raiseParseError(c_ctxt, filename, None)

653

659

else:

654

660

if result.URL is NULL and filename is not None:

655

result.URL = tree.xmlStrdup(_cstr(filename))

661

result.URL = tree.xmlStrdup(_xcstr(filename))

656

662

if result.encoding is NULL:

657

result.encoding = tree.xmlStrdup("UTF-8")

663

result.encoding = tree.xmlStrdup(<unsigned char*>"UTF-8")

658

664

659

665

if context._validator is not None and \

660

666

context._validator._add_default_attributes:

680

686

cdef inline int _fixHtmlDictNodeNames(tree.xmlDict* c_dict,

681

687

xmlNode* c_node) nogil:

682

688

cdef xmlNode* c_attr

683

cdef char* c_name

684

689

c_name = tree.xmlDictLookup(c_dict, c_node.name, -1)

685

690

if c_name is NULL:

686

691

return -1

687

692

if c_name is not c_node.name:

688

tree.xmlFree(c_node.name)

693

tree.xmlFree(<char*>c_node.name)

689

694

c_node.name = c_name

690

695

c_attr = <xmlNode*>c_node.properties

691

696

while c_attr is not NULL:

693

698

if c_name is NULL:

694

699

return -1

695

700

if c_name is not c_attr.name:

696

tree.xmlFree(c_attr.name)

701

tree.xmlFree(<char*>c_attr.name)

697

702

c_attr.name = c_name

698

703

c_attr = c_attr.next

699

704

return 0

754

759

self._parse_options & xmlparser.XML_PARSE_DTDATTR)

755

760

pctxt = self._newParserCtxt()

756

761

if pctxt is NULL:

757

python.PyErr_NoMemory()

762

raise MemoryError()

758

763

_initParserContext(self._parser_context, self._resolvers, pctxt)

759

764

if self._remove_comments:

760

765

pctxt.sax.comment = NULL

775

780

self._parse_options & xmlparser.XML_PARSE_DTDATTR)

776

781

pctxt = self._newPushParserCtxt()

777

782

if pctxt is NULL:

778

python.PyErr_NoMemory()

783

raise MemoryError()

779

784

_initParserContext(

780

785

self._push_parser_context, self._resolvers, pctxt)

781

786

if self._remove_comments:

795

800

context._setTarget(target)

796

801

return context

797

802

803

cdef int _registerHtmlErrorHandler(self, xmlparser.xmlParserCtxt* c_ctxt) except -1:

804

cdef xmlparser.xmlSAXHandler* sax = c_ctxt.sax

805

if sax is not NULL and sax.initialized and sax.initialized != xmlparser.XML_SAX2_MAGIC:

806

# need to extend SAX1 context to SAX2 to get proper error reports

807

if <xmlparser.xmlSAXHandlerV1*>sax is &htmlparser.htmlDefaultSAXHandler:

808

sax = <xmlparser.xmlSAXHandler*> stdlib.malloc(sizeof(xmlparser.xmlSAXHandler))

809

if sax is NULL:

810

raise MemoryError()

811

cstring_h.memcpy(sax, &htmlparser.htmlDefaultSAXHandler,

812

sizeof(htmlparser.htmlDefaultSAXHandler))

813

c_ctxt.sax = sax

814

sax.initialized = xmlparser.XML_SAX2_MAGIC

815

sax.serror = _receiveParserError

816

sax.startElementNs = NULL

817

sax.endElementNs = NULL

818

sax._private = NULL

819

return 0

820

798

821

cdef xmlparser.xmlParserCtxt* _newParserCtxt(self):

822

cdef xmlparser.xmlParserCtxt* c_ctxt

799

823

if self._for_html:

800

return htmlparser.htmlCreateMemoryParserCtxt('dummy', 5)

824

c_ctxt = htmlparser.htmlCreateMemoryParserCtxt('dummy', 5)

825

self._registerHtmlErrorHandler(c_ctxt)

801

826

else:

802

return xmlparser.xmlNewParserCtxt()

827

c_ctxt = xmlparser.xmlNewParserCtxt()

828

return c_ctxt

803

829

804

830

cdef xmlparser.xmlParserCtxt* _newPushParserCtxt(self):

805

831

cdef xmlparser.xmlParserCtxt* c_ctxt

806

cdef char* c_filename

807

if self._filename is not None:

808

c_filename = _cstr(self._filename)

809

else:

810

c_filename = NULL

832

cdef char* c_filename = _cstr(self._filename) if self._filename is not None else NULL

811

833

if self._for_html:

812

834

c_ctxt = htmlparser.htmlCreatePushParserCtxt(

813

835

NULL, NULL, NULL, 0, c_filename, tree.XML_CHAR_ENCODING_NONE)

814

836

if c_ctxt is not NULL:

837

self._registerHtmlErrorHandler(c_ctxt)

815

838

htmlparser.htmlCtxtUseOptions(c_ctxt, self._parse_options)

816

839

else:

817

840

c_ctxt = xmlparser.xmlCreatePushParserCtxt(

893

916

cdef xmlparser.xmlParserCtxt* pctxt

894

917

cdef Py_ssize_t py_buffer_len

895

918

cdef int buffer_len

896

cdef char* c_text

919

cdef const_char* c_text

897

920

py_buffer_len = python.PyUnicode_GET_DATA_SIZE(utext)

898

if py_buffer_len > python.INT_MAX or _UNICODE_ENCODING is NULL:

921

if py_buffer_len > limits.INT_MAX or _UNICODE_ENCODING is NULL:

899

922

text_utf = python.PyUnicode_AsUTF8String(utext)

900

923

py_buffer_len = python.PyBytes_GET_SIZE(text_utf)

901

924

return self._parseDoc(_cstr(text_utf), py_buffer_len, c_filename)

934

957

cdef xmlDoc* result

935

958

cdef xmlparser.xmlParserCtxt* pctxt

936

959

cdef char* c_encoding

937

if c_len > python.INT_MAX:

960

if c_len > limits.INT_MAX:

938

961

raise ParserError, u"string is too long to parse it with libxml2"

939

962

940

963

context = self._getParserContext()

1065

1088

cdef _ParserContext context

1066

1089

cdef xmlparser.xmlParserCtxt* pctxt

1067

1090

cdef Py_ssize_t py_buffer_len

1068

cdef char* c_data

1069

cdef char* c_encoding

1091

cdef const_char* c_data

1092

cdef const_char* c_encoding

1070

1093

cdef int buffer_len

1071

1094

cdef int error

1072

1095

cdef bint recover = self._parse_options & xmlparser.XML_PARSE_RECOVER

1094

1117

context.prepare()

1095

1118

self._feed_parser_running = 1

1096

1119

__GLOBAL_PARSER_CONTEXT.initParserDict(pctxt)

1097

1098

if py_buffer_len > python.INT_MAX:

1099

buffer_len = python.INT_MAX

1100

else:

1101

buffer_len = <int>py_buffer_len

1102

1120

if self._for_html:

1103

error = _htmlCtxtResetPush(pctxt, c_data, buffer_len,

1104

c_encoding, self._parse_options)

1121

error = _htmlCtxtResetPush(

1122

pctxt, NULL, 0, c_encoding, self._parse_options)

1105

1123

else:

1106

1124

xmlparser.xmlCtxtUseOptions(pctxt, self._parse_options)

1107

1125

error = xmlparser.xmlCtxtResetPush(

1108

pctxt, c_data, buffer_len, NULL, c_encoding)

1109

py_buffer_len -= buffer_len

1110

c_data += buffer_len

1126

pctxt, NULL, 0, NULL, c_encoding)

1111

1127

1112

1128

#print pctxt.charset, 'NONE' if c_encoding is NULL else c_encoding

1113

1129

1114

1130

while py_buffer_len > 0 and (error == 0 or recover):

1115

1131

with nogil:

1116

if py_buffer_len > python.INT_MAX:

1117

buffer_len = python.INT_MAX

1132

if py_buffer_len > limits.INT_MAX:

1133

buffer_len = limits.INT_MAX

1118

1134

else:

1119

1135

buffer_len = <int>py_buffer_len

1120

1136

if self._for_html:

1178

1194

return result

1179

1195

1180

1196

cdef int _htmlCtxtResetPush(xmlparser.xmlParserCtxt* c_ctxt,

1181

char* c_data, int buffer_len,

1182

char* c_encoding, int parse_options) except -1:

1197

const_char* c_data, int buffer_len,

1198

const_char* c_encoding, int parse_options) except -1:

1183

1199

cdef xmlparser.xmlParserInput* c_input_stream

1184

1200

# libxml2 crashes if spaceTab is not initialised

1185

1201

if _LIBXML_VERSION_INT < 20629 and c_ctxt.spaceTab is NULL:

1444

1460

c_filename = _cstr(filename_utf)

1445

1461

if python.PyUnicode_Check(text):

1446

1462

c_len = python.PyUnicode_GET_DATA_SIZE(text)

1447

if c_len > python.INT_MAX:

1463

if c_len > limits.INT_MAX:

1448

1464

return (<_BaseParser>parser)._parseDocFromFilelike(

1449

1465

StringIO(text), filename)

1450

1466

return (<_BaseParser>parser)._parseUnicodeDoc(text, c_filename)

1451

1467

else:

1452

1468

c_len = python.PyBytes_GET_SIZE(text)

1453

if c_len > python.INT_MAX:

1469

if c_len > limits.INT_MAX:

1454

1470

return (<_BaseParser>parser)._parseDocFromFilelike(

1455

1471

BytesIO(text), filename)

1456

1472

c_text = _cstr(text)

1471

1487

cdef xmlDoc* result

1472

1488

result = tree.xmlNewDoc(NULL)

1473

1489

if result is NULL:

1474

python.PyErr_NoMemory()

1490

raise MemoryError()

1475

1491

if result.encoding is NULL:

1476

result.encoding = tree.xmlStrdup("UTF-8")

1492

result.encoding = tree.xmlStrdup(<unsigned char*>"UTF-8")

1477

1493

__GLOBAL_PARSER_CONTEXT.initDocDict(result)

1478

1494

return result

1479

1495

1481

1497

cdef xmlDoc* result

1482

1498

result = tree.htmlNewDoc(NULL, NULL)

1483

1499

if result is NULL:

1484

python.PyErr_NoMemory()

1500

raise MemoryError()

1485

1501

__GLOBAL_PARSER_CONTEXT.initDocDict(result)

1486

1502

return result

1487

1503

1493

1509

else:

1494

1510

result = tree.xmlCopyDoc(c_doc, 0)

1495

1511

if result is NULL:

1496

python.PyErr_NoMemory()

1512

raise MemoryError()

1497

1513

__GLOBAL_PARSER_CONTEXT.initDocDict(result)

1498

1514

return result

1499

1515

1506

1522

with nogil:

1507

1523

c_node = tree.xmlDocCopyNode(c_new_root, result, 1) # recursive

1508

1524

if c_node is NULL:

1509

python.PyErr_NoMemory()

1525

raise MemoryError()

1510

1526

tree.xmlDocSetRootElement(result, c_node)

1511

1527

_copyTail(c_new_root.next, c_node)

1512

1528

return result

1516

1532

cdef xmlNode* c_root

1517

1533

c_root = tree.xmlDocCopyNode(c_node, c_doc, 1) # recursive

1518

1534

if c_root is NULL:

1519

python.PyErr_NoMemory()

1535

raise MemoryError()

1520

1536

_copyTail(c_node.next, c_root)

1521

1537

return c_root

1522

1538

1535

1551

if base_url is not None:

1536

1552

base_url = _encodeFilenameUTF8(base_url)

1537

1553

if doc._c_doc.URL is not NULL:

1538

tree.xmlFree(doc._c_doc.URL)

1539

doc._c_doc.URL = tree.xmlStrdup(_cstr(base_url))

1554

tree.xmlFree(<char*>doc._c_doc.URL)

1555

doc._c_doc.URL = tree.xmlStrdup(_xcstr(base_url))

1540

1556

return doc

1541

1557

1542

1558

if base_url is not None:

1555

1571

return _parseFilelikeDocument(

1556

1572

source, _encodeFilenameUTF8(url), parser)

1557

1573

1558

raise TypeError, u"cannot parse from '%s'" % funicode(python._fqtypename(source))

1574

raise TypeError, u"cannot parse from '%s'" % python._fqtypename(source).decode('UTF-8')

1559

1575

1560

1576

cdef _Document _parseDocumentFromURL(url, _BaseParser parser):

1561

1577

cdef xmlDoc* c_doc

Older »