~ubuntu-branches/ubuntu/precise/xom/precise

« back to all changes in this revision

Viewing changes to src/nu/xom/canonical/Canonicalizer.java

Committer: Bazaar Package Importer
Author(s): Varun Hiremath
Date: 2007-11-25 15:50:40 UTC
Revision ID: james.westby@ubuntu.com-20071125155040-r75ikcqf1vu0cei7

Tags: upstream-1.1

Import upstream version 1.1

files added:

LICENSE.txt

README.txt

Todo.txt

build.xml

classes15

classes15/nu

classes15/nu/xom

data

data/!file.xml

data/$file.xml

data/%file.xml

data/&file.xml

data/'file.xml

data/()file.xml

data/+file.xml

data/097.ent

data/097.xml

data/;file.xml

data/=file.xml

data/@file.xml

data/BaseURIWithEntitiesTest.xml

data/[file].xml

data/^file.xml

data/`file.xml

data/baserelative

data/baserelative/dir

data/baserelative/dir/test.dtd

data/baserelative/test.xml

data/canonical

data/canonical/input

data/canonical/input/commentbeforeroot.xml

data/canonical/input/doc.dtd

data/canonical/input/emptyelement.xml

data/canonical/input/escapeattributevalue.xml

data/canonical/input/rootelementindefaultnamespace.xml

data/canonical/input/specialcharactersinattributevalue.xml

data/canonical/input/spectest1.xml

data/canonical/input/test3.3.xml

data/canonical/input/test3.4.xml

data/canonical/input/test3.5.xml

data/canonical/input/test3.6.xml

data/canonical/input/world.txt

data/canonical/output

data/canonical/output/commentbeforeroot.xml.out

data/canonical/output/emptyelement.xml.out

data/canonical/output/escapeattributevalue.xml.out

data/canonical/output/rootelementindefaultnamespace.xml.out

data/canonical/output/specialcharactersinattributevalue.xml.out

data/canonical/output/spectest1.xml.out

data/canonical/output/test3.3.xml.out

data/canonical/output/test3.4.xml.out

data/canonical/output/test3.5.xml.out

data/canonical/output/test3.6.xml.out

data/canonical/wocommentsoutput

data/canonical/wocommentsoutput/commentbeforeroot.xml.out

data/canonical/wocommentsoutput/emptyelement.xml.out

data/canonical/wocommentsoutput/escapeattributevalue.xml.out

data/canonical/wocommentsoutput/rootelementindefaultnamespace.xml.out

data/canonical/wocommentsoutput/specialcharactersinattributevalue.xml.out

data/canonical/wocommentsoutput/spectest1.xml.out

data/canonical/wocommentsoutput/test3.3.xml.out

data/canonical/wocommentsoutput/test3.4.xml.out

data/canonical/wocommentsoutput/test3.5.xml.out

data/canonical/wocommentsoutput/test3.6.xml.out

data/comp.xml

data/content.dtd

data/contentindtd.xml

data/data_ISO-8859-2.txt

data/data_ISO-8859-2.xml

data/data_ISO-8859-7.xml

data/data_ISO-8859-8.xml

data/data_UTF-8.xml

data/dtd

data/dtd/xhtml-lat1.ent

data/dtd/xhtml-special.ent

data/dtd/xhtml-symbol.ent

data/dtd/xhtml1-strict.dtd

data/dtd/xhtml1-transitional.dtd

data/dtdtest.xhtml

data/ent21.xml

data/entities

data/entities/external.xml

data/entitytest.xml

data/external.dtd

data/external.xml

data/externalDTDtest.xml

data/fibonacci_ebcdic.txt

data/file name.xml

data/ge.dtd

data/ge.txt

data/ge.xml

data/hoschektest.xml

data/internalandexternaldtdsubsettest.xml

data/internaldtdsubsettest.xml

data/namespacetest.xsl

data/nfctest.xml

data/nfctests.xml

data/outer21.xml

data/pe.dtd

data/pe.txt

data/pe.xml

data/prettytest.xml

data/prettyxml.xml

data/rddltest.html

data/schematest.xml

data/schematest.xsd

data/simplehoschektest.xml

data/soapresponse.xml

data/test.xml

data/test_ebcdic.xml

data/undeclare.xml

data/xinclude

data/xinclude/debug

data/xinclude/input

data/xinclude/input/EBCDIC.xml

data/xinclude/input/UCS4BE.xml

data/xinclude/input/UCS4LE.xml

data/xinclude/input/UTF16BigEndianWithByteOrderMark.xml

data/xinclude/input/UTF16LittleEndianWithByteOrderMark.xml

data/xinclude/input/UTF32BE.xml

data/xinclude/input/UTF32LE.xml

data/xinclude/input/UTF8WithByteOrderMark.xml

data/xinclude/input/UnicodeBigUnmarked.xml

data/xinclude/input/UnicodeLittleUnmarked.xml

data/xinclude/input/_0123456789.txt

data/xinclude/input/_ABCDEFGHIJKLMNOPQRSTUVWXYZ.txt

data/xinclude/input/a

data/xinclude/input/a/a.xml

data/xinclude/input/abcdefghijklmnopqrstuvwxyz.txt

data/xinclude/input/acceptenglish.xml

data/xinclude/input/acceptfrench.xml

data/xinclude/input/accepthtml.xml

data/xinclude/input/acceptplaintext.xml

data/xinclude/input/b

data/xinclude/input/b/b.xml

data/xinclude/input/badelementschemedata.xml

data/xinclude/input/badencoding.xml

data/xinclude/input/badparseattribute.xml

data/xinclude/input/badxptr.xml

data/xinclude/input/badxptr2.xml

data/xinclude/input/badxptr3.xml

data/xinclude/input/badxptr4.xml

data/xinclude/input/basedata

data/xinclude/input/basedata/red.xml

data/xinclude/input/baseinclude.xml

data/xinclude/input/basewithfragmentid.xml

data/xinclude/input/basewithfragmentidchild.xml

data/xinclude/input/bdisclaimer.xml

data/xinclude/input/c1.xml

data/xinclude/input/c2.xml

data/xinclude/input/c3.xml

data/xinclude/input/c5.xml

data/xinclude/input/circle1.xml

data/xinclude/input/circle2a.xml

data/xinclude/input/circle2b.xml

data/xinclude/input/circleback.xml

data/xinclude/input/circlepointer1.xml

data/xinclude/input/circlepointer2.xml

data/xinclude/input/circlepointer3.xml

data/xinclude/input/colonizedschemename.xml

data/xinclude/input/count.txt

data/xinclude/input/d1.xml

data/xinclude/input/data.xml

data/xinclude/input/digitencoding.xml

data/xinclude/input/disclaimer.xml

data/xinclude/input/docwith2id.xml

data/xinclude/input/docwithid.xml

data/xinclude/input/docwithidandtumbler.xml

data/xinclude/input/docwithxmlid.xml

data/xinclude/input/emptyencoding.xml

data/xinclude/input/emptyfallback.xml

data/xinclude/input/encodingheuristicstest.xml

data/xinclude/input/extraattributes.xml

data/xinclude/input/fallbackbadparseattribute.xml

data/xinclude/input/fallbackbadxpointer.xml

data/xinclude/input/fallbackcontainsfallback.xml

data/xinclude/input/fallbackinternalxpointer.xml

data/xinclude/input/fallbacknohreforparse.xml

data/xinclude/input/fallbacktest.xml

data/xinclude/input/fallbacktest2.xml

data/xinclude/input/fallbacktest3.xml

data/xinclude/input/fallbacktotext.xml

data/xinclude/input/fallbackxpointerpointsnowhere.xml

data/xinclude/input/french.xml

data/xinclude/input/french2.xml

data/xinclude/input/hiddenerror.xml

data/xinclude/input/hiddenerror2.xml

data/xinclude/input/hiddenerror3.xml

data/xinclude/input/ignoresfragmentid.xml

data/xinclude/input/includedocumentwithintradocumentreferences.xml

data/xinclude/input/includefromsamedocumentwithbase.xml

data/xinclude/input/internalcircular.xml

data/xinclude/input/internalcircularviaancestor.xml

data/xinclude/input/langtest1.xml

data/xinclude/input/langtest2.xml

data/xinclude/input/langtest3.xml

data/xinclude/input/laterfailure.xml

data/xinclude/input/laterfailure2.xml

data/xinclude/input/latin1.xml

data/xinclude/input/legalcircle.xml

data/xinclude/input/lineends.txt

data/xinclude/input/lineends.xml

data/xinclude/input/lowercasealphabet.xml

data/xinclude/input/lowerpunctuation.xml

data/xinclude/input/marshtest.xml

data/xinclude/input/marshtestwithxmlbase.xml

data/xinclude/input/marshtestwithxmlbaseandemptyhref.xml

data/xinclude/input/meaninglessfragmentid.xml

data/xinclude/input/metafallbacktest.xml

data/xinclude/input/metafallbacktest2.xml

data/xinclude/input/metafallbacktest3.xml

data/xinclude/input/metafallbacktest4.xml

data/xinclude/input/metafallbacktest5.xml

data/xinclude/input/metafallbacktest6.xml

data/xinclude/input/metafallbacktestwithfragmentid.xml

data/xinclude/input/metafallbacktestwithxpointer.xml

data/xinclude/input/metafallbacktestwithxpointer2.xml

data/xinclude/input/metafallbacktotexttest.xml

data/xinclude/input/metafallbackwithbadxpointertest.xml

data/xinclude/input/metamissingfallbacktestwithxpointer.xml

data/xinclude/input/middlepunctuationerror.xml

data/xinclude/input/missingfile.xml

data/xinclude/input/missinghref.xml

data/xinclude/input/multiplefallbacks.xml

data/xinclude/input/multiplefallbacks2.xml

data/xinclude/input/nakedfallback.xml

data/xinclude/input/namespaceinner.xml

data/xinclude/input/namespacetest.xml

data/xinclude/input/nestedxinclude.xml

data/xinclude/input/nestedxincludenamespace.xml

data/xinclude/input/nofallbacktest.xml

data/xinclude/input/nolang.xml

data/xinclude/input/numeric.xml

data/xinclude/input/onedown.xml

data/xinclude/input/onlyxpointer.xml

data/xinclude/input/paralleltest.xml

data/xinclude/input/parseequalxml.xml

data/xinclude/input/punctuation.xml

data/xinclude/input/recursewithinsamedocument.xml

data/xinclude/input/red.dtd

data/xinclude/input/relative.xml

data/xinclude/input/resolvethruxpointer.xml

data/xinclude/input/rootfailuretest.xml

data/xinclude/input/roottest.xml

data/xinclude/input/roottest2.xml

data/xinclude/input/simple.xml

data/xinclude/input/simple2.xml

data/xinclude/input/test.xml

data/xinclude/input/test0.xml

data/xinclude/input/test2.xml

data/xinclude/input/test3.xml

data/xinclude/input/text

data/xinclude/input/text/.AppleFileInfo

data/xinclude/input/text/.AppleFileInfo/UnicodeBigUnmarked.xml..RF

data/xinclude/input/text/.AppleFileInfo/UnicodeLittleUnmarked.xml..RF

data/xinclude/input/text/EBCDIC.xml

data/xinclude/input/text/UTF32BE.xml

data/xinclude/input/text/UTF32LE.xml

data/xinclude/input/text/UTF8.xml

data/xinclude/input/text/UnicodeBigUnmarked.xml

data/xinclude/input/text/UnicodeLittleUnmarked.xml

data/xinclude/input/tobinbottom.xml

data/xinclude/input/tobinmiddle.xml

data/xinclude/input/tobintop.xml

data/xinclude/input/toplevel.xml

data/xinclude/input/ucs4bigendian.xml

data/xinclude/input/ucs4littleendian.xml

data/xinclude/input/unrecognizedscheme.xml

data/xinclude/input/unrecognizedschemewithfallback.xml

data/xinclude/input/uppercase.txt

data/xinclude/input/uppercasealphabet.xml

data/xinclude/input/utf16.txt

data/xinclude/input/utf16.xml

data/xinclude/input/utf16be.txt

data/xinclude/input/utf16be.xml

data/xinclude/input/utf16le.xml

data/xinclude/input/utf8.xml

data/xinclude/input/utf8bom.xml

data/xinclude/input/xmlbasetest.xml

data/xinclude/input/xmlbasetest2.xml

data/xinclude/input/xmlbasetest3.xml

data/xinclude/input/xmlidtest.xml

data/xinclude/input/xpointeroverridesfragmentid.xml

data/xinclude/input/xpointerselectsnonelements.xml

data/xinclude/input/xpointerwithpercentescape.xml

data/xinclude/input/xptr2tumblertest.xml

data/xinclude/input/xptrdoublechildsequence.xml

data/xinclude/input/xptrdoubleelementtest.xml

data/xinclude/input/xptrdoubletumblertest.xml

data/xinclude/input/xptrfallback.xml

data/xinclude/input/xptridandtumblertest.xml

data/xinclude/input/xptridtest.xml

data/xinclude/input/xptridtest2.xml

data/xinclude/input/xptrsyntaxerrorbutfallback.xml

data/xinclude/input/xptrtumblerfailsbutfallback.xml

data/xinclude/input/xptrtumblertest.xml

data/xinclude/input/xptrtumblertest2.xml

data/xinclude/input/xptrtumblertest3.xml

data/xinclude/output

data/xinclude/output/EBCDIC.xml

data/xinclude/output/UTF16BigEndianWithByteOrderMark.xml

data/xinclude/output/UTF16LittleEndianWithByteOrderMark.xml

data/xinclude/output/UTF32BE.xml

data/xinclude/output/UTF32LE.xml

data/xinclude/output/UTF8WithByteOrderMark.xml

data/xinclude/output/UnicodeBigUnmarked.xml

data/xinclude/output/UnicodeLittleUnmarked.xml

data/xinclude/output/acceptascii.xml

data/xinclude/output/acceptenglish.xml

data/xinclude/output/acceptfrench.xml

data/xinclude/output/accepthtml.xml

data/xinclude/output/acceptjis.xml

data/xinclude/output/acceptplaintext.xml

data/xinclude/output/badelementschemedata.xml

data/xinclude/output/basewithfragmentid.xml

data/xinclude/output/c1.xml

data/xinclude/output/c1a.xml

data/xinclude/output/c1b.xml

data/xinclude/output/c2.xml

data/xinclude/output/c2a.xml

data/xinclude/output/c2b.xml

data/xinclude/output/c2c.xml

data/xinclude/output/c2d.xml

data/xinclude/output/c3.xml

data/xinclude/output/c5.xml

data/xinclude/output/d1.xml

data/xinclude/output/disclaimer.xml

data/xinclude/output/emptyfallback.xml

data/xinclude/output/encodingheuristicstest.xml

data/xinclude/output/fallbacktest.xml

data/xinclude/output/fallbacktest2.xml

data/xinclude/output/ignoresfragmentid.xml

data/xinclude/output/includedocumentwithintradocumentreferences.xml

data/xinclude/output/includefromsamedocumentwithbase.xml

data/xinclude/output/langtest1.xml

data/xinclude/output/langtest2.xml

data/xinclude/output/langtest3.xml

data/xinclude/output/latin1.xml

data/xinclude/output/legalcircle.xml

data/xinclude/output/lineends.xml

data/xinclude/output/lowercasealphabet.xml

data/xinclude/output/lowerpunctuation.xml

data/xinclude/output/marshtest.xml

data/xinclude/output/marshtestwithxmlbase.xml

data/xinclude/output/metafallbacktest.xml

data/xinclude/output/metafallbacktest2.xml

data/xinclude/output/metafallbacktest5.xml

data/xinclude/output/metafallbacktest6.xml

data/xinclude/output/metafallbacktestwithxpointer.xml

data/xinclude/output/metafallbacktestwithxpointer2.xml

data/xinclude/output/metafallbacktotexttest.xml

data/xinclude/output/middlepunctuation.xml

data/xinclude/output/namespacetest.xml

data/xinclude/output/numeric.xml

data/xinclude/output/onlyxpointer.xml

data/xinclude/output/paralleltest.xml

data/xinclude/output/punctuation.xml

data/xinclude/output/recursewithinsamedocument.xml

data/xinclude/output/relative.xml

data/xinclude/output/resolvethruxpointer.xml

data/xinclude/output/roottest.xml

data/xinclude/output/roottest2.xml

data/xinclude/output/simple.xml

data/xinclude/output/test.xml

data/xinclude/output/tobintop.xml

data/xinclude/output/triple.xml

data/xinclude/output/unrecognizedschemewithfallback.xml

data/xinclude/output/uppercasealphabet.xml

data/xinclude/output/utf16.txt

data/xinclude/output/utf16.xml

data/xinclude/output/xmlbasetest.xml

data/xinclude/output/xmlbasetest2.xml

data/xinclude/output/xmlbasetest3.xml

data/xinclude/output/xmlidtest.xml

data/xinclude/output/xpointeroverridesfragmentid.xml

data/xinclude/output/xptrdandtumblertest.xml

data/xinclude/output/xptrdoubleelementtest.xml

data/xinclude/output/xptrfallback.xml

data/xinclude/output/xptridandtumblertest.xml

data/xinclude/output/xptridtest.xml

data/xinclude/output/xptridtest2.xml

data/xinclude/output/xptrtumblertest.xml

data/xmlbasetest.xml

data/xmlid

data/xmlid/catalog.xml

data/xmlid/tests

data/xmlid/tests/001_normalize.xml

data/xmlid/tests/002_undecl.xml

data/xmlid/tests/003_dtd.xml

data/xmlid/tests/004_schema.xml

data/xmlid/tests/005_errdtdbad.xml

data/xmlid/tests/005_errdup.xml

data/xmlid/tests/006_errschemabad.xml

data/xmlid/tests/007_errdup.xml

data/xmlid/tests/008_ok10.xml

data/xmlid/tests/009_ok11.xml

data/xmlid/tests/010_okxref.xml

data/xmlid/tests/011_oknormalize.xml

data/xmlid/tests/badschema.xsd

data/xmlid/tests/badxml.xsd

data/xmlid/tests/schema.xsd

data/xmlid/tests/xml.xsd

data/xmlspacetest.xml

data/xslt

data/xslt/debug

data/xslt/debug/8-12.xml

data/xslt/debug/8-15.xml

data/xslt/debug/8-8.xml

data/xslt/input

data/xslt/input/8-1.xml

data/xslt/input/8-10.xsl

data/xslt/input/8-12.xsl

data/xslt/input/8-14.xml

data/xslt/input/8-15.xsl

data/xslt/input/8-2.xsl

data/xslt/input/8-4.xsl

data/xslt/input/8-5.xsl

data/xslt/input/8-6.xsl

data/xslt/input/8-7.xsl

data/xslt/input/8-8.xsl

data/xslt/input/commentwithparent.xsl

data/xslt/input/fragment.xsl

data/xslt/input/id_transform.xsl

data/xslt/input/identity.xsl

data/xslt/input/illegaltransform.xsl

data/xslt/input/namespaceparamtest.xsl

data/xslt/input/paramtest.xsl

data/xslt/input/piwithparent.xsl

data/xslt/input/singlestring.xsl

data/xslt/input/textmethod.xsl

data/xslt/output

data/xslt/output/8-12.xml

data/xslt/output/8-15.xml

data/xslt/output/8-8.xml

data/xslt/output/8-8c.xml

data/xtest.xml

data/{file}.xml

fatsrc

fatsrc/nu

fatsrc/nu/xom

fatsrc/nu/xom/Text.java

lgpl.txt

lib/LICENSE-DOM.html

lib/LICENSE-Jaxen.txt

lib/LICENSE-SAX.html

lib/XalanLicense.txt

lib/XercesLicense.txt

lib/junit_license.html

overview.html

project.xml

src/nu

src/nu/xom

src/nu/xom/ASCIIWriter.java

src/nu/xom/Attribute.java

src/nu/xom/Builder.java

src/nu/xom/CDATASection.java

src/nu/xom/Comment.java

src/nu/xom/CycleException.java

src/nu/xom/DocType.java

src/nu/xom/Document.java

src/nu/xom/DocumentFragment.java

src/nu/xom/EBCDICWriter.java

src/nu/xom/Element.java

src/nu/xom/Elements.java

src/nu/xom/GenericWriter.java

src/nu/xom/ISOArabicWriter.java

src/nu/xom/ISOCyrillicWriter.java

src/nu/xom/ISOGreekWriter.java

src/nu/xom/ISOHebrewWriter.java

src/nu/xom/ISOThaiWriter.java

src/nu/xom/IllegalAddException.java

src/nu/xom/IllegalCharacterDataException.java

src/nu/xom/IllegalDataException.java

src/nu/xom/IllegalNameException.java

src/nu/xom/IllegalTargetException.java

src/nu/xom/Info.java

src/nu/xom/JaxenConnector.java

src/nu/xom/JaxenNavigator.java

src/nu/xom/Latin10Writer.java

src/nu/xom/Latin1Writer.java

src/nu/xom/Latin2Writer.java

src/nu/xom/Latin3Writer.java

src/nu/xom/Latin4Writer.java

src/nu/xom/Latin5Writer.java

src/nu/xom/Latin6Writer.java

src/nu/xom/Latin7Writer.java

src/nu/xom/Latin8Writer.java

src/nu/xom/Latin9Writer.java

src/nu/xom/MalformedURIException.java

src/nu/xom/MultipleParentException.java

src/nu/xom/Namespace.java

src/nu/xom/NamespaceConflictException.java

src/nu/xom/Namespaces.java

src/nu/xom/NoSuchAttributeException.java

src/nu/xom/NoSuchChildException.java

src/nu/xom/Node.java

src/nu/xom/NodeFactory.java

src/nu/xom/Nodes.java

src/nu/xom/NonVerifyingHandler.java

src/nu/xom/ParentNode.java

src/nu/xom/ParsingException.java

src/nu/xom/ProcessingInstruction.java

src/nu/xom/Serializer.java

src/nu/xom/Text.java

src/nu/xom/TextWriter.java

src/nu/xom/TextWriterFactory.java

src/nu/xom/UCSWriter.java

src/nu/xom/URIUtil.java

src/nu/xom/UnavailableCharacterException.java

src/nu/xom/UnicodeUtil.java

src/nu/xom/UnicodeWriter.java

src/nu/xom/UnsynchronizedBufferedWriter.java

src/nu/xom/ValidityException.java

src/nu/xom/Verifier.java

src/nu/xom/WellformednessException.java

src/nu/xom/XML1_0Parser.java

src/nu/xom/XMLException.java

src/nu/xom/XOMHandler.java

src/nu/xom/XPathContext.java

src/nu/xom/XPathException.java

src/nu/xom/XPathTypeException.java

src/nu/xom/benchmarks

src/nu/xom/benchmarks/BigText.java

src/nu/xom/benchmarks/DOMConverterBench.java

src/nu/xom/benchmarks/DocumentModifier.java

src/nu/xom/benchmarks/ElementCopyBench.java

src/nu/xom/benchmarks/FastReproducer.java

src/nu/xom/benchmarks/MemoryTest.java

src/nu/xom/benchmarks/Reproducer.java

src/nu/xom/benchmarks/ToXMLBench.java

src/nu/xom/benchmarks/TreeWalker.java

src/nu/xom/benchmarks/package.html

src/nu/xom/canonical

src/nu/xom/canonical/CanonicalizationException.java

src/nu/xom/canonical/Canonicalizer.java

src/nu/xom/canonical/package.html

src/nu/xom/characters.dat

src/nu/xom/compositions.dat

src/nu/xom/converters

src/nu/xom/converters/DOMConverter.java

src/nu/xom/converters/SAXConverter.java

src/nu/xom/converters/package.html

src/nu/xom/doc-files

src/nu/xom/doc-files/xom.png

src/nu/xom/package.html

src/nu/xom/samples

src/nu/xom/samples/Account.java

src/nu/xom/samples/Agency.java

src/nu/xom/samples/AttributesToElements.java

src/nu/xom/samples/AttributesXMLBudget.java

src/nu/xom/samples/Budget.java

src/nu/xom/samples/BudgetData.java

src/nu/xom/samples/Bureau.java

src/nu/xom/samples/CanonicalizerDriver.java

src/nu/xom/samples/CommentReader.java

src/nu/xom/samples/CrimsonPrinter.java

src/nu/xom/samples/DTDGenerator.java

src/nu/xom/samples/DatabaseBuilder.java

src/nu/xom/samples/DatabaseConverter.java

src/nu/xom/samples/DocumentMerger.java

src/nu/xom/samples/EZSerializer.java

src/nu/xom/samples/ElementLister.java

src/nu/xom/samples/EncodingDemo.java

src/nu/xom/samples/ExampleExtractor.java

src/nu/xom/samples/ExampleLister.java

src/nu/xom/samples/FibonacciAttributes.java

src/nu/xom/samples/FibonacciEBCDIC.java

src/nu/xom/samples/FibonacciFile.java

src/nu/xom/samples/FibonacciLatin1.java

src/nu/xom/samples/FibonacciSOAPClient.java

src/nu/xom/samples/FibonacciServlet.java

src/nu/xom/samples/FibonacciXML.java

src/nu/xom/samples/FibonacciXMLRPCClient.java

src/nu/xom/samples/FibonacciXOMSOAPServlet.java

src/nu/xom/samples/FibonacciXOMXMLRPCServlet.java

src/nu/xom/samples/FilterDriver.java

src/nu/xom/samples/FlatXMLBudget.java

src/nu/xom/samples/HelloNamespaces.java

src/nu/xom/samples/HelloWorld.java

src/nu/xom/samples/HelloXMLBase.java

src/nu/xom/samples/HierarchicalXMLBudget.java

src/nu/xom/samples/IDFilter.java

src/nu/xom/samples/IDTagger.java

src/nu/xom/samples/Linkset.java

src/nu/xom/samples/MathMLFibonacci.java

src/nu/xom/samples/MinimalNodeFactory.java

src/nu/xom/samples/NodeLister.java

src/nu/xom/samples/NonRecursiveSerializer.java

src/nu/xom/samples/NormalizingFactory.java

src/nu/xom/samples/PoliteSpider.java

src/nu/xom/samples/PrettyFibonacci.java

src/nu/xom/samples/PrettyPrinter.java

src/nu/xom/samples/ProcessingInstructionLister.java

src/nu/xom/samples/PropertyPrinter.java

src/nu/xom/samples/PseudoAttributes.java

src/nu/xom/samples/PureValidator.java

src/nu/xom/samples/RDDLFilter.java

src/nu/xom/samples/RDDLStripper.java

src/nu/xom/samples/RDDLToTable.java

src/nu/xom/samples/ROT13File.java

src/nu/xom/samples/ROT13XML.java

src/nu/xom/samples/RSSHeadlines.java

src/nu/xom/samples/ResourceToTable.java

src/nu/xom/samples/Restructurer.java

src/nu/xom/samples/SQLToXML.java

src/nu/xom/samples/SchemaValidator.java

src/nu/xom/samples/SimpleSVG.java

src/nu/xom/samples/SourceCodeGenerator.java

src/nu/xom/samples/SourceCodeSerializer.java

src/nu/xom/samples/StreamingCommentReader.java

src/nu/xom/samples/StreamingElementLister.java

src/nu/xom/samples/StreamingExampleExtractor.java

src/nu/xom/samples/StreamingNodeLister.java

src/nu/xom/samples/StreamingProcessingInstructionLister.java

src/nu/xom/samples/StreamingROT13.java

src/nu/xom/samples/StreamingTextExtractor.java

src/nu/xom/samples/StreamingTreeReporter.java

src/nu/xom/samples/StreamingTypeCounter.java

src/nu/xom/samples/StreamingXHTMLPurifier.java

src/nu/xom/samples/StreamingXHTMLQualifier.java

src/nu/xom/samples/Subfunction.java

src/nu/xom/samples/TextExtractor.java

src/nu/xom/samples/TextMerger.java

src/nu/xom/samples/TextSerializer.java

src/nu/xom/samples/Transformer.java

src/nu/xom/samples/TreePrinter.java

src/nu/xom/samples/TreeReporter.java

src/nu/xom/samples/TreeViewer.java

src/nu/xom/samples/ValidFibonacci.java

src/nu/xom/samples/Validator.java

src/nu/xom/samples/WrappingSerializer.java

src/nu/xom/samples/XHTMLPurifier.java

src/nu/xom/samples/XHTMLQualifier.java

src/nu/xom/samples/XHTMLValidator.java

src/nu/xom/samples/XIncludeDriver.java

src/nu/xom/samples/XLinkSpider.java

src/nu/xom/samples/XMLPrinter.java

src/nu/xom/samples/XOMChecker.java

src/nu/xom/samples/XPathDriver.java

src/nu/xom/samples/XPathHeadlines.java

src/nu/xom/samples/package.html

src/nu/xom/tests

src/nu/xom/tests/AttributeTest.java

src/nu/xom/tests/AttributeTypeTest.java

src/nu/xom/tests/AttributesTest.java

src/nu/xom/tests/BaseURITest.java

src/nu/xom/tests/BuilderTest.java

src/nu/xom/tests/CDATASectionTest.java

src/nu/xom/tests/CanonicalizationExceptionTest.java

src/nu/xom/tests/CanonicalizerTest.java

src/nu/xom/tests/CommentTest.java

src/nu/xom/tests/DOMConverterTest.java

src/nu/xom/tests/DocTypeTest.java

src/nu/xom/tests/DocumentTest.java

src/nu/xom/tests/EBCDICTest.java

src/nu/xom/tests/ElementTest.java

src/nu/xom/tests/EncodingTest.java

src/nu/xom/tests/FastTests.java

src/nu/xom/tests/IDTest.java

src/nu/xom/tests/InfoTest.java

src/nu/xom/tests/LeafNodeTest.java

src/nu/xom/tests/MegaTest.java

src/nu/xom/tests/NamespaceNodeTest.java

src/nu/xom/tests/NamespacesTest.java

src/nu/xom/tests/NodeFactoryTest.java

src/nu/xom/tests/NodesTest.java

src/nu/xom/tests/ParentNodeTest.java

src/nu/xom/tests/ParsingExceptionTest.java

src/nu/xom/tests/ProcessingInstructionTest.java

src/nu/xom/tests/RoundTripTest.java

src/nu/xom/tests/SAXConverterTest.java

src/nu/xom/tests/SerializerTest.java

src/nu/xom/tests/SubclassTest.java

src/nu/xom/tests/TextTest.java

src/nu/xom/tests/ValidityExceptionTest.java

src/nu/xom/tests/VerifierTest.java

src/nu/xom/tests/XIncludeExceptionTest.java

src/nu/xom/tests/XIncludeTest.java

src/nu/xom/tests/XMLExceptionTest.java

src/nu/xom/tests/XMLWriter.java

src/nu/xom/tests/XOMTestCase.java

src/nu/xom/tests/XOMTestCaseTest.java

src/nu/xom/tests/XOMTests.java

src/nu/xom/tests/XPathExceptionTest.java

src/nu/xom/tests/XPathTest.java

src/nu/xom/tests/XSLExceptionTest.java

src/nu/xom/tests/XSLTransformTest.java

src/nu/xom/tests/package.html

src/nu/xom/tools

src/nu/xom/tools/XHTMLJavaDoc.java

src/nu/xom/tools/package.html

src/nu/xom/xinclude

src/nu/xom/xinclude/BadEncodingAttributeException.java

src/nu/xom/xinclude/BadHTTPHeaderException.java

src/nu/xom/xinclude/BadHrefAttributeException.java

src/nu/xom/xinclude/BadParseAttributeException.java

src/nu/xom/xinclude/EncodingHeuristics.java

src/nu/xom/xinclude/InclusionLoopException.java

src/nu/xom/xinclude/MisplacedFallbackException.java

src/nu/xom/xinclude/NoIncludeLocationException.java

src/nu/xom/xinclude/XIncludeException.java

src/nu/xom/xinclude/XIncluder.java

src/nu/xom/xinclude/XPointer.java

src/nu/xom/xinclude/XPointerException.java

src/nu/xom/xinclude/XPointerResourceException.java

src/nu/xom/xinclude/XPointerSyntaxException.java

src/nu/xom/xinclude/package.html

src/nu/xom/xslt

src/nu/xom/xslt/XOMInputSource.java

src/nu/xom/xslt/XOMReader.java

src/nu/xom/xslt/XOMResult.java

src/nu/xom/xslt/XOMSource.java

src/nu/xom/xslt/XSLException.java

src/nu/xom/xslt/XSLTHandler.java

src/nu/xom/xslt/XSLTransform.java

src/nu/xom/xslt/package.html

src15

src15/nu

src15/nu/xom

src15/nu/xom/JDK15XML1_0Parser.java

xom.graffle

Show diffs side-by-side

added added

removed removed

src/nu/xom/canonical/Canonicalizer.java

This library is free software; you can redistribute it and/or modify

it under the terms of version 2.1 of the GNU Lesser General Public

License as published by the Free Software Foundation.

This library is distributed in the hope that it will be useful,

but WITHOUT ANY WARRANTY; without even the implied warranty of

MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

GNU Lesser General Public License for more details.

You should have received a copy of the GNU Lesser General Public

License along with this library; if not, write to the

Free Software Foundation, Inc., 59 Temple Place, Suite 330,

Boston, MA 02111-1307 USA

You can contact Elliotte Rusty Harold by sending e-mail to

elharo@metalab.unc.edu. Please include the word "XOM" in the

subject line. The XOM home page is located at http://www.xom.nu/

package nu.xom.canonical;

import java.io.IOException;

import java.io.OutputStream;

import java.util.ArrayList;

import java.util.Arrays;

import java.util.Comparator;

import java.util.Iterator;

import java.util.List;

import java.util.Map;

import java.util.SortedMap;

import java.util.StringTokenizer;

import java.util.TreeMap;

import java.util.Map.Entry;

import org.xml.sax.helpers.NamespaceSupport;

import nu.xom.Attribute;

import nu.xom.Comment;

import nu.xom.DocType;

import nu.xom.Document;

import nu.xom.Element;

import nu.xom.Namespace;

import nu.xom.Node;

import nu.xom.Nodes;

import nu.xom.ParentNode;

import nu.xom.ProcessingInstruction;

import nu.xom.Serializer;

import nu.xom.Text;

import nu.xom.XPathContext;

/**
 * <p>
 *   Writes XML in the format specified by <a target="_top"
 *   href="http://www.w3.org/TR/2001/REC-xml-c14n-20010315">Canonical
 *   XML Version 1.0</a> or <a target="_top"
 *   href="http://www.w3.org/TR/2002/REC-xml-exc-c14n-20020718/">Exclusive
 *   XML Canonicalization Version 1.0</a>.
 * </p>
 *
 * @author Elliotte Rusty Harold
 * @version 1.1b4
 */

public class Canonicalizer {

// True if comments should be included in the output; set by every constructor.
private boolean withComments;

// True if exclusive XML canonicalization should be performed,
// false for regular canonical XML.
private boolean exclusive = false;

// Serializer wrapping the output stream handed to the constructor.
private CanonicalXMLSerializer serializer;

// NOTE(review): presumably the prefixes that are always emitted in
// exclusive mode; the code that reads this list is not visible here -- confirm.
private List inclusiveNamespacePrefixes = new ArrayList();

// Shared comparator that orders attributes by namespace URI,
// then by local name (see AttributeComparator).
private static Comparator comparator = new AttributeComparator();

/** Algorithm URI selecting canonical XML without comments. */
public final static String CANONICAL_XML =

"http://www.w3.org/TR/2001/REC-xml-c14n-20010315";

/** Algorithm URI selecting canonical XML with comments. */
public final static String CANONICAL_XML_WITH_COMMENTS =

"http://www.w3.org/TR/2001/REC-xml-c14n-20010315#WithComments";

/** Algorithm URI selecting exclusive XML canonicalization without comments. */
public final static String EXCLUSIVE_XML_CANONICALIZATION =

"http://www.w3.org/2001/10/xml-exc-c14n#";

/** Algorithm URI selecting exclusive XML canonicalization with comments. */
public final static String EXCLUSIVE_XML_CANONICALIZATION_WITH_COMMENTS =

"http://www.w3.org/2001/10/xml-exc-c14n#WithComments";

private static class AttributeComparator implements Comparator {

public int compare(Object o1, Object o2) {

Attribute a1 = (Attribute) o1;

Attribute a2 = (Attribute) o2;

String namespace1 = a1.getNamespaceURI();

String namespace2 = a2.getNamespaceURI();

if (namespace1.equals(namespace2)) {

return a1.getLocalName().compareTo(a2.getLocalName());

}

else if (namespace1.equals("")) {

return -1;

}

100

else if (namespace2.equals("")) {

101

return 1;

102

}

103

else { // compare namespace URIs

104

return namespace1.compareTo(namespace2);

105

}

106

107

}

108

109

}

110

111

112

/**

113

*

114

* Creates a <code>Canonicalizer</code> that outputs a

115

* canonical XML document with comments.

116

*

117

118

* @param out the output stream the document

119

* is written onto

120

121

public Canonicalizer(OutputStream out) {

122

this(out, true, false);

123

}

124

125

126

/**

127

*

128

* Creates a <code>Canonicalizer</code> that outputs a

129

* canonical XML document with or without comments.

130

*

131

132

* @param out the output stream the document

133

* is written onto

134

* @param withComments true if comments should be included

135

* in the output, false otherwise

136

137

public Canonicalizer(

138

OutputStream out, boolean withComments) {

139

this(out, withComments, false);

140

}

141

142

143

/**

144

*

145

* Creates a <code>Canonicalizer</code> that outputs a

146

* canonical XML document with or without comments,

147

* using either the original or the exclusive canonicalization

148

* algorithm.

149

*

150

151

* @param out the output stream the document

152

* is written onto

153

* @param withComments true if comments should be included

154

* in the output, false otherwise

155

* @param exclusive true if exclusive XML canonicalization

156

* should be performed, false if regular XML canonicalization

157

* should be performed

158

159

private Canonicalizer(

160

OutputStream out, boolean withComments, boolean exclusive) {

161

162

this.serializer = new CanonicalXMLSerializer(out);

163

serializer.setLineSeparator("\n");

164

this.withComments = withComments;

165

this.exclusive = exclusive;

166

167

}

168

169

170

/**

171

*

172

* Creates a <code>Canonicalizer</code> that outputs a

173

* canonical XML document using the specified algorithm.

174

* Currently, four algorithms are defined and supported:

175

*

176

177

* <ul>

178

* <li>Canonical XML without comments:

179

* <code>http://www.w3.org/TR/2001/REC-xml-c14n-20010315</code></li>

180

* <li>Canonical XML with comments:

181

* <code>http://www.w3.org/TR/2001/REC-xml-c14n-20010315#WithComments</code></li>

182

* <li>Exclusive XML canonicalization without comments:

183

* <code>http://www.w3.org/2001/10/xml-exc-c14n#</code></li>

184

* <li>Exclusive XML canonicalization with comments:

185

* <code>http://www.w3.org/2001/10/xml-exc-c14n#WithComments</code></li>

186

* </ul>

187

188

* @param out the output stream the document

189

* is written onto

190

* @param algorithm the URI for the canonicalization algorithm

191

192

* @throws CanonicalizationException if the algorithm is

193

* not recognized

194

* @throws NullPointerException if the algorithm is null

195

196

197

public Canonicalizer(

198

OutputStream out, String algorithm) {

199

200

if (algorithm == null) {

201

throw new NullPointerException("Null algorithm");

202

}

203

this.serializer = new CanonicalXMLSerializer(out);

204

serializer.setLineSeparator("\n");

205

if (algorithm.equals(CANONICAL_XML)) {

206

this.withComments = false;

207

this.exclusive = false;

208

}

209

else if (algorithm.equals(CANONICAL_XML_WITH_COMMENTS)) {

210

this.withComments = true;

211

this.exclusive = false;

212

}

213

else if (algorithm.equals(EXCLUSIVE_XML_CANONICALIZATION)) {

214

this.withComments = false;

215

this.exclusive = true;

216

}

217

else if (algorithm.equals(EXCLUSIVE_XML_CANONICALIZATION_WITH_COMMENTS)) {

218

this.withComments = true;

219

this.exclusive = true;

220

}

221

else {

222

throw new CanonicalizationException(

223

"Unsupported canonicalization algorithm: " + algorithm);

224

}

225

226

}

227

228

229

private class CanonicalXMLSerializer extends Serializer {

230

231

// If nodes is null we're canonicalizing the entire document;
// this is somewhat easier than canonicalizing only the
// document subset held in nodes.

234

private Nodes nodes;

235

private NamespaceSupport inScope;

236

237

/**

238

*

239

* Creates a <code>Serializer</code> that outputs a

240

* canonical XML document with or without comments.

241

*

242

243

* @param out the <code>OutputStream</code> the document

244

* is written onto

245

* @param withComments true if comments should be included

246

* in the output, false otherwise

247

248

CanonicalXMLSerializer(OutputStream out) {

249

super(out);

250

setLineSeparator("\n");

251

}

252

253

254

/**

255

*

256

* Serializes a document onto the output

257

* stream using the canonical XML algorithm.

258

*

259

260

* @param doc the <code>Document</code> to serialize

261

262

* @throws IOException if the underlying <code>OutputStream</code>

263

* encounters an I/O error

264

265

public final void write(Document doc) throws IOException {

266

267

inScope = new NamespaceSupport();

268

int position = 0;

269

while (true) {

270

Node child = doc.getChild(position);

271

if (nodes == null || child instanceof Element || nodes.contains(child)) {

272

writeChild(child);

273

if (child instanceof ProcessingInstruction) breakLine();

274

else if (child instanceof Comment && withComments) {

275

breakLine();

276

}

277

}

278

position++;

279

if (child instanceof Element) break;

280

}

281

282

for (int i = position; i < doc.getChildCount(); i++) {

283

Node child = doc.getChild(i);

284

if (nodes == null || child instanceof Element || nodes.contains(child)) {

285

if (child instanceof ProcessingInstruction) breakLine();

286

else if (child instanceof Comment && withComments) {

287

breakLine();

288

}

289

writeChild(child);

290

}

291

}

292

293

flush();

294

295

}

296

297

298

/**

299

*

300

* Serializes an element onto the output stream using the canonical

301

* XML algorithm. The result is guaranteed to be well-formed.

302

* If <code>element</code> does not have a parent element, it will

303

* also be namespace well-formed.

304

*

305

306

* @param element the <code>Element</code> to serialize

307

308

* @throws IOException if the underlying <code>OutputStream</code>

309

* encounters an I/O error

310

311

protected final void write(Element element)

312

throws IOException {

313

314

// treat empty elements differently to avoid an

315

// instanceof test

316

if (element.getChildCount() == 0) {

317

writeStartTag(element, false);

318

writeEndTag(element);

319

}

320

else {

321

Node current = element;

322

boolean end = false;

323

int index = -1;

324

int[] indexes = new int[10];

325

int top = 0;

326

indexes[0] = -1;

327

while (true) {

328

if (!end && current.getChildCount() > 0) {

329

writeStartTag((Element) current, false);

330

current = current.getChild(0);

331

index = 0;

332

top++;

333

indexes = grow(indexes, top);

334

indexes[top] = 0;

335

}

336

else {

337

if (end) {

338

writeEndTag((Element) current);

339

if (current == element) break;

340

}

341

else {

342

writeChild(current);

343

}

344

end = false;

345

ParentNode parent = current.getParent();

346

if (parent.getChildCount() - 1 == index) {

347

current = parent;

348

top--;

349

if (current != element) {

350

index = indexes[top];

351

}

352

end = true;

353

}

354

else {

355

index++;

356

indexes[top] = index;

357

current = parent.getChild(index);

358

}

359

}

360

}

361

}

362

363

}

364

365

366

private int[] grow(int[] indexes, int top) {

367

368

if (top < indexes.length) return indexes;

369

int[] result = new int[indexes.length*2];

370

System.arraycopy(indexes, 0, result, 0, indexes.length);

371

return result;

372

373

}

374

375

376

protected void writeStartTag(Element element, boolean isEmpty)

377

throws IOException {

378

379

boolean writeElement = nodes == null || nodes.contains(element);

380

if (writeElement) {

381

inScope.pushContext();

382

writeRaw("<");

383

writeRaw(element.getQualifiedName());

384

}

385

386

SortedMap map = new TreeMap();

387

if (nodes == null) {

388

ParentNode parent = element.getParent();

389

Element parentElement = null;

390

if (parent instanceof Element) {

391

parentElement = (Element) parent;

392

}

393

for (int i = 0;

394

i < element.getNamespaceDeclarationCount();

395

i++) {

396

String prefix = element.getNamespacePrefix(i);

397

String uri = element.getNamespaceURI(prefix);

398

399

if (uri.equals(inScope.getURI(prefix))) {

400

continue;

401

}

402

else if (exclusive) {

403

if (needToDeclareNamespace(element, prefix, uri)) {

404

map.put(prefix, uri);

405

}

406

}

407

else if (uri.equals("")) {

408

// no need to say xmlns=""

409

if (parentElement == null) continue;

410

if ("".equals(parentElement.getNamespaceURI(""))) {

411

continue;

412

}

413

map.put(prefix, uri);

414

}

415

else {

416

map.put(prefix, uri);

417

}

418

419

}

420

421

writeNamespaceDeclarations(map);

422

423

}

424

else {

425

int position = indexOf(element);

426

// do we need to undeclare a default namespace?

427

// You know, should I instead create an output tree and then just

428

// canonicalize that? probably not

429

if (position != -1 && "".equals(element.getNamespaceURI())) {

430

ParentNode parent = element.getParent();

431

// Here we have to check for the nearest default on parents in the

432

// output tree, not the input tree

433

while (parent instanceof Element

434

&& !(nodes.contains(parent))) {

435

parent = parent.getParent();

436

}

437

if (parent instanceof Element) {

438

String uri = ((Element) parent).getNamespaceURI("");

439

if (! "".equals(uri)) {

440

map.put("", "");

441

}

442

}

443

}

444

445

for (int i = position+1; i < nodes.size(); i++) {

446

Node next = nodes.get(i);

447

if ( !(next instanceof Namespace) ) break;

448

Namespace namespace = (Namespace) next;

449

String prefix = namespace.getPrefix();

450

String uri = namespace.getValue();

451

452

if (uri.equals(inScope.getURI(prefix))) {

453

continue;

454

}

455

else if (exclusive) {

456

if (needToDeclareNamespace(element, prefix, uri)) {

457

map.put(prefix, uri);

458

}

459

}

460

else {

461

map.put(prefix, uri);

462

}

463

464

}

465

466

writeNamespaceDeclarations(map);

467

468

}

469

470

Attribute[] sorted = sortAttributes(element);

471

for (int i = 0; i < sorted.length; i++) {

472

if (nodes == null || nodes.contains(sorted[i])

473

|| (sorted[i].getNamespaceURI().equals(Namespace.XML_NAMESPACE)

474

&& sorted[i].getParent() != element)) {

475

write(sorted[i]);

476

}

477

}

478

479

if (writeElement) {

480

writeRaw(">");

481

}

482

483

}

484

485

486

private void writeNamespaceDeclarations(SortedMap map) throws IOException {

487

488

Iterator prefixes = map.entrySet().iterator();

489

while (prefixes.hasNext()) {

490

Map.Entry entry = (Entry) prefixes.next();

491

String prefix = (String) entry.getKey();

492

String uri = (String) entry.getValue();

493

writeRaw(" ");

494

writeNamespaceDeclaration(prefix, uri);

495

inScope.declarePrefix(prefix, uri);

496

}

497

498

}

499

500

501

private boolean needToDeclareNamespace(

502

Element parent, String prefix, String uri) {

503

504

boolean match = visiblyUtilized(parent, prefix, uri);

505

506

if (match || inclusiveNamespacePrefixes.contains(prefix)) {

507

return noOutputAncestorUsesPrefix(parent, prefix, uri);

508

}

509

510

return false;

511

512

}

513

514

515

private boolean visiblyUtilized(Element element, String prefix, String uri) {

516

517

boolean match = false;

518

String pfx = element.getNamespacePrefix();

519

String local = element.getNamespaceURI();

520

if (prefix.equals(pfx) && local.equals(uri)) {

521

match = true;

522

}

523

else {

524

for (int i = 0; i < element.getAttributeCount(); i++) {

525

Attribute attribute = element.getAttribute(i);

526

if (nodes == null || nodes.contains(attribute)) {

527

pfx = attribute.getNamespacePrefix();

528

if (prefix.equals(pfx)) {

529

match = true;

530

break;

531

}

532

}

533

}

534

}

535

return match;

536

}

537

538

539

private boolean noOutputAncestorUsesPrefix(Element original, String prefix, String uri) {

540

541

ParentNode parent = original.getParent();

542

if (parent instanceof Document && "".equals(uri)) {

543

return false;

544

}

545

546

while (parent != null && !(parent instanceof Document)) {

547

if (nodes == null || nodes.contains(parent)) {

548

Element element = (Element) parent;

549

String pfx = element.getNamespacePrefix();

550

if (pfx.equals(prefix)) {

551

String newURI = element.getNamespaceURI(prefix);

552

return ! newURI.equals(uri);

553

}

554

555

for (int i = 0; i < element.getAttributeCount(); i++) {

556

Attribute attribute = element.getAttribute(i);

557

String current = attribute.getNamespacePrefix();

558

if (current.equals(prefix)) {

559

String newURI = element.getNamespaceURI(prefix);

560

return ! newURI.equals(uri);

561

}

562

}

563

}

564

parent = parent.getParent();

565

}

566

return true;

567

568

}

569

570

571

// ???? move into Nodes?

572

private int indexOf(Element element) {

573

for (int i = 0; i < nodes.size(); i++) {

574

if (nodes.get(i) == element) return i;

575

}

576

return -1;

577

}

578

579

580

protected void write(Attribute attribute) throws IOException {

581

582

writeRaw(" ");

583

writeRaw(attribute.getQualifiedName());

584

writeRaw("=\"");

585

writeRaw(prepareAttributeValue(attribute));

586

writeRaw("\"");

587

588

}

589

590

591

protected void writeEndTag(Element element) throws IOException {

592

593

if (nodes == null || nodes.contains(element)) {

594

writeRaw("</");

595

writeRaw(element.getQualifiedName());

596

writeRaw(">");

597

inScope.popContext();

598

}

599

600

}

601

602

private final XPathContext xmlcontext = new XPathContext("xml", Namespace.XML_NAMESPACE);

603

604

private Attribute[] sortAttributes(Element element) {

605

606

Map nearest = new TreeMap();

607

// add in any inherited xml: attributes

608

if (!exclusive && nodes != null && nodes.contains(element)

609

&& ! nodes.contains(element.getParent())) {

610

// grab all xml: attributes

611

Nodes attributes = element.query("ancestor::*/@xml:*", xmlcontext);

612

if (attributes.size() != 0) {

613

// It's important to count backwards here because

614

// XPath returns all nodes in document order, which

615

// is top-down. To get the nearest we need to go

616

// bottom up instead.

617

for (int i = attributes.size()-1; i >= 0; i--) {

618

Attribute a = (Attribute) attributes.get(i);

619

String name = a.getLocalName();

620

if (element.getAttribute(name, Namespace.XML_NAMESPACE) != null) {

621

// this element already has that attribute

622

continue;

623

}

624

if (! nearest.containsKey(name)) {

625

Element parent = (Element) a.getParent();

626

if (! nodes.contains(parent)) {

627

nearest.put(name, a);

628

}

629

else {

630

nearest.put(name, null);

631

}

632

}

633

}

634

}

635

636

// remove null values

637

Iterator iterator = nearest.values().iterator();

638

while (iterator.hasNext()) {

639

if (iterator.next() == null) iterator.remove();

640

}

641

642

}

643

644

int localCount = element.getAttributeCount();

645

Attribute[] result

646

= new Attribute[localCount + nearest.size()];

647

for (int i = 0; i < localCount; i++) {

648

result[i] = element.getAttribute(i);

649

}

650

651

Iterator iterator = nearest.values().iterator();

652

for (int j = localCount; j < result.length; j++) {

653

result[j] = (Attribute) iterator.next();

654

}

655

656

Arrays.sort(result, comparator);

657

658

return result;

659

660

}

661

662

663

private String prepareAttributeValue(Attribute attribute) {

664

665

String value = attribute.getValue();

666

StringBuffer result = new StringBuffer(value.length());

667

668

if (attribute.getType().equals(Attribute.Type.CDATA)

669

|| attribute.getType().equals(Attribute.Type.UNDECLARED)) {

670

char[] data = value.toCharArray();

671

for (int i = 0; i < data.length; i++) {

672

char c = data[i];

673

if (c == '\t') {

674

result.append("	");

675

}

676

else if (c == '\n') {

677

result.append("
");

678

}

679

else if (c == '\r') {

680

result.append("");

681

}

682

else if (c == '\"') {

683

result.append(""");

684

}

685

else if (c == '&') {

686

result.append("&");

687

}

688

else if (c == '<') {

689

result.append("<");

690

}

691

else {

692

result.append(c);

693

}

694

}

695

}

696

else {

697

// According to the spec, "Whitespace character references

698

// other than   are not affected by attribute value

699

// normalization. For parsed documents, the parser will

700

// still replace these with the actual character. I am

701

// going to assume that if one is found here, that the

702

// user meant to put it there; and so we will escape it

703

// with a character reference

704

char[] data = value.toCharArray();

705

boolean seenFirstNonSpace = false;

706

for (int i = 0; i < data.length; i++) {

707

if (data[i] == ' ') {

708

if (i != data.length-1 && data[i+1] != ' ' && seenFirstNonSpace) {

709

result.append(data[i]);

710

}

711

continue;

712

}

713

seenFirstNonSpace = true;

714

if (data[i] == '\t') {

715

result.append("	");

716

}

717

else if (data[i] == '\n') {

718

result.append("
");

719

}

720

else if (data[i] == '\r') {

721

result.append("");

722

}

723

else if (data[i] == '\"') {

724

result.append(""");

725

}

726

else if (data[i] == '&') {

727

result.append("&");

728

}

729

else if (data[i] == '<') {

730

result.append("<");

731

}

732

else {

733

result.append(data[i]);

734

}

735

}

736

}

737

738

return result.toString();

739

740

}

741

742

743

/**

744

*

745

* Serializes a <code>Text</code> object

746

* onto the output stream using the UTF-8 encoding.

747

* The reserved characters <, >, and &

748

* are escaped using the standard entity references such as

749

* <code>&lt;</code>, <code>&gt;</code>,

750

* and <code>&amp;</code>.

751

*

752

753

* @param text the <code>Text</code> to serialize

754

755

* @throws IOException if the underlying <code>OutputStream</code>

756

* encounters an I/O error

757

758

protected final void write(Text text) throws IOException {

759

760

if (nodes == null || nodes.contains(text)) {

761

String input = text.getValue();

762

StringBuffer result = new StringBuffer(input.length());

763

for (int i = 0; i < input.length(); i++) {

764

char c = input.charAt(i);

765

if (c == '\r') {

766

result.append("");

767

}

768

else if (c == '&') {

769

result.append("&");

770

}

771

else if (c == '<') {

772

result.append("<");

773

}

774

else if (c == '>') {

775

result.append(">");

776

}

777

else {

778

result.append(c);

779

}

780

}

781

writeRaw(result.toString());

782

}

783

784

}

785

786

787

/**

788

*

789

* Serializes a <code>Comment</code> object

790

* onto the output stream if and only if this

791

* serializer is configured to produce canonical XML

792

* with comments.

793

*

794

795

* @param comment the <code>Comment</code> to serialize

796

797

* @throws IOException if the underlying <code>OutputStream</code>

798

* encounters an I/O error

799

800

protected final void write(Comment comment)

801

throws IOException {

802

if (withComments && (nodes == null || nodes.contains(comment))) {

803

super.write(comment);

804

}

805

}

806

807

808

protected final void write(ProcessingInstruction pi)

809

throws IOException {

810

if (nodes == null || nodes.contains(pi)) {

811

super.write(pi);

812

}

813

}

814

815

816

/**

817

*

818

* Does nothing because canonical XML does not include

819

* document type declarations.

820

*

821

822

* @param doctype the document type declaration to serialize

823

824

protected final void write(DocType doctype) {

825

// DocType is not serialized in canonical XML

826

}

827

828

829

public void write(Node node) throws IOException {

830

831

if (node instanceof Document) {

832

write((Document) node);

833

}

834

else if (node instanceof Attribute) {

835

write((Attribute) node);

836

}

837

else if (node instanceof Namespace) {

838

write((Namespace) node);

839

}

840

else {

841

writeChild(node);

842

}

843

844

}

845

846

847

private void write(Namespace namespace) throws IOException {

848

849

String prefix = namespace.getPrefix();

850

String uri = namespace.getValue();

851

writeRaw(" xmlns" );

852

if (!"".equals(prefix)) {

853

writeRaw(":");

854

writeRaw(prefix);

855

}

856

writeRaw("=\"");

857

writeAttributeValue(uri);

858

writeRaw("\"");

859

860

}

861

862

}

863

864

865

/**

866

*

867

* Serializes a node onto the output stream using the specified

868

* canonicalization algorithm. If the node is a document or an

869

* element, then the node's entire subtree is written out.

870

*

871

872

* @param node the node to canonicalize

873

874

* @throws IOException if the underlying <code>OutputStream</code>

875

* encounters an I/O error

876

877

public final void write(Node node) throws IOException {

878

879

// See this thread:

880

// http://lists.ibiblio.org/pipermail/xom-interest/2005-October/002656.html

881

if (node instanceof Element) {

882

Document doc = node.getDocument();

883

Element pseudoRoot = null;

884

if (doc == null) {

885

pseudoRoot = new Element("pseudo");

886

doc = new Document(pseudoRoot);

887

ParentNode root = (ParentNode) node;

888

while (root.getParent() != null) root = root.getParent();

889

pseudoRoot.appendChild(root);

890

}

891

try {

892

write(node.query(".//. | .//@* | .//namespace::*"));

893

}

894

finally {

895

if (pseudoRoot != null) pseudoRoot.removeChild(0);

896

}

897

}

898

else {

899

serializer.nodes = null;

900

serializer.write(node);

901

}

902

serializer.flush();

903

904

}

905

906

907

/**

908

*

909

* Serializes a document subset onto the output stream using the

910

* canonical XML algorithm. All nodes in the list must come from

911

* same document. Furthermore, they must come from a document.

912

* They cannot be detached. The nodes need not be sorted. This

913

* method will sort them into the appropriate order for

914

* canonicalization.

915

*

916

917

*

918

* In most common use cases, these nodes will be the result of

919

* evaluating an XPath expression. For example,

920

*

921

922

* <pre><code> Canonicalizer canonicalizer

923

* = new Canonicalizer(System.out, Canonicalizer.CANONICAL_XML);

924

* Nodes result = doc.query("//. | //@* | //namespace::*");

925

* canonicalizer.write(result);

926

* </code></pre>

927

928

*

929

* Children are not output unless the subset also includes them.

930

* Including an element in the subset does not automatically

931

* select all the element's children, attributes, and namespaces.

932

* Furthermore, not selecting an element does not imply that its

933

* children, namespaces, attributes will not be output.

934

*

935

936

* @param documentSubset the nodes to serialize

937

938

* @throws IOException if the underlying <code>OutputStream</code>

939

* encounters an I/O error

940

* @throws CanonicalizationException if the nodes come from more

941

* than one document; or if a detached node is in the list

942

943

public final void write(Nodes documentSubset) throws IOException {

944

945

if (documentSubset.size() > 0) {

946

Document doc = documentSubset.get(0).getDocument();

947

if (doc == null) {

948

throw new CanonicalizationException(

949

"Canonicalization is not defined for detached nodes");

950

}

951

Nodes result = sort(documentSubset);

952

serializer.nodes = result;

953

serializer.write(doc);

954

serializer.flush();

955

}

956

957

}

958

959

960

/**

961

*

962

* Specifies the prefixes that will be output as specified in

963

* regular canonical XML, even when doing exclusive

964

* XML canonicalization.

965

*

966

967

* @param inclusiveNamespacePrefixes a whitespace separated list

968

* of namespace prefixes that will always be included in the

969

* output, even in exclusive canonicalization

970

971

public final void setInclusiveNamespacePrefixList(String inclusiveNamespacePrefixes)

972

throws IOException {

973

974

this.inclusiveNamespacePrefixes.clear();

975

if (this.exclusive && inclusiveNamespacePrefixes != null) {

976

StringTokenizer tokenizer = new StringTokenizer(

977

inclusiveNamespacePrefixes, " \t\r\n", false);

978

while (tokenizer.hasMoreTokens()) {

979

this.inclusiveNamespacePrefixes.add(tokenizer.nextToken());

980

}

981

}

982

983

}

984

985

986

// XXX remove recursion

987

// recursively descend through document; in document

988

// order, and add results as they are found

989

private Nodes sort(Nodes in) {

990

991

Node root = in.get(0).getDocument();

992

if (in.size() > 1) {

993

Nodes out = new Nodes();

994

List list = new ArrayList(in.size());

995

List namespaces = new ArrayList();

996

for (int i = 0; i < in.size(); i++) {

997

Node node = in.get(i);

998

list.add(node);

999

if (node instanceof Namespace) namespaces.add(node);

1000

}

1001

sort(list, namespaces, out, (ParentNode) root);

1002

if (! list.isEmpty() ) {

1003

// Are these just duplicates; or is there really a node

1004

// from a different document?

1005

Iterator iterator = list.iterator();

1006

while (iterator.hasNext()) {

1007

Node next = (Node) iterator.next();

1008

if (root != next.getDocument()) {

1009

throw new CanonicalizationException(

1010

"Cannot canonicalize subsets that contain nodes from more than one document");

1011

}

1012

}

1013

}

1014

return out;

1015

}

1016

else {

1017

return new Nodes(in.get(0));

1018

}

1019

1020

}

1021

1022

1023

private static void sort(List in, List namespaces, Nodes out, ParentNode parent) {

1024

1025

if (in.isEmpty()) return;

1026

if (in.contains(parent)) {

1027

out.append(parent);

1028

in.remove(parent);

1029

// I'm fairly sure this next line is unreachable, but just

1030

// in case it isn't I'll leave this comment here.

1031

// if (in.isEmpty()) return;

1032

}

1033

1034

int childCount = parent.getChildCount();

1035

for (int i = 0; i < childCount; i++) {

1036

Node child = parent.getChild(i);

1037

if (child instanceof Element) {

1038

Element element = (Element) child;

1039

if (in.contains(element)) {

1040

out.append(element);

1041

in.remove(element);

1042

}

1043

// attach namespaces

1044

if (!namespaces.isEmpty()) {

1045

Iterator iterator = in.iterator();

1046

while (iterator.hasNext()) {

1047

Object o = iterator.next();

1048

if (o instanceof Namespace) {

1049

Namespace n = (Namespace) o;

1050

if (element == n.getParent()) {

1051

out.append(n);

1052

iterator.remove();

1053

}

1054

}

1055

}

1056

}

1057

1058

// attach attributes

1059

for (int a = 0; a < element.getAttributeCount(); a++) {

1060

Attribute att = element.getAttribute(a);

1061

if (in.contains(att)) {

1062

out.append(att);

1063

in.remove(att);

1064

if (in.isEmpty()) return;

1065

}

1066

}

1067

sort(in, namespaces, out, element);

1068

}

1069

else {

1070

if (in.contains(child)) {

1071

out.append(child);

1072

in.remove(child);

1073

if (in.isEmpty()) return;

1074

}

1075

}

1076

}

1077

1078

}

1079

1080

1081

}

b'\\ No newline at end of file'

Older »