← Back to branch summary

~ubuntu-branches/ubuntu/jaunty/python-docutils/jaunty

~ubuntu-branches/ubuntu/jaunty/python-docutils/jaunty

« back to all changes in this revision

Viewing changes to docutils/io.py

Committer: Bazaar Package Importer
Author(s): Simon McVittie
Date: 2008-07-24 10:39:53 UTC
mfrom: (1.1.4 upstream) (3.1.7 intrepid)
Revision ID: james.westby@ubuntu.com-20080724103953-8gh4uezg17g9ysgy

Tags: 0.5-2

http://bugs.debian.org/474941

* Upload docutils 0.5 to unstable
* Update rst.el to upstream Subversion r5596, which apparently fixes
all its performance problems (17_speed_up_rst_el.dpatch, closes: #474941)

files added:
debian/50python-docutils.el

debian/NEWS

debian/README.source

debian/patches/12_more_usrbinenv.dpatch

debian/patches/15_emacs_debian_paths.dpatch

debian/patches/16_disable_picins.dpatch

debian/patches/17_speed_up_rst_el.dpatch

debian/python-docutils.install

debian/python-roman.install

debian/rsthelp2man.xsl

debian/watch

docs/howto/security.txt

docutils/languages/he.py

docutils/parsers/rst/languages/he.py

docutils/writers/html4css1/template.txt

docutils/writers/newlatex2e/notes.txt

docutils/writers/newlatex2e/tests.txt

test/data/full-template.txt

test/functional/input/data/latex2e.txt

test/test_parsers/test_rst/test_directives/include12.txt

test/test_parsers/test_rst/test_directives/include13.txt

test/test_parsers/test_rst/test_directives/test_block_quotes.py

test/test_parsers/test_rst/test_directives/test_class.py

test/test_parsers/test_rst/test_directives/test_parsed_literals.py

test/test_parsers/test_rst/test_directives/test_sectnum.py

test/test_parsers/test_rst/test_directives/test_title.py

test/test_pickle.py

test/test_traversals.py

test/test_writers/test_html4css1_parts.py

test/test_writers/test_html4css1_template.py

test/test_writers/test_s5.py

tools/editors/emacs/tests/README.txt

files removed:
debian/emacs-start.el

debian/patches/01_upstream_04_branch_r4646.dpatch

debian/patches/12_remove_unnecessary_hashbang.dpatch

debian/patches/13_nodes_namespace.dpatch

debian/patches/99_old-diffs.dpatch

debian/python-roman.override

debian/rst2html.1

test/test_writers/test_html4css1.py

tools/editors/emacs/tests/README

files modified:
BUGS.txt

COPYING.txt

FAQ.txt

HISTORY.txt

PKG-INFO

README.txt

RELEASE-NOTES.txt

THANKS.txt

debian/README.Debian

debian/changelog

debian/control

debian/patches/00list

debian/patches/10_doc_debian_paths.dpatch

debian/patches/11_not_usrbinenv_python.dpatch

debian/patches/14_distutils_setup.dpatch

debian/python-docutils.manpages

debian/rules

docs/api/cmdline-tool.txt

docs/api/publisher.txt

docs/api/runtime-settings.txt

docs/dev/distributing.txt

docs/dev/enthought-plan.txt

docs/dev/hacking.txt

docs/dev/policies.txt

docs/dev/pysource.dtd

docs/dev/pysource.txt

docs/dev/release.txt

docs/dev/repository.txt

docs/dev/rst/alternatives.txt

docs/dev/rst/problems.txt

docs/dev/semantics.txt

docs/dev/testing.txt

docs/dev/todo.txt

docs/dev/website.txt

docs/howto/html-stylesheets.txt

docs/howto/i18n.txt

docs/howto/rst-directives.txt

docs/howto/rst-roles.txt

docs/index.txt

docs/peps/pep-0256.txt

docs/peps/pep-0257.txt

docs/peps/pep-0258.txt

docs/peps/pep-0287.txt

docs/ref/doctree.txt

docs/ref/docutils.dtd

docs/ref/rst/definitions.txt

docs/ref/rst/directives.txt

docs/ref/rst/introduction.txt

docs/ref/rst/restructuredtext.txt

docs/ref/rst/roles.txt

docs/ref/transforms.txt

docs/user/config.txt

docs/user/emacs.txt

docs/user/latex.txt

docs/user/links.txt

docs/user/mailing-lists.txt

docs/user/rst/cheatsheet.txt

docs/user/rst/demo.txt

docs/user/rst/quickref.html

docs/user/rst/quickstart.txt

docs/user/slide-shows.txt

docs/user/tools.txt

docutils/__init__.py

docutils/core.py

docutils/examples.py

docutils/frontend.py

docutils/io.py

docutils/languages/__init__.py

docutils/languages/af.py

docutils/languages/ca.py

docutils/languages/cs.py

docutils/languages/de.py

docutils/languages/en.py

docutils/languages/eo.py

docutils/languages/es.py

docutils/languages/fi.py

docutils/languages/fr.py

docutils/languages/it.py

docutils/languages/ja.py

docutils/languages/nl.py

docutils/languages/pt_br.py

docutils/languages/ru.py

docutils/languages/sk.py

docutils/languages/sv.py

docutils/languages/zh_cn.py

docutils/languages/zh_tw.py

docutils/nodes.py

docutils/parsers/__init__.py

docutils/parsers/null.py

docutils/parsers/rst/__init__.py

docutils/parsers/rst/directives/__init__.py

docutils/parsers/rst/directives/admonitions.py

docutils/parsers/rst/directives/body.py

docutils/parsers/rst/directives/html.py

docutils/parsers/rst/directives/images.py

docutils/parsers/rst/directives/misc.py

docutils/parsers/rst/directives/parts.py

docutils/parsers/rst/directives/references.py

docutils/parsers/rst/directives/tables.py

docutils/parsers/rst/include/s5defs.txt

docutils/parsers/rst/languages/__init__.py

docutils/parsers/rst/languages/af.py

docutils/parsers/rst/languages/ca.py

docutils/parsers/rst/languages/cs.py

docutils/parsers/rst/languages/de.py

docutils/parsers/rst/languages/en.py

docutils/parsers/rst/languages/eo.py

docutils/parsers/rst/languages/es.py

docutils/parsers/rst/languages/fi.py

docutils/parsers/rst/languages/fr.py

docutils/parsers/rst/languages/it.py

docutils/parsers/rst/languages/ja.py

docutils/parsers/rst/languages/nl.py

docutils/parsers/rst/languages/pt_br.py

docutils/parsers/rst/languages/ru.py

docutils/parsers/rst/languages/sk.py

docutils/parsers/rst/languages/sv.py

docutils/parsers/rst/languages/zh_cn.py

docutils/parsers/rst/languages/zh_tw.py

docutils/parsers/rst/roles.py

docutils/parsers/rst/states.py

docutils/parsers/rst/tableparser.py

docutils/readers/__init__.py

docutils/readers/doctree.py

docutils/readers/pep.py

docutils/readers/python/__init__.py

docutils/readers/python/moduleparser.py

docutils/readers/python/pynodes.py

docutils/readers/standalone.py

docutils/statemachine.py

docutils/transforms/__init__.py

docutils/transforms/components.py

docutils/transforms/frontmatter.py

docutils/transforms/misc.py

docutils/transforms/parts.py

docutils/transforms/peps.py

docutils/transforms/references.py

docutils/transforms/universal.py

docutils/transforms/writer_aux.py

docutils/urischemes.py

docutils/utils.py

docutils/writers/__init__.py

docutils/writers/docutils_xml.py

docutils/writers/html4css1/__init__.py

docutils/writers/html4css1/html4css1.css

docutils/writers/latex2e/__init__.py

docutils/writers/newlatex2e/__init__.py

docutils/writers/newlatex2e/base.tex

docutils/writers/newlatex2e/unicode_map.py

docutils/writers/null.py

docutils/writers/pep_html/__init__.py

docutils/writers/pep_html/pep.css

docutils/writers/pep_html/template.txt

docutils/writers/pseudoxml.py

docutils/writers/s5_html/__init__.py

extras/textwrap.py

setup.py

test/DocutilsTestSupport.py

test/alltests.py

test/coverage.sh

test/data/config_1.txt

test/functional/expected/compact_lists.html

test/functional/expected/dangerous.html

test/functional/expected/field_name_limit.html

test/functional/expected/latex_docinfo.tex

test/functional/expected/misc_rst_html4css1.html

test/functional/expected/pep_html.html

test/functional/expected/standalone_rst_html4css1.html

test/functional/expected/standalone_rst_latex.tex

test/functional/expected/standalone_rst_pseudoxml.txt

test/functional/expected/standalone_rst_s5_html_1.html

test/functional/expected/standalone_rst_s5_html_2.html

test/functional/input/data/custom_roles.txt

test/functional/input/data/standard.txt

test/functional/input/standalone_rst_latex.txt

test/package_unittest.py

test/test_dependencies.py

test/test_functional.py

test/test_io.py

test/test_language.py

test/test_nodes.py

test/test_parsers/test_rst/test_SimpleTableParser.py

test/test_parsers/test_rst/test_TableParser.py

test/test_parsers/test_rst/test_block_quotes.py

test/test_parsers/test_rst/test_bullet_lists.py

test/test_parsers/test_rst/test_citations.py

test/test_parsers/test_rst/test_comments.py

test/test_parsers/test_rst/test_definition_lists.py

test/test_parsers/test_rst/test_directives/test_admonitions.py

test/test_parsers/test_rst/test_directives/test_compound.py

test/test_parsers/test_rst/test_directives/test_container.py

test/test_parsers/test_rst/test_directives/test_contents.py

test/test_parsers/test_rst/test_directives/test_date.py

test/test_parsers/test_rst/test_directives/test_decorations.py

test/test_parsers/test_rst/test_directives/test_default_role.py

test/test_parsers/test_rst/test_directives/test_figures.py

test/test_parsers/test_rst/test_directives/test_images.py

test/test_parsers/test_rst/test_directives/test_include.py

test/test_parsers/test_rst/test_directives/test_line_blocks.py

test/test_parsers/test_rst/test_directives/test_meta.py

test/test_parsers/test_rst/test_directives/test_raw.py

test/test_parsers/test_rst/test_directives/test_replace.py

test/test_parsers/test_rst/test_directives/test_role.py

test/test_parsers/test_rst/test_directives/test_rubrics.py

test/test_parsers/test_rst/test_directives/test_sidebars.py

test/test_parsers/test_rst/test_directives/test_tables.py

test/test_parsers/test_rst/test_directives/test_target_notes.py

test/test_parsers/test_rst/test_directives/test_test_directives.py

test/test_parsers/test_rst/test_directives/test_topics.py

test/test_parsers/test_rst/test_directives/test_unicode.py

test/test_parsers/test_rst/test_directives/test_unknown.py

test/test_parsers/test_rst/test_doctest_blocks.py

test/test_parsers/test_rst/test_east_asian_text.py

test/test_parsers/test_rst/test_enumerated_lists.py

test/test_parsers/test_rst/test_field_lists.py

test/test_parsers/test_rst/test_footnotes.py

test/test_parsers/test_rst/test_functions.py

test/test_parsers/test_rst/test_inline_markup.py

test/test_parsers/test_rst/test_interpreted.py

test/test_parsers/test_rst/test_line_blocks.py

test/test_parsers/test_rst/test_literal_blocks.py

test/test_parsers/test_rst/test_option_lists.py

test/test_parsers/test_rst/test_outdenting.py

test/test_parsers/test_rst/test_paragraphs.py

test/test_parsers/test_rst/test_section_headers.py

test/test_parsers/test_rst/test_substitutions.py

test/test_parsers/test_rst/test_tables.py

test/test_parsers/test_rst/test_targets.py

test/test_parsers/test_rst/test_transitions.py

test/test_publisher.py

test/test_readers/test_pep/test_inline_markup.py

test/test_readers/test_pep/test_rfc2822.py

test/test_readers/test_python/test_functions.py

test/test_readers/test_python/test_parser.py

test/test_readers/test_python/test_token_parser.py

test/test_settings.py

test/test_statemachine.py

test/test_transforms/test___init__.py

test/test_transforms/test_class.py

test/test_transforms/test_contents.py

test/test_transforms/test_docinfo.py

test/test_transforms/test_doctitle.py

test/test_transforms/test_expose_internals.py

test/test_transforms/test_filter.py

test/test_transforms/test_footnotes.py

test/test_transforms/test_hyperlinks.py

test/test_transforms/test_messages.py

test/test_transforms/test_peps.py

test/test_transforms/test_sectnum.py

test/test_transforms/test_strip_comments.py

test/test_transforms/test_substitutions.py

test/test_transforms/test_target_notes.py

test/test_transforms/test_transitions.py

test/test_transforms/test_writer_aux.py

test/test_utils.py

test/test_viewlist.py

test/test_writers/test_docutils_xml.py

test/test_writers/test_html4css1_misc.py

test/test_writers/test_latex2e.py

test/test_writers/test_null.py

test/test_writers/test_pseudoxml.py

tools/buildhtml.py

tools/dev/create_unimap.py

tools/dev/profile_docutils.py

tools/dev/unicode2rstsubs.py

tools/editors/README.txt

tools/editors/emacs/README.txt

tools/editors/emacs/rst.el

tools/editors/emacs/tests/Makefile

tools/editors/emacs/tests/tests-adjust-section.el

tools/editors/emacs/tests/tests-basic.el

tools/editors/emacs/tests/tests-runner.el

tools/quicktest.py

tools/rst2html.py

tools/rst2latex.py

tools/rst2newlatex.py

tools/rst2pseudoxml.py

tools/rst2s5.py

tools/rst2xml.py

tools/rstpep2html.py

Show diffs side-by-side

added added

removed removed

1

# Author: David Goodger

2

# Contact: goodger@users.sourceforge.net

3

# Revision: $Revision: 3654 $

4

# Date: $Date: 2005-07-03 17:02:15 +0200 (Sun, 03 Jul 2005) $

1

# $Id: io.py 4750 2006-09-16 21:32:29Z wiemann $

2

# Author: David Goodger <goodger@python.org>

5

3

# Copyright: This module has been placed in the public domain.

6

4

7

5

"""

16

14

import locale

17

15

except:

18

16

pass

17

import re

19

18

from types import UnicodeType

20

19

from docutils import TransformSpec

21

20

74

73

if isinstance(data, UnicodeType):

75

74

# Accept unicode even if self.encoding != 'unicode'.

76

75

return data

77

encodings = [self.encoding]

78

if not self.encoding:

79

# Apply heuristics only if no encoding is explicitly given.

80

encodings.append('utf-8')

81

try:

82

encodings.append(locale.nl_langinfo(locale.CODESET))

83

except:

84

pass

85

try:

86

encodings.append(locale.getlocale()[1])

87

except:

88

pass

89

try:

90

encodings.append(locale.getdefaultlocale()[1])

91

except:

92

pass

93

encodings.append('latin-1')

76

if self.encoding:

77

# We believe the user/application when the encoding is

78

# explicitly given.

79

encodings = [self.encoding]

80

else:

81

data_encoding = self.determine_encoding_from_data(data)

82

if data_encoding:

83

# If the data declares its encoding (explicitly or via a BOM),

84

# we believe it.

85

encodings = [data_encoding]

86

else:

87

# Apply heuristics only if no encoding is explicitly given and

88

# no BOM found. Start with UTF-8, because that only matches

89

# data that *IS* UTF-8:

90

encodings = ['utf-8']

91

try:

92

# for Python 2.2 compatibility

93

encodings.append(locale.nl_langinfo(locale.CODESET))

94

except:

95

pass

96

try:

97

encodings.append(locale.getlocale()[1])

98

except:

99

pass

100

try:

101

encodings.append(locale.getdefaultlocale()[1])

102

except:

103

pass

104

# fallback encoding:

105

encodings.append('latin-1')

94

106

error = None

95

107

error_details = ''

96

108

for enc in encodings:

111

123

% (', '.join([repr(enc) for enc in encodings if enc]),

112

124

error_details))

113

125

126

coding_slug = re.compile("coding[:=]\s*([-\w.]+)")

127

"""Encoding declaration pattern."""

128

129

byte_order_marks = (('\xef\xbb\xbf', 'utf-8'),

130

('\xfe\xff', 'utf-16-be'),

131

('\xff\xfe', 'utf-16-le'),)

132

"""Sequence of (start_bytes, encoding) tuples for encoding detection.

133

The first bytes of input data are checked against the start_bytes strings.

134

A match indicates the given encoding."""

135

136

def determine_encoding_from_data(self, data):

137

"""

138

Try to determine the encoding of `data` by looking *in* `data`.

139

Check for a byte order mark (BOM) or an encoding declaration.

140

"""

141

# check for a byte order mark:

142

for start_bytes, encoding in self.byte_order_marks:

143

if data.startswith(start_bytes):

144

return encoding

145

# check for an encoding declaration pattern in first 2 lines of file:

146

for line in data.splitlines()[:2]:

147

match = self.coding_slug.search(line)

148

if match:

149

return match.group(1)

150

return None

151

114

152

115

153

class Output(TransformSpec):

116

154

159

197

else:

160

198

try:

161

199

return data.encode(self.encoding, self.error_handler)

162

except ValueError:

163

# ValueError is raised if there are unencodable chars

164

# in data and the error_handler isn't found.

200

except (LookupError, ValueError):

201

# LookupError is raised if there are unencodable chars

202

# in data and the error_handler isn't found. In old

203

# Python versions, ValueError is raised.

165

204

if self.error_handler == 'xmlcharrefreplace':

166

205

# We are using xmlcharrefreplace with a Python

167

# version that doesn't support it (2.1 or 2.2), so

168

# we emulate its behavior.

206

# version that doesn't support it (2.1, 2.2, or

207

# IronPython 1.0) so we emulate its behavior.

169

208

return ''.join([self.xmlcharref_encode(char)

170

209

for char in data])

171

210

else:

Older »