~ubuntu-branches/ubuntu/hardy/python-docutils/hardy

« back to all changes in this revision

Viewing changes to extras/difflib.py

Committer: Bazaar Package Importer
Author(s): martin f. krafft
Date: 2006-07-10 11:45:05 UTC
mfrom: (2.1.4 edgy)
Revision ID: james.westby@ubuntu.com-20060710114505-otkhqcslevewxmz5

Tags: 0.4-3

http://bugs.debian.org/377580

Added build dependency on python-central (closes: #377580).

files added:
BUGS.txt

PKG-INFO

RELEASE-NOTES.txt

THANKS.txt

debian/patches

debian/patches/00list

debian/patches/01_upstream_04_branch_r4646.dpatch

debian/patches/10_doc_debian_paths.dpatch

debian/patches/11_not_usrbinenv_python.dpatch

debian/patches/12_remove_unnecessary_hashbang.dpatch

debian/patches/13_nodes_namespace.dpatch

debian/patches/14_distutils_setup.dpatch

debian/patches/99_old-diffs.dpatch

debian/rst2html.1

docs/api

docs/api/cmdline-tool.txt

docs/api/publisher.txt

docs/api/runtime-settings.txt

docs/dev

docs/dev/distributing.txt

docs/dev/enthought-plan.txt

docs/dev/enthought-rfp.txt

docs/dev/hacking.txt

docs/dev/policies.txt

docs/dev/pysource.dtd

docs/dev/pysource.txt

docs/dev/release.txt

docs/dev/repository.txt

docs/dev/rst

docs/dev/rst/alternatives.txt

docs/dev/rst/problems.txt

docs/dev/semantics.txt

docs/dev/testing.txt

docs/dev/todo.txt

docs/dev/website.txt

docs/howto

docs/howto/html-stylesheets.txt

docs/howto/i18n.txt

docs/howto/rst-directives.txt

docs/howto/rst-roles.txt

docs/index.txt

docs/peps

docs/peps/pep-0256.txt

docs/peps/pep-0257.txt

docs/peps/pep-0258.txt

docs/peps/pep-0287.txt

docs/ref

docs/ref/doctree.txt

docs/ref/docutils.dtd

docs/ref/rst

docs/ref/rst/definitions.txt

docs/ref/rst/directives.txt

docs/ref/rst/introduction.txt

docs/ref/rst/restructuredtext.txt

docs/ref/rst/roles.txt

docs/ref/soextblx.dtd

docs/ref/transforms.txt

docs/user

docs/user/Makefile.docutils-update

docs/user/config.txt

docs/user/emacs.txt

docs/user/images

docs/user/images/big-black.png

docs/user/images/big-white.png

docs/user/images/default.png

docs/user/images/happy_monkey.png

docs/user/images/medium-black.png

docs/user/images/medium-white.png

docs/user/images/rsp-all.png

docs/user/images/rsp-breaks.png

docs/user/images/rsp-covers.png

docs/user/images/rsp-cuts.png

docs/user/images/rsp-empty.png

docs/user/images/rsp-objects.png

docs/user/images/rsp.svg

docs/user/images/s5-files.png

docs/user/images/s5-files.svg

docs/user/images/small-black.png

docs/user/images/small-white.png

docs/user/latex.txt

docs/user/links.txt

docs/user/mailing-lists.txt

docs/user/rst

docs/user/rst/cheatsheet.txt

docs/user/rst/demo.txt

docs/user/rst/images

docs/user/rst/images/ball1.gif

docs/user/rst/images/biohazard.png

docs/user/rst/images/title.png

docs/user/rst/quickref.html

docs/user/rst/quickstart.txt

docs/user/slide-shows.txt

docs/user/tools.txt

docutils/docutils.conf

docutils/languages/ca.py

docutils/languages/fi.py

docutils/languages/ja.py

docutils/languages/nl.py

docutils/languages/zh_cn.py

docutils/languages/zh_tw.py

docutils/parsers/null.py

docutils/parsers/rst/directives/tables.py

docutils/parsers/rst/include

docutils/parsers/rst/include/README.txt

docutils/parsers/rst/include/isoamsa.txt

docutils/parsers/rst/include/isoamsb.txt

docutils/parsers/rst/include/isoamsc.txt

docutils/parsers/rst/include/isoamsn.txt

docutils/parsers/rst/include/isoamso.txt

docutils/parsers/rst/include/isoamsr.txt

docutils/parsers/rst/include/isobox.txt

docutils/parsers/rst/include/isocyr1.txt

docutils/parsers/rst/include/isocyr2.txt

docutils/parsers/rst/include/isodia.txt

docutils/parsers/rst/include/isogrk1.txt

docutils/parsers/rst/include/isogrk2.txt

docutils/parsers/rst/include/isogrk3.txt

docutils/parsers/rst/include/isogrk4-wide.txt

docutils/parsers/rst/include/isogrk4.txt

docutils/parsers/rst/include/isolat1.txt

docutils/parsers/rst/include/isolat2.txt

docutils/parsers/rst/include/isomfrk-wide.txt

docutils/parsers/rst/include/isomfrk.txt

docutils/parsers/rst/include/isomopf-wide.txt

docutils/parsers/rst/include/isomopf.txt

docutils/parsers/rst/include/isomscr-wide.txt

docutils/parsers/rst/include/isomscr.txt

docutils/parsers/rst/include/isonum.txt

docutils/parsers/rst/include/isopub.txt

docutils/parsers/rst/include/isotech.txt

docutils/parsers/rst/include/mmlalias.txt

docutils/parsers/rst/include/mmlextra-wide.txt

docutils/parsers/rst/include/mmlextra.txt

docutils/parsers/rst/include/s5defs.txt

docutils/parsers/rst/include/xhtml1-lat1.txt

docutils/parsers/rst/include/xhtml1-special.txt

docutils/parsers/rst/include/xhtml1-symbol.txt

docutils/parsers/rst/languages/ca.py

docutils/parsers/rst/languages/fi.py

docutils/parsers/rst/languages/ja.py

docutils/parsers/rst/languages/nl.py

docutils/parsers/rst/languages/zh_cn.py

docutils/parsers/rst/languages/zh_tw.py

docutils/readers/doctree.py

docutils/transforms/writer_aux.py

docutils/writers/html4css1

docutils/writers/html4css1/__init__.py

docutils/writers/html4css1/html4css1.css

docutils/writers/latex2e

docutils/writers/latex2e/__init__.py

docutils/writers/latex2e/latex2e.tex

docutils/writers/newlatex2e

docutils/writers/newlatex2e/__init__.py

docutils/writers/newlatex2e/base.tex

docutils/writers/newlatex2e/unicode_map.py

docutils/writers/null.py

docutils/writers/pep_html

docutils/writers/pep_html/__init__.py

docutils/writers/pep_html/pep.css

docutils/writers/pep_html/template.txt

docutils/writers/s5_html

docutils/writers/s5_html/__init__.py

docutils/writers/s5_html/themes

docutils/writers/s5_html/themes/README.txt

docutils/writers/s5_html/themes/big-black

docutils/writers/s5_html/themes/big-black/__base__

docutils/writers/s5_html/themes/big-black/framing.css

docutils/writers/s5_html/themes/big-black/pretty.css

docutils/writers/s5_html/themes/big-white

docutils/writers/s5_html/themes/big-white/framing.css

docutils/writers/s5_html/themes/big-white/pretty.css

docutils/writers/s5_html/themes/default

docutils/writers/s5_html/themes/default/blank.gif

docutils/writers/s5_html/themes/default/framing.css

docutils/writers/s5_html/themes/default/iepngfix.htc

docutils/writers/s5_html/themes/default/opera.css

docutils/writers/s5_html/themes/default/outline.css

docutils/writers/s5_html/themes/default/pretty.css

docutils/writers/s5_html/themes/default/print.css

docutils/writers/s5_html/themes/default/s5-core.css

docutils/writers/s5_html/themes/default/slides.css

docutils/writers/s5_html/themes/default/slides.js

docutils/writers/s5_html/themes/medium-black

docutils/writers/s5_html/themes/medium-black/__base__

docutils/writers/s5_html/themes/medium-black/pretty.css

docutils/writers/s5_html/themes/medium-white

docutils/writers/s5_html/themes/medium-white/framing.css

docutils/writers/s5_html/themes/medium-white/pretty.css

docutils/writers/s5_html/themes/small-black

docutils/writers/s5_html/themes/small-black/__base__

docutils/writers/s5_html/themes/small-black/pretty.css

docutils/writers/s5_html/themes/small-white

docutils/writers/s5_html/themes/small-white/framing.css

docutils/writers/s5_html/themes/small-white/pretty.css

test/coverage.sh

test/data/csv_data.txt

test/data/csv_dep.txt

test/data/dependencies.txt

test/data/include.txt

test/data/raw.txt

test/data/stylesheet.txt

test/docutils_difflib.py

test/functional

test/functional/README.txt

test/functional/expected

test/functional/expected/compact_lists.html

test/functional/expected/dangerous.html

test/functional/expected/field_name_limit.html

test/functional/expected/latex_docinfo.tex

test/functional/expected/misc_rst_html4css1.html

test/functional/expected/pep_html.html

test/functional/expected/standalone_rst_html4css1.html

test/functional/expected/standalone_rst_latex.tex

test/functional/expected/standalone_rst_pseudoxml.txt

test/functional/expected/standalone_rst_s5_html_1.html

test/functional/expected/standalone_rst_s5_html_2.html

test/functional/expected/ui

test/functional/expected/ui/default

test/functional/expected/ui/default/blank.gif

test/functional/expected/ui/default/framing.css

test/functional/expected/ui/default/iepngfix.htc

test/functional/expected/ui/default/opera.css

test/functional/expected/ui/default/outline.css

test/functional/expected/ui/default/pretty.css

test/functional/expected/ui/default/print.css

test/functional/expected/ui/default/s5-core.css

test/functional/expected/ui/default/slides.css

test/functional/expected/ui/default/slides.js

test/functional/expected/ui/small-black

test/functional/expected/ui/small-black/blank.gif

test/functional/expected/ui/small-black/framing.css

test/functional/expected/ui/small-black/iepngfix.htc

test/functional/expected/ui/small-black/opera.css

test/functional/expected/ui/small-black/outline.css

test/functional/expected/ui/small-black/pretty.css

test/functional/expected/ui/small-black/print.css

test/functional/expected/ui/small-black/s5-core.css

test/functional/expected/ui/small-black/slides.css

test/functional/expected/ui/small-black/slides.js

test/functional/input

test/functional/input/compact_lists.txt

test/functional/input/dangerous.txt

test/functional/input/data

test/functional/input/data/custom_roles.txt

test/functional/input/data/errors.txt

test/functional/input/data/header_footer.txt

test/functional/input/data/latex.txt

test/functional/input/data/list_table.txt

test/functional/input/data/nonalphanumeric.txt

test/functional/input/data/standard.txt

test/functional/input/data/table_colspan.txt

test/functional/input/data/table_complex.txt

test/functional/input/data/table_rowspan.txt

test/functional/input/data/unicode.txt

test/functional/input/field_list.txt

test/functional/input/latex_docinfo.txt

test/functional/input/pep_html.txt

test/functional/input/simple.txt

test/functional/input/standalone_rst_html4css1.txt

test/functional/input/standalone_rst_latex.txt

test/functional/input/standalone_rst_newlatex.txt

test/functional/input/standalone_rst_pseudoxml.txt

test/functional/input/standalone_rst_s5_html.txt

test/functional/output

test/functional/output/README.txt

test/functional/tests

test/functional/tests/_default.py

test/functional/tests/_standalone_rst_defaults.py

test/functional/tests/compact_lists.py

test/functional/tests/dangerous.py

test/functional/tests/field_name_limit.py

test/functional/tests/latex_docinfo.py

test/functional/tests/misc_rst_html4css1.py

test/functional/tests/pep_html.py

test/functional/tests/standalone_rst_html4css1.py

test/functional/tests/standalone_rst_latex.py

test/functional/tests/standalone_rst_pseudoxml.py

test/functional/tests/standalone_rst_s5_html_1.py

test/functional/tests/standalone_rst_s5_html_2.py

test/test_dependencies.py

test/test_functional.py

test/test_io.py

test/test_parsers/test_rst/__init__.py

test/test_parsers/test_rst/test_directives/__init__.py

test/test_parsers/test_rst/test_directives/empty.txt

test/test_parsers/test_rst/test_directives/include 11.txt

test/test_parsers/test_rst/test_directives/test_compound.py

test/test_parsers/test_rst/test_directives/test_container.py

test/test_parsers/test_rst/test_directives/test_date.py

test/test_parsers/test_rst/test_directives/test_decorations.py

test/test_parsers/test_rst/test_directives/test_default_role.py

test/test_parsers/test_rst/test_directives/test_line_blocks.py

test/test_parsers/test_rst/test_directives/test_sidebars.py

test/test_parsers/test_rst/test_directives/test_tables.py

test/test_parsers/test_rst/test_directives/test_target_notes.py

test/test_parsers/test_rst/test_directives/utf-16.csv

test/test_parsers/test_rst/test_east_asian_text.py

test/test_parsers/test_rst/test_line_blocks.py

test/test_publisher.py

test/test_readers/test_pep/__init__.py

test/test_transforms/test___init__.py

test/test_transforms/test_expose_internals.py

test/test_transforms/test_strip_comments.py

test/test_transforms/test_target_notes.py

test/test_transforms/test_transitions.py

test/test_transforms/test_writer_aux.py

test/test_writers/test_html4css1.py

test/test_writers/test_html4css1_misc.py

test/test_writers/test_null.py

tools/dev

tools/dev/README.txt

tools/dev/create_unimap.py

tools/dev/profile_docutils.py

tools/dev/unicode2rstsubs.py

tools/editors/emacs/README.txt

tools/editors/emacs/docutils.conf

tools/editors/emacs/rst.el

tools/editors/emacs/tests

tools/editors/emacs/tests/Makefile

tools/editors/emacs/tests/README

tools/editors/emacs/tests/tests-adjust-section.el

tools/editors/emacs/tests/tests-basic.el

tools/editors/emacs/tests/tests-runner.el

tools/rst2newlatex.py

tools/rst2pseudoxml.py

tools/rst2s5.py

tools/rst2xml.py

tools/rstpep2html.py

files removed:
COPYING-orig.txt

MANIFEST.in

debian/NEWS.Debian

debian/python-difflib.copyright

debian/python-textwrap.copyright

debian/python2.1-difflib.copyright

debian/python2.1-textwrap.copyright

debian/python2.2-docutils.copyright

debian/python2.2-textwrap.copyright

debian/python2.3-docutils.copyright

docs/config.txt

docs/latex.txt

docs/rst

docs/rst/quickref.html

docs/rst/quickstart.txt

docs/tools.txt

docutils/writers/html4css1.py

docutils/writers/latex2e.py

docutils/writers/pep_html.py

extras/difflib.py

man/pep2html.1

man/rest2html.1

man/rest2latex.1

man/rest2xml.1

roman.py

setup_difflib.py

setup_roman.py

setup_textwrap.py

spec

spec/doctree.txt

spec/docutils.dtd

spec/howto

spec/howto/i18n.txt

spec/howto/rst-directives.txt

spec/howto/rst-roles.txt

spec/notes.txt

spec/pep-0256.txt

spec/pep-0257.txt

spec/pep-0258.txt

spec/pep-0287.txt

spec/pysource.dtd

spec/pysource.txt

spec/rst

spec/rst/alternatives.txt

spec/rst/directives.txt

spec/rst/interpreted.txt

spec/rst/introduction.txt

spec/rst/problems.txt

spec/rst/reStructuredText.txt

spec/semantics.txt

spec/transforms.txt

test/difflib.py

test/test_pep

test/test_pep/__init__.py

test/test_pep/test_inline_markup.py

test/test_pep/test_rfc2822.py

test/test_rst

test/test_rst/__init__.py

test/test_rst/test_SimpleTableParser.py

test/test_rst/test_TableParser.py

test/test_rst/test_block_quotes.py

test/test_rst/test_bullet_lists.py

test/test_rst/test_citations.py

test/test_rst/test_comments.py

test/test_rst/test_definition_lists.py

test/test_rst/test_directives

test/test_rst/test_directives/__init__.py

test/test_rst/test_directives/test_admonitions.py

test/test_rst/test_directives/test_contents.py

test/test_rst/test_directives/test_figures.py

test/test_rst/test_directives/test_images.py

test/test_rst/test_directives/test_meta.py

test/test_rst/test_directives/test_test_directives.py

test/test_rst/test_directives/test_unknown.py

test/test_rst/test_doctest_blocks.py

test/test_rst/test_enumerated_lists.py

test/test_rst/test_field_lists.py

test/test_rst/test_footnotes.py

test/test_rst/test_functions.py

test/test_rst/test_inline_markup.py

test/test_rst/test_literal_blocks.py

test/test_rst/test_option_lists.py

test/test_rst/test_outdenting.py

test/test_rst/test_paragraphs.py

test/test_rst/test_section_headers.py

test/test_rst/test_substitutions.py

test/test_rst/test_tables.py

test/test_rst/test_targets.py

test/test_rst/test_transitions.py

test/test_transforms/test_final_checks.py

test/test_writers/test_html4css1

test/test_writers/test_html4css1/__init__.py

test/test_writers/test_html4css1/test_parts.py

tools/default.css

tools/docutils-xml.py

tools/editors/emacs/restructuredtext.el

tools/editors/emacs/rst-html.el

tools/editors/emacs/rst-mode.el

tools/html.py

tools/pep-html-template

tools/pep.py

tools/pep2html.py

tools/publish.py

tools/stylesheets

tools/stylesheets/default.css

tools/stylesheets/pep.css

tools/stylesheets/style.tex

tools/test.txt

tools/unicode2rstsubs.py

files modified:
COPYING.txt

FAQ.txt

HISTORY.txt

README.txt

debian/README.Debian

debian/changelog

debian/compat

debian/control

debian/emacs-start.el

debian/python-docutils.copyright

debian/python-docutils.manpages

debian/python-roman.copyright

debian/rules

docutils/__init__.py

docutils/core.py

docutils/examples.py

docutils/frontend.py

docutils/io.py

docutils/languages/__init__.py

docutils/languages/af.py

docutils/languages/cs.py

docutils/languages/de.py

docutils/languages/en.py

docutils/languages/eo.py

docutils/languages/es.py

docutils/languages/fr.py

docutils/languages/it.py

docutils/languages/pt_br.py

docutils/languages/ru.py

docutils/languages/sk.py

docutils/languages/sv.py

docutils/nodes.py

docutils/parsers/__init__.py

docutils/parsers/rst/__init__.py

docutils/parsers/rst/directives/__init__.py

docutils/parsers/rst/directives/admonitions.py

docutils/parsers/rst/directives/body.py

docutils/parsers/rst/directives/html.py

docutils/parsers/rst/directives/images.py

docutils/parsers/rst/directives/misc.py

docutils/parsers/rst/directives/parts.py

docutils/parsers/rst/directives/references.py

docutils/parsers/rst/languages/__init__.py

docutils/parsers/rst/languages/af.py

docutils/parsers/rst/languages/cs.py

docutils/parsers/rst/languages/de.py

docutils/parsers/rst/languages/en.py

docutils/parsers/rst/languages/eo.py

docutils/parsers/rst/languages/es.py

docutils/parsers/rst/languages/fr.py

docutils/parsers/rst/languages/it.py

docutils/parsers/rst/languages/pt_br.py

docutils/parsers/rst/languages/ru.py

docutils/parsers/rst/languages/sk.py

docutils/parsers/rst/languages/sv.py

docutils/parsers/rst/roles.py

docutils/parsers/rst/states.py

docutils/parsers/rst/tableparser.py

docutils/readers/__init__.py

docutils/readers/pep.py

docutils/readers/python/__init__.py

docutils/readers/python/moduleparser.py

docutils/readers/python/pynodes.py

docutils/readers/standalone.py

docutils/statemachine.py

docutils/transforms/__init__.py

docutils/transforms/components.py

docutils/transforms/frontmatter.py

docutils/transforms/misc.py

docutils/transforms/parts.py

docutils/transforms/peps.py

docutils/transforms/references.py

docutils/transforms/universal.py

docutils/urischemes.py

docutils/utils.py

docutils/writers/__init__.py

docutils/writers/docutils_xml.py

docutils/writers/pseudoxml.py

extras/optparse.py

extras/textwrap.py

install.py

setup.py

test/DocutilsTestSupport.py

test/alltests.py

test/data/config_1.txt

test/data/config_2.txt

test/docutils.conf

test/package_unittest.py

test/test_language.py *

test/test_nodes.py

test/test_parsers/__init__.py

test/test_parsers/test_rst/test_SimpleTableParser.py *

test/test_parsers/test_rst/test_TableParser.py

test/test_parsers/test_rst/test_block_quotes.py

test/test_parsers/test_rst/test_bullet_lists.py

test/test_parsers/test_rst/test_citations.py

test/test_parsers/test_rst/test_comments.py

test/test_parsers/test_rst/test_definition_lists.py

test/test_parsers/test_rst/test_directives/test_admonitions.py

test/test_parsers/test_rst/test_directives/test_contents.py

test/test_parsers/test_rst/test_directives/test_figures.py

test/test_parsers/test_rst/test_directives/test_images.py

test/test_parsers/test_rst/test_directives/test_include.py

test/test_parsers/test_rst/test_directives/test_meta.py

test/test_parsers/test_rst/test_directives/test_raw.py

test/test_parsers/test_rst/test_directives/test_replace.py

test/test_parsers/test_rst/test_directives/test_role.py

test/test_parsers/test_rst/test_directives/test_rubrics.py

test/test_parsers/test_rst/test_directives/test_test_directives.py

test/test_parsers/test_rst/test_directives/test_topics.py *

test/test_parsers/test_rst/test_directives/test_unicode.py

test/test_parsers/test_rst/test_directives/test_unknown.py

test/test_parsers/test_rst/test_doctest_blocks.py

test/test_parsers/test_rst/test_enumerated_lists.py

test/test_parsers/test_rst/test_field_lists.py

test/test_parsers/test_rst/test_footnotes.py

test/test_parsers/test_rst/test_functions.py

test/test_parsers/test_rst/test_inline_markup.py

test/test_parsers/test_rst/test_interpreted.py *

test/test_parsers/test_rst/test_literal_blocks.py

test/test_parsers/test_rst/test_option_lists.py

test/test_parsers/test_rst/test_outdenting.py

test/test_parsers/test_rst/test_paragraphs.py

test/test_parsers/test_rst/test_section_headers.py

test/test_parsers/test_rst/test_substitutions.py

test/test_parsers/test_rst/test_tables.py

test/test_parsers/test_rst/test_targets.py

test/test_parsers/test_rst/test_transitions.py

test/test_readers/__init__.py

test/test_readers/test_pep/test_inline_markup.py *

test/test_readers/test_pep/test_rfc2822.py *

test/test_readers/test_python/__init__.py

test/test_readers/test_python/test_functions.py *

test/test_readers/test_python/test_parser.py *

test/test_readers/test_python/test_token_parser.py *

test/test_settings.py

test/test_statemachine.py

test/test_transforms/__init__.py

test/test_transforms/test_class.py

test/test_transforms/test_contents.py

test/test_transforms/test_docinfo.py

test/test_transforms/test_doctitle.py

test/test_transforms/test_filter.py *

test/test_transforms/test_footnotes.py

test/test_transforms/test_hyperlinks.py

test/test_transforms/test_messages.py

test/test_transforms/test_peps.py *

test/test_transforms/test_sectnum.py *

test/test_transforms/test_substitutions.py

test/test_utils.py

test/test_viewlist.py *

test/test_writers/__init__.py

test/test_writers/test_docutils_xml.py *

test/test_writers/test_latex2e.py *

test/test_writers/test_pseudoxml.py *

tools/buildhtml.py

tools/docutils.conf

tools/editors/README.txt

tools/quicktest.py

tools/rst2html.py

tools/rst2latex.py

Show diffs side-by-side

added added

removed removed

extras/difflib.py

#!/usr/bin/python2.1

"""

Module difflib -- helpers for computing deltas between objects.

Function get_close_matches(word, possibilities, n=3, cutoff=0.6):

Use SequenceMatcher to return list of the best "good enough" matches.

Function ndiff(a, b):

Return a delta: the difference between `a` and `b` (lists of strings).

Function restore(delta, which):

Return one of the two sequences that generated an ndiff delta.

Class SequenceMatcher:

A flexible class for comparing pairs of sequences of any type.

Class Differ:

For producing human-readable deltas from sequences of lines of text.

"""

__all__ = ['get_close_matches', 'ndiff', 'restore', 'SequenceMatcher',

'Differ']

TRACE = 0

class SequenceMatcher:

"""

SequenceMatcher is a flexible class for comparing pairs of sequences of

any type, so long as the sequence elements are hashable. The basic

algorithm predates, and is a little fancier than, an algorithm

published in the late 1980's by Ratcliff and Obershelp under the

hyperbolic name "gestalt pattern matching". The basic idea is to find

the longest contiguous matching subsequence that contains no "junk"

elements (R-O doesn't address junk). The same idea is then applied

recursively to the pieces of the sequences to the left and to the right

of the matching subsequence. This does not yield minimal edit

sequences, but does tend to yield matches that "look right" to people.

SequenceMatcher tries to compute a "human-friendly diff" between two

sequences. Unlike e.g. UNIX(tm) diff, the fundamental notion is the

longest *contiguous* & junk-free matching subsequence. That's what

catches people's eyes. The Windows(tm) windiff has another interesting

notion, pairing up elements that appear uniquely in each sequence.

That, and the method here, appear to yield more intuitive difference

reports than does diff. This method appears to be the least vulnerable

to synching up on blocks of "junk lines", though (like blank lines in

ordinary text files, or maybe "<P>" lines in HTML files). That may be

because this is the only method of the 3 that has a *concept* of

"junk" <wink>.

Example, comparing two strings, and considering blanks to be "junk":

>>> s = SequenceMatcher(lambda x: x == " ",

... "private Thread currentThread;",

... "private volatile Thread currentThread;")

>>>

.ratio() returns a float in [0, 1], measuring the "similarity" of the

sequences. As a rule of thumb, a .ratio() value over 0.6 means the

sequences are close matches:

>>> print round(s.ratio(), 3)

0.866

>>>

If you're only interested in where the sequences match,

.get_matching_blocks() is handy:

>>> for block in s.get_matching_blocks():

... print "a[%d] and b[%d] match for %d elements" % block

a[0] and b[0] match for 8 elements

a[8] and b[17] match for 6 elements

a[14] and b[23] match for 15 elements

a[29] and b[38] match for 0 elements

Note that the last tuple returned by .get_matching_blocks() is always a

dummy, (len(a), len(b), 0), and this is the only case in which the last

tuple element (number of elements matched) is 0.

If you want to know how to change the first sequence into the second,

use .get_opcodes():

>>> for opcode in s.get_opcodes():

... print "%6s a[%d:%d] b[%d:%d]" % opcode

equal a[0:8] b[0:8]

insert a[8:8] b[8:17]

equal a[8:14] b[17:23]

equal a[14:29] b[23:38]

See the Differ class for a fancy human-friendly file differencer, which

uses SequenceMatcher both to compare sequences of lines, and to compare

sequences of characters within similar (near-matching) lines.

See also function get_close_matches() in this module, which shows how

simple code building on SequenceMatcher can be used to do useful work.

Timing: Basic R-O is cubic time worst case and quadratic time expected

case. SequenceMatcher is quadratic time for the worst case and has

expected-case behavior dependent in a complicated way on how many

elements the sequences have in common; best case time is linear.

103

104

Methods:

105

106

__init__(isjunk=None, a='', b='')

107

Construct a SequenceMatcher.

108

109

set_seqs(a, b)

110

Set the two sequences to be compared.

111

112

set_seq1(a)

113

Set the first sequence to be compared.

114

115

set_seq2(b)

116

Set the second sequence to be compared.

117

118

find_longest_match(alo, ahi, blo, bhi)

119

Find longest matching block in a[alo:ahi] and b[blo:bhi].

120

121

get_matching_blocks()

122

Return list of triples describing matching subsequences.

123

124

get_opcodes()

125

Return list of 5-tuples describing how to turn a into b.

126

127

ratio()

128

Return a measure of the sequences' similarity (float in [0,1]).

129

130

quick_ratio()

131

Return an upper bound on .ratio() relatively quickly.

132

133

real_quick_ratio()

134

Return an upper bound on ratio() very quickly.

135

"""

136

137

def __init__(self, isjunk=None, a='', b=''):

138

"""Construct a SequenceMatcher.

139

140

Optional arg isjunk is None (the default), or a one-argument

function that takes a sequence element and returns true iff the

element is junk. None is equivalent to passing "lambda x: 0", i.e.

no elements are considered to be junk. For example, pass

lambda x: x in " \\t"

if you're comparing lines as sequences of characters, and don't

want to synch up on blanks or hard tabs.

147

148

Optional arg a is the first of two sequences to be compared. By

default, an empty string. The elements of a must be hashable. See

also .set_seqs() and .set_seq1().

151

152

Optional arg b is the second of two sequences to be compared. By

default, an empty string. The elements of b must be hashable. See

also .set_seqs() and .set_seq2().

155

"""

156

157

# Members:

158

# a

159

# first sequence

160

# b

161

# second sequence; differences are computed as "what do

162

# we need to do to 'a' to change it into 'b'?"

163

# b2j

164

# for x in b, b2j[x] is a list of the indices (into b)

165

# at which x appears; junk elements do not appear

166

# b2jhas

167

# b2j.has_key

168

# fullbcount

169

# for x in b, fullbcount[x] == the number of times x

170

# appears in b; only materialized if really needed (used

171

# only for computing quick_ratio())

172

# matching_blocks

173

# a list of (i, j, k) triples, where a[i:i+k] == b[j:j+k];

174

# ascending & non-overlapping in i and in j; terminated by

175

# a dummy (len(a), len(b), 0) sentinel

176

# opcodes

177

# a list of (tag, i1, i2, j1, j2) tuples, where tag is

178

# one of

179

# 'replace' a[i1:i2] should be replaced by b[j1:j2]

180

# 'delete' a[i1:i2] should be deleted

181

# 'insert' b[j1:j2] should be inserted

182

# 'equal' a[i1:i2] == b[j1:j2]

183

# isjunk

184

# a user-supplied function taking a sequence element and

185

# returning true iff the element is "junk" -- this has

186

# subtle but helpful effects on the algorithm, which I'll

187

# get around to writing up someday <0.9 wink>.

188

# DON'T USE! Only __chain_b uses this. Use isbjunk.

189

# isbjunk

190

# for x in b, isbjunk(x) == isjunk(x) but much faster;

191

# it's really the has_key method of a hidden dict.

192

# DOES NOT WORK for x in a!

193

194

self.isjunk = isjunk

195

self.a = self.b = None

196

self.set_seqs(a, b)

197

198

def set_seqs(self, a, b):

199

"""Set the two sequences to be compared.

200

201

>>> s = SequenceMatcher()

202

>>> s.set_seqs("abcd", "bcde")

203

>>> s.ratio()

204

0.75

205

"""

206

207

self.set_seq1(a)

208

self.set_seq2(b)

209

210

def set_seq1(self, a):

211

"""Set the first sequence to be compared.

212

213

The second sequence to be compared is not changed.

214

215

>>> s = SequenceMatcher(None, "abcd", "bcde")

216

>>> s.ratio()

217

0.75

218

>>> s.set_seq1("bcde")

219

>>> s.ratio()

220

1.0

221

>>>

222

223

SequenceMatcher computes and caches detailed information about the

second sequence, so if you want to compare one sequence S against

many sequences, use .set_seq2(S) once and call .set_seq1(x)

repeatedly for each of the other sequences.

227

228