~openerp-groupes/openobject-server/6.0-fix-setup-windows

« back to all changes in this revision

Viewing changes to bin/reportlab/tools/docco/t_parse.py

Committer: pinky
Date: 2006-12-07 13:41:40 UTC
Revision ID: pinky-3f10ee12cea3c4c75cef44ab04ad33ef47432907

New trunk

files added:

MANIFEST.in

bin/PKG-INFO

bin/__init__.py

bin/addons

bin/addons/__init__.py

bin/addons/base

bin/addons/base/__init__.py

bin/addons/base/__terp__.py

bin/addons/base/base.sql

bin/addons/base/base_data.xml

bin/addons/base/base_demo.xml

bin/addons/base/base_menu.xml

bin/addons/base/base_update.xml

bin/addons/base/ir

bin/addons/base/ir/__init__.py

bin/addons/base/ir/ir.xml

bin/addons/base/ir/ir_actions.py

bin/addons/base/ir/ir_attachment.py

bin/addons/base/ir/ir_cron.py

bin/addons/base/ir/ir_default.py

bin/addons/base/ir/ir_exports.py

bin/addons/base/ir/ir_fields_description.py

bin/addons/base/ir/ir_model.py

bin/addons/base/ir/ir_report_custom.py

bin/addons/base/ir/ir_sequence.py

bin/addons/base/ir/ir_translation.py

bin/addons/base/ir/ir_ui_menu.py

bin/addons/base/ir/ir_ui_view.py

bin/addons/base/ir/ir_values.py

bin/addons/base/ir/workflow

bin/addons/base/ir/workflow/__init__.py

bin/addons/base/ir/workflow/instance_print.py

bin/addons/base/ir/workflow/print_instance.py

bin/addons/base/ir/workflow/pydot

bin/addons/base/ir/workflow/pydot/LICENSE

bin/addons/base/ir/workflow/pydot/PKG-INFO

bin/addons/base/ir/workflow/pydot/README

bin/addons/base/ir/workflow/pydot/__init__.py

bin/addons/base/ir/workflow/pydot/dot_parser.py

bin/addons/base/ir/workflow/pydot/pydot.py

bin/addons/base/ir/workflow/pydot/setup.py

bin/addons/base/ir/workflow/workflow.py

bin/addons/base/ir/workflow/workflow_print.py

bin/addons/base/ir/workflow/workflow_view.xml

bin/addons/base/module

bin/addons/base/module/__init__.py

bin/addons/base/module/module.py

bin/addons/base/module/module.py.old

bin/addons/base/module/module_data.xml

bin/addons/base/module/module_report.xml

bin/addons/base/module/module_view.xml

bin/addons/base/module/module_wizard.xml

bin/addons/base/module/report

bin/addons/base/module/report/__init__.py

bin/addons/base/module/report/ir_module_reference.rml

bin/addons/base/module/report/ir_module_reference.sxw

bin/addons/base/module/report/ir_module_reference_print.py

bin/addons/base/module/wizard

bin/addons/base/module/wizard/__init__.py

bin/addons/base/module/wizard/add_new.py

bin/addons/base/module/wizard/wizard_export_lang.py

bin/addons/base/module/wizard/wizard_import_lang.py

bin/addons/base/module/wizard/wizard_install_module.py

bin/addons/base/module/wizard/wizard_module_info_get.py

bin/addons/base/module/wizard/wizard_module_lang_install.py

bin/addons/base/module/wizard/wizard_module_upgrade.py

bin/addons/base/module/wizard/wizard_update_module.py

bin/addons/base/report

bin/addons/base/report/custom.xsl

bin/addons/base/report/custom_default.xsl

bin/addons/base/report/custom_new.xsl

bin/addons/base/report/custom_rml.xsl

bin/addons/base/report/rml_template.xsl

bin/addons/base/res

bin/addons/base/res/__init__.py

bin/addons/base/res/ir_property.py

bin/addons/base/res/ir_property_view.xml

bin/addons/base/res/partner

bin/addons/base/res/partner/__init__.py

bin/addons/base/res/partner/crm.py

bin/addons/base/res/partner/crm_demo.xml

bin/addons/base/res/partner/crm_view.xml

bin/addons/base/res/partner/partner.py

bin/addons/base/res/partner/partner_data.xml

bin/addons/base/res/partner/partner_demo.xml

bin/addons/base/res/partner/partner_report.xml

bin/addons/base/res/partner/partner_view.xml

bin/addons/base/res/partner/partner_wizard.xml

bin/addons/base/res/partner/report

bin/addons/base/res/partner/report/__init__.py

bin/addons/base/res/partner/report/business_card.xml

bin/addons/base/res/partner/report/business_card.xsl

bin/addons/base/res/partner/report/partner_address.xml

bin/addons/base/res/partner/report/partner_address.xsl

bin/addons/base/res/partner/wizard

bin/addons/base/res/partner/wizard/__init__.py

bin/addons/base/res/partner/wizard/wizard_clear_ids.py

bin/addons/base/res/partner/wizard/wizard_ean_check.py

bin/addons/base/res/partner/wizard/wizard_sms.py

bin/addons/base/res/partner/wizard/wizard_spam.py

bin/addons/base/res/res_company.py

bin/addons/base/res/res_currency.py

bin/addons/base/res/res_currency_view.xml

bin/addons/base/res/res_request.py

bin/addons/base/res/res_request_view.xml

bin/addons/base/res/res_user.py

bin/addons/gen_graph.sh

bin/addons/module_graph.py

bin/gpl.txt

bin/i18n

bin/i18n/VERSION

bin/i18n/cs_CZ.csv

bin/i18n/de_DE.csv

bin/i18n/es_AR.csv

bin/i18n/es_ES.csv

bin/i18n/fr_CH.csv

bin/i18n/fr_FR.csv

bin/i18n/hu_HU.csv

bin/i18n/it_IT.csv

bin/i18n/nl_NL.csv

bin/i18n/pt_BR.csv

bin/i18n/pt_PT.csv

bin/i18n/ro_RO.csv

bin/i18n/ru_RU.csv

bin/i18n/sv_SE.csv

bin/i18n/zh_CN.csv

bin/i18n/zh_TW.csv

bin/ir

bin/ir/__init__.py

bin/ir/ir.py

bin/netsvc.py

bin/osv

bin/osv/__init__.py

bin/osv/fields.py

bin/osv/orm.py

bin/osv/osv.py

bin/pooler.py

bin/pychart

bin/pychart/__init__.py

bin/pychart/afm

bin/pychart/afm/AvantGarde_Book.py

bin/pychart/afm/AvantGarde_BookOblique.py

bin/pychart/afm/AvantGarde_Demi.py

bin/pychart/afm/AvantGarde_DemiOblique.py

bin/pychart/afm/Bookman_Demi.py

bin/pychart/afm/Bookman_DemiItalic.py

bin/pychart/afm/Bookman_Light.py

bin/pychart/afm/Bookman_LightItalic.py

bin/pychart/afm/Courier.py

bin/pychart/afm/Courier_Bold.py

bin/pychart/afm/Courier_BoldOblique.py

bin/pychart/afm/Courier_Oblique.py

bin/pychart/afm/Helvetica.py

bin/pychart/afm/Helvetica_Bold.py

bin/pychart/afm/Helvetica_BoldOblique.py

bin/pychart/afm/Helvetica_Light.py

bin/pychart/afm/Helvetica_LightOblique.py

bin/pychart/afm/Helvetica_Narrow.py

bin/pychart/afm/Helvetica_Narrow_Bold.py

bin/pychart/afm/Helvetica_Narrow_BoldOblique.py

bin/pychart/afm/Helvetica_Narrow_Oblique.py

bin/pychart/afm/Helvetica_Oblique.py

bin/pychart/afm/NewCenturySchlbk_Bold.py

bin/pychart/afm/NewCenturySchlbk_BoldItalic.py

bin/pychart/afm/NewCenturySchlbk_Italic.py

bin/pychart/afm/NewCenturySchlbk_Roman.py

bin/pychart/afm/Palatino_Bold.py

bin/pychart/afm/Palatino_BoldItalic.py

bin/pychart/afm/Palatino_Italic.py

bin/pychart/afm/Palatino_Roman.py

bin/pychart/afm/Symbol.py

bin/pychart/afm/Times_Bold.py

bin/pychart/afm/Times_BoldItalic.py

bin/pychart/afm/Times_Italic.py

bin/pychart/afm/Times_Roman.py

bin/pychart/afm/Utopia_Bold.py

bin/pychart/afm/Utopia_BoldItalic.py

bin/pychart/afm/Utopia_Italic.py

bin/pychart/afm/Utopia_Regular.py

bin/pychart/afm/ZapfChancery_MediumItalic.py

bin/pychart/afm/ZapfDingbats.py

bin/pychart/afm/__init__.py

bin/pychart/afm/dir.py

bin/pychart/area.py

bin/pychart/area_doc.py

bin/pychart/arrow.py

bin/pychart/arrow_doc.py

bin/pychart/axis.py

bin/pychart/axis_doc.py

bin/pychart/axis_x_doc.py

bin/pychart/axis_y_doc.py

bin/pychart/bar_plot.py

bin/pychart/bar_plot_doc.py

bin/pychart/basecanvas.py

bin/pychart/canvas.py

bin/pychart/category_coord.py

bin/pychart/chart_data.py

bin/pychart/chart_object.py

bin/pychart/color.py

bin/pychart/color_doc.py

bin/pychart/coord.py

bin/pychart/doc_support.py

bin/pychart/empty_docs.py

bin/pychart/error_bar.py

bin/pychart/error_bar_doc.py

bin/pychart/fill_style.py

bin/pychart/fill_style_doc.py

bin/pychart/font.py

bin/pychart/generate_docs.py

bin/pychart/gs_frontend.py

bin/pychart/interval_bar_plot.py

bin/pychart/legend.py

bin/pychart/legend_doc.py

bin/pychart/line_plot.py

bin/pychart/line_plot_doc.py

bin/pychart/line_style.py

bin/pychart/line_style_doc.py

bin/pychart/linear_coord.py

bin/pychart/log_coord.py

bin/pychart/object_set.py

bin/pychart/pdfcanvas.py

bin/pychart/pie_plot.py

bin/pychart/pie_plot_doc.py

bin/pychart/pngcanvas.py

bin/pychart/pscanvas.py

bin/pychart/pychart_types.py

bin/pychart/pychart_util.py

bin/pychart/range_plot.py

bin/pychart/range_plot_doc.py

bin/pychart/rose_plot.py

bin/pychart/scaling.py

bin/pychart/svgcanvas.py

bin/pychart/text_box.py

bin/pychart/text_box_doc.py

bin/pychart/theme.py

bin/pychart/tick_mark.py

bin/pychart/tick_mark_doc.py

bin/pychart/typechecker.py

bin/pychart/version.py

bin/pychart/x11canvas.py

bin/pychart/zap.py

bin/report

bin/report/__init__.py

bin/report/common.py

bin/report/custom.py

bin/report/int_to_text.py

bin/report/interface.py

bin/report/misc.py

bin/report/print_fnc.py

bin/report/print_xml.py

bin/report/printscreen

bin/report/printscreen/__init__.py

bin/report/printscreen/ps_form.py

bin/report/printscreen/ps_list.py

bin/report/render

bin/report/render/__init__.py

bin/report/render/render.py

bin/report/render/rml.py

bin/report/render/rml2html

bin/report/render/rml2html/__init__.py

bin/report/render/rml2html/rml2html.py

bin/report/render/rml2html/utils.py

bin/report/render/rml2pdf

bin/report/render/rml2pdf/__init__.py

bin/report/render/rml2pdf/color.py

bin/report/render/rml2pdf/trml2pdf.py

bin/report/render/rml2pdf/utils.py

bin/report/render/simple.py

bin/report/report_sxw.py

bin/reportlab

bin/reportlab/__init__.py

bin/reportlab/extensions

bin/reportlab/extensions/README

bin/reportlab/extensions/__init__.py

bin/reportlab/fonts

bin/reportlab/fonts/00readme.txt

bin/reportlab/fonts/Dustismo_Roman.ttf

bin/reportlab/fonts/PenguinAttack.ttf

bin/reportlab/fonts/Wargames.afm

bin/reportlab/fonts/Wargames.pfb

bin/reportlab/graphics

bin/reportlab/graphics/__init__.py

bin/reportlab/graphics/charts

bin/reportlab/graphics/charts/__init__.py

bin/reportlab/graphics/charts/areas.py

bin/reportlab/graphics/charts/axes.py

bin/reportlab/graphics/charts/barcharts.py

bin/reportlab/graphics/charts/dotbox.py

bin/reportlab/graphics/charts/doughnut.py

bin/reportlab/graphics/charts/legends.py

bin/reportlab/graphics/charts/linecharts.py

bin/reportlab/graphics/charts/lineplots.py

bin/reportlab/graphics/charts/markers.py

bin/reportlab/graphics/charts/piecharts.py

bin/reportlab/graphics/charts/slidebox.py

bin/reportlab/graphics/charts/spider.py

bin/reportlab/graphics/charts/textlabels.py

bin/reportlab/graphics/charts/utils.py

bin/reportlab/graphics/charts/utils3d.py

bin/reportlab/graphics/renderPDF.py

bin/reportlab/graphics/renderPM.py

bin/reportlab/graphics/renderPS.py

bin/reportlab/graphics/renderSVG.py

bin/reportlab/graphics/renderbase.py

bin/reportlab/graphics/samples

bin/reportlab/graphics/samples/__init__.py

bin/reportlab/graphics/samples/bubble.py

bin/reportlab/graphics/samples/clustered_bar.py

bin/reportlab/graphics/samples/clustered_column.py

bin/reportlab/graphics/samples/excelcolors.py

bin/reportlab/graphics/samples/exploded_pie.py

bin/reportlab/graphics/samples/filled_radar.py

bin/reportlab/graphics/samples/line_chart.py

bin/reportlab/graphics/samples/linechart_with_markers.py

bin/reportlab/graphics/samples/radar.py

bin/reportlab/graphics/samples/runall.py

bin/reportlab/graphics/samples/scatter.py

bin/reportlab/graphics/samples/scatter_lines.py

bin/reportlab/graphics/samples/scatter_lines_markers.py

bin/reportlab/graphics/samples/simple_pie.py

bin/reportlab/graphics/samples/stacked_bar.py

bin/reportlab/graphics/samples/stacked_column.py

bin/reportlab/graphics/shapes.py

bin/reportlab/graphics/testdrawings.py

bin/reportlab/graphics/testshapes.py

bin/reportlab/graphics/widgetbase.py

bin/reportlab/graphics/widgets

bin/reportlab/graphics/widgets/__init__.py

bin/reportlab/graphics/widgets/eventcal.py

bin/reportlab/graphics/widgets/flags.py

bin/reportlab/graphics/widgets/grids.py

bin/reportlab/graphics/widgets/markers.py

bin/reportlab/graphics/widgets/signsandsymbols.py

bin/reportlab/lib

bin/reportlab/lib/PyFontify.py

bin/reportlab/lib/__init__.py

bin/reportlab/lib/abag.py

bin/reportlab/lib/attrmap.py

bin/reportlab/lib/codecharts.py

bin/reportlab/lib/colors.py

bin/reportlab/lib/corp.py

bin/reportlab/lib/enums.py

bin/reportlab/lib/extformat.py

bin/reportlab/lib/fonts.py

bin/reportlab/lib/formatters.py

bin/reportlab/lib/logger.py

bin/reportlab/lib/normalDate.py

bin/reportlab/lib/pagesizes.py

bin/reportlab/lib/randomtext.py

bin/reportlab/lib/rparsexml.py

bin/reportlab/lib/sequencer.py

bin/reportlab/lib/set_ops.py

bin/reportlab/lib/styles.py

bin/reportlab/lib/tocindex.py

bin/reportlab/lib/units.py

bin/reportlab/lib/utils.py

bin/reportlab/lib/validators.py

bin/reportlab/lib/xmllib.py

bin/reportlab/lib/yaml.py

bin/reportlab/pdfbase

bin/reportlab/pdfbase/__init__.py

bin/reportlab/pdfbase/_cidfontdata.py

bin/reportlab/pdfbase/_fontdata.py

bin/reportlab/pdfbase/cidfonts.py

bin/reportlab/pdfbase/pdfdoc.py

bin/reportlab/pdfbase/pdfform.py

bin/reportlab/pdfbase/pdfmetrics.py

bin/reportlab/pdfbase/pdfpattern.py

bin/reportlab/pdfbase/pdfutils.py

bin/reportlab/pdfbase/ttfonts.py

bin/reportlab/pdfgen

bin/reportlab/pdfgen/__init__.py

bin/reportlab/pdfgen/canvas.py

bin/reportlab/pdfgen/pathobject.py

bin/reportlab/pdfgen/pdfgeom.py

bin/reportlab/pdfgen/pdfimages.py

bin/reportlab/pdfgen/pycanvas.py

bin/reportlab/pdfgen/textobject.py

bin/reportlab/platypus

bin/reportlab/platypus/__init__.py

bin/reportlab/platypus/doctemplate.py

bin/reportlab/platypus/figures.py

bin/reportlab/platypus/flowables.py

bin/reportlab/platypus/frames.py

bin/reportlab/platypus/para.py

bin/reportlab/platypus/paragraph.py

bin/reportlab/platypus/paraparser.py

bin/reportlab/platypus/tableofcontents.py

bin/reportlab/platypus/tables.py

bin/reportlab/platypus/xpreformatted.py

bin/reportlab/rl_config.py

bin/reportlab/tools

bin/reportlab/tools/README

bin/reportlab/tools/__init__.py

bin/reportlab/tools/docco

bin/reportlab/tools/docco/README

bin/reportlab/tools/docco/__init__.py

bin/reportlab/tools/docco/codegrab.py

bin/reportlab/tools/docco/docpy.py

bin/reportlab/tools/docco/examples.py

bin/reportlab/tools/docco/graphdocpy.py

bin/reportlab/tools/docco/rl_doc_utils.py

bin/reportlab/tools/docco/rltemplate.py

bin/reportlab/tools/docco/stylesheet.py

bin/reportlab/tools/docco/t_parse.py

bin/reportlab/tools/docco/yaml.py

bin/reportlab/tools/docco/yaml2pdf.py

bin/reportlab/tools/py2pdf

bin/reportlab/tools/py2pdf/README

bin/reportlab/tools/py2pdf/__init__.py

bin/reportlab/tools/py2pdf/demo-config.txt

bin/reportlab/tools/py2pdf/demo.py

bin/reportlab/tools/py2pdf/idle_print.py

bin/reportlab/tools/py2pdf/py2pdf.py

bin/reportlab/tools/py2pdf/vertpython.jpg

bin/reportlab/tools/pythonpoint

bin/reportlab/tools/pythonpoint/README

bin/reportlab/tools/pythonpoint/__init__.py

bin/reportlab/tools/pythonpoint/customshapes.py

bin/reportlab/tools/pythonpoint/demos

bin/reportlab/tools/pythonpoint/demos/htu.xml

bin/reportlab/tools/pythonpoint/demos/leftlogo.a85

bin/reportlab/tools/pythonpoint/demos/leftlogo.gif

bin/reportlab/tools/pythonpoint/demos/lj8100.jpg

bin/reportlab/tools/pythonpoint/demos/monterey.xml

bin/reportlab/tools/pythonpoint/demos/outline.gif

bin/reportlab/tools/pythonpoint/demos/pplogo.gif

bin/reportlab/tools/pythonpoint/demos/python.gif

bin/reportlab/tools/pythonpoint/demos/pythonpoint.xml

bin/reportlab/tools/pythonpoint/demos/spectrum.png

bin/reportlab/tools/pythonpoint/demos/vertpython.gif

bin/reportlab/tools/pythonpoint/pythonpoint.dtd

bin/reportlab/tools/pythonpoint/pythonpoint.py

bin/reportlab/tools/pythonpoint/stdparser.py

bin/reportlab/tools/pythonpoint/styles

bin/reportlab/tools/pythonpoint/styles/__init__.py

bin/reportlab/tools/pythonpoint/styles/horrible.py

bin/reportlab/tools/pythonpoint/styles/htu.py

bin/reportlab/tools/pythonpoint/styles/modern.py

bin/reportlab/tools/pythonpoint/styles/projection.py

bin/reportlab/tools/pythonpoint/styles/standard.py

bin/server.cert

bin/server.pkey

bin/service

bin/service/__init__.py

bin/service/security.py

bin/service/web_services.py

bin/sql_db.py

bin/ssl

bin/ssl/SecureXMLRPCServer.py

bin/ssl/__init__.py

bin/ssl/server.cert

bin/ssl/server.pkey

bin/tinyerp-server.py

bin/tools

bin/tools/__init__.py

bin/tools/amount_to_text.py

bin/tools/config.py

bin/tools/convert.py

bin/tools/decimal.py

bin/tools/import_email.py

bin/tools/misc.py

bin/tools/threadinglocal.py

bin/tools/translate.py

bin/tools/upgrade.py

bin/wizard

bin/wizard/__init__.py

bin/workflow

bin/workflow/__init__.py

bin/workflow/common.py

bin/workflow/instance.py

bin/workflow/wkf_expr.py

bin/workflow/wkf_logs.py

bin/workflow/wkf_service.py

bin/workflow/workitem.py

doc/COPYING

doc/Changelog

doc/INSTALL

doc/README

doc/README.pychart

doc/migrate

doc/migrate/3.3.0-3.4.0

doc/migrate/3.3.0-3.4.0/README

doc/migrate/3.3.0-3.4.0/post.py

doc/migrate/3.3.0-3.4.0/pre.py

doc/migrate/3.4.0-4.0.0

doc/migrate/3.4.0-4.0.0/pre.py

doc/tinyerp-icon.ico

doc/tinyerp-icon.png

man/terp_serverrc.5

man/tinyerp-server.1

setup.py

Show diffs side-by-side

added added

removed removed

bin/reportlab/tools/docco/t_parse.py

#Copyright ReportLab Europe Ltd. 2000-2004

#see license.txt for license details

#history http://www.reportlab.co.uk/cgi-bin/viewcvs.cgi/public/reportlab/trunk/reportlab/tools/docco/t_parse.py

"""

Template parsing module inspired by REXX (with thanks to Donn Cave for discussion).

Template initialization has the form:

T = Template(template_string, wild_card_marker, single_char_marker,

x = regex_x, y = regex_y, ...)

Parsing has the form

([match1, match2, ..., matchn], lastindex) = T.PARSE(string)

Only the first argument is mandatory.

The resultant object efficiently parses strings that match the template_string,

giving a list of substrings that correspond to each "directive" of the template.

Template directives:

Wildcard:

The template may be initialized with a wildcard that matches any string

up to the string matching the next directive (which may not be a wild

card or single character marker) or the next literal sequence of characters

of the template. The character that represents a wildcard is specified

by the wild_card_marker parameter, which has no default.

For example, using X as the wildcard:

>>> T = Template("prefixXinteriorX", "X")

>>> T.PARSE("prefix this is before interior and this is after")

([' this is before ', ' and this is after'], 48)

>>> T = Template("<X>X<X>", "X")

>>> T.PARSE('<A HREF="index.html">go to index</A>')

(['A HREF="index.html"', 'go to index', '/A'], 36)

Obviously the character used to represent the wildcard must be distinct

from the characters used to represent literals or other directives.

Fixed length character sequences:

The template may have a marker character which indicates a fixed

length field. All adjacent instances of this marker will be matched

by a substring of the same length in the parsed string. For example:

>>> T = Template("NNN-NN-NNNN", single_char_marker="N")

>>> T.PARSE("1-2-34-5-12")

(['1-2', '34', '5-12'], 11)

>>> T.PARSE("111-22-3333")

(['111', '22', '3333'], 11)

>>> T.PARSE("1111-22-3333")

ValueError: literal not found at (3, '-')

A template may have multiple fixed length markers, which allows fixed

length fields to be adjacent, but recognized separately. For example:

>>> T = Template("MMDDYYX", "X", "MDY")

>>> T.PARSE("112489 Somebody's birthday!")

(['11', '24', '89', " Somebody's birthday!"], 27)

Regular expression markers:

The template may have markers associated with regular expressions.

The regular expressions may be either string representations or compiled pattern objects.

For example:

>>> T = Template("v: s i", v=id, s=str, i=int)

>>> T.PARSE("this_is_an_identifier: 'a string' 12344")

(['this_is_an_identifier', "'a string'", '12344'], 39)

>>>

Here id, str, and int are regular expression conveniences provided by

this module.

Directive markers may be mixed and matched, except that wildcards cannot precede

wildcards or single character markers.

Example:

>>> T = Template("ssnum: NNN-NN-NNNN, fn=X, ln=X, age=I, quote=Q", "X", "N", I=int, Q=str)

>>> T.PARSE("ssnum: 123-45-6789, fn=Aaron, ln=Watters, age=13, quote='do be do be do'")

(['123', '45', '6789', 'Aaron', 'Watters', '13', "'do be do be do'"], 72)

>>>

"""

import re, string

from types import StringType

from string import find

# template parsing

# EG: T = Template("(NNN)NNN-NNNN X X", "X", "N")

# ([area, exch, ext, fn, ln], index) = T.PARSE("(908)949-2726 Aaron Watters")

class Template:

def __init__(self,

template,

wild_card_marker=None,

single_char_marker=None,

**marker_to_regex_dict):

self.template = template

self.wild_card = wild_card_marker

100

self.char = single_char_marker

101

# determine the set of markers for this template

102

markers = marker_to_regex_dict.keys()

103

if wild_card_marker:

104

markers.append(wild_card_marker)

105

if single_char_marker:

106

for ch in single_char_marker: # allow multiple scm's

107

markers.append(ch)

108

self.char = single_char_primary = single_char_marker[0]

109

self.markers = markers

110

for mark in markers:

111

if len(mark)>1:

112

raise ValueError, "Marks must be single characters: "+`mark`

113

# compile the regular expressions if needed

114

self.marker_dict = marker_dict = {}

115

for (mark, rgex) in marker_to_regex_dict.items():

116

if type(rgex) == StringType:

117

rgex = re.compile(rgex)

118

marker_dict[mark] = rgex

119

# determine the parse sequence

120

parse_seq = []

121

# dummy last char

122

lastchar = None

123

index = 0

124

last = len(template)

125

# count the number of directives encountered

126

ndirectives = 0

127

while index<last:

128

start = index

129

thischar = template[index]

130

# is it a wildcard?

131

if thischar == wild_card_marker:

132

if lastchar == wild_card_marker:

133

raise ValueError, "two wild cards in sequence is not allowed"

134

parse_seq.append( (wild_card_marker, None) )

135

index = index+1

136

ndirectives = ndirectives+1

137

# is it a sequence of single character markers?

138

elif single_char_marker and thischar in single_char_marker:

139

if lastchar == wild_card_marker:

140

raise ValueError, "wild card cannot precede single char marker"

141

while index<last and template[index] == thischar:

142

index = index+1

143

parse_seq.append( (single_char_primary, index-start) )

144

ndirectives = ndirectives+1

145

# is it a literal sequence?

146

elif not thischar in markers:

147

while index<last and not template[index] in markers:

148

index = index+1

149

parse_seq.append( (None, template[start:index]) )

150

# otherwise it must be a re marker

151

else:

152

rgex = marker_dict[thischar]

153

parse_seq.append( (thischar, rgex) )

154

ndirectives = ndirectives+1

155

index = index+1

156

lastchar = template[index-1]

157

self.parse_seq = parse_seq

158

self.ndirectives = ndirectives

159

160

def PARSE(self, str, start=0):

161

ndirectives = self.ndirectives

162

wild_card = self.wild_card

163

single_char = self.char

164

parse_seq = self.parse_seq

165

lparse_seq = len(parse_seq) - 1

166

# make a list long enough for substitutions for directives

167

result = [None] * ndirectives

168

current_directive_index = 0

169

currentindex = start

170

# scan through the parse sequence, recognizing

171

for parse_index in xrange(lparse_seq + 1):

172

(indicator, data) = parse_seq[parse_index]

173

# is it a literal indicator?

174

if indicator is None:

175

if find(str, data, currentindex) != currentindex:

176

raise ValueError, "literal not found at "+`(currentindex,data)`

177

currentindex = currentindex + len(data)

178

else:

179

# anything else is a directive

180

# is it a wildcard?

181

if indicator == wild_card:

182

# if it is the last directive then it matches the rest of the string

183

if parse_index == lparse_seq:

184

last = len(str)

185

# otherwise must look at next directive to find end of wildcard

186

else:

187

# next directive must be re or literal

188

(nextindicator, nextdata) = parse_seq[parse_index+1]

189

if nextindicator is None:

190

# search for literal

191

last = find(str, nextdata, currentindex)

192

if last<currentindex:

193

raise ValueError, \

194

"couldn't terminate wild with lit "+`currentindex`

195

else:

196

# data is a re, search for it

197

last = nextdata.search(str, currentindex)

198

if last<currentindex:

199

raise ValueError, \

200

"couldn't terminate wild with re "+`currentindex`

201

elif indicator == single_char:

202

# data is length to eat

203

last = currentindex + data

204

else:

205

# other directives are always regular expressions

206

last = data.match(str, currentindex) + currentindex

207

if last<currentindex:

208

raise ValueError, "couldn't match re at "+`currentindex`

209

#print "accepting", str[currentindex:last]

210

result[current_directive_index] = str[currentindex:last]

211

current_directive_index = current_directive_index+1

212

currentindex = last

213

# sanity check

214

if current_directive_index != ndirectives:

215

raise SystemError, "not enough directives found?"

216

return (result, currentindex)

217

218

# some useful regular expressions
# (string.ascii_letters rather than string.letters: the latter is
# locale-dependent and is not available on Python 3)
USERNAMEREGEX = \
    "["+string.ascii_letters+"]["+string.ascii_letters+string.digits+"_]*"
STRINGLITREGEX = "'[^\n']*'"
SIMPLEINTREGEX = "["+string.digits+"]+"
# Compiled conveniences for use as Template regex markers.  These names
# intentionally shadow the builtins; they are part of this module's API.
id = re.compile(USERNAMEREGEX)
str = re.compile(STRINGLITREGEX)
int = re.compile(SIMPLEINTREGEX)


def test():
    """Build a few sample templates and print what each one parses.

    The templates are stored in module globals (T, T1, T2, T3, T4) so they
    remain available after the call.
    """
    global T, T1, T2, T3, T4

    # fixed-length fields followed by wildcards
    T = Template("(NNN)NNN-NNNN X X", "X", "N")
    print(T.PARSE("(908)949-2726 Aaron Watters"))

    # regular-expression directives separated by literals
    T1 = Template("s --> s blah", s=str)
    s = "' <-- a string --> ' --> 'blah blah another string blah' blah"
    print(T1.PARSE(s))

    # all directive kinds in one template
    T2 = Template("s --> NNNiX", "X", "N", s=str, i=int)
    print(T2.PARSE("'A STRING' --> 15964653alpha beta gamma"))

    # wildcards terminated by regular expressions
    T3 = Template("XsXi", "X", "N", s=str, i=int)
    print(T3.PARSE("prefix'string'interior1234junk not parsed"))

    # several distinct fixed-length markers side by side
    T4 = Template("MMDDYYX", "X", "MDY")
    print(T4.PARSE("122961 Somebody's birthday!"))


if __name__=="__main__": test()

b'\\ No newline at end of file'

Older »