~ubuntu-branches/debian/squeeze/sword/squeeze

« back to all changes in this revision

Viewing changes to utilities/osis2mod.cpp

Committer: Bazaar Package Importer
Author(s): Jonathan Marsden, Jonathan Marsden, Dmitrijs Ledkovs, Closed Bugs
Date: 2009-05-30 11:55:55 UTC
mfrom: (1.3.1 upstream) (6.1.1 experimental)
Revision ID: james.westby@ubuntu.com-20090530115555-r427zsn3amivdpfu

Tags: 1.6.0+dfsg-1

http://bugs.debian.org/507960

https://launchpad.net/bugs/320558

http://bugs.debian.org/513448

https://launchpad.net/bugs/322638

https://launchpad.net/bugs/305172

[ Jonathan Marsden ]
* New upstream release. (Closes: #507960) (LP: #320558)
* debian/patches/02_libver.diff:
  - Bump SONAME to 8 -- SWORD 1.6 is not backward compatible with 1.5.11.
* debian/patches/series:
  - Remove 10_diatheke.diff -- included in upstream source.
* debian/patches/:
  - Remove several old unused .diff files.
  - Add 11_regex_only_when_needed.diff to conditionally include regex lib.
  - Add 12_fix_compiler_warnings.diff to remove all compiler warnings.
  - Add 13_fix_osis2mod_compression_default.diff from upstream svn.
  - Add 14_closing_section_not_chapter.diff from upstream svn.
* debian/libsword7.*:
  - Rename to libsword8.*
  - Change libsword7 to libsword8 within files.
* debian/rules:
  - SONAME bump to 8.
  - Set library version check to >= 1.6
* debian/control:
  - Change libsword7 to libsword8.
  - Add libsword7 to Conflicts.
  - Fix case of sword to SWORD in package descriptions.
  - Bump Standards-Version to 3.8.1 (no changes needed).
  - Fix section for libsword-dbg to avoid lintian warning.
* debian/rules:
  - Add DFSG get-orig-source target.
* debian/copyright:
  - Fix various mistakes in initial attempt to document copyrights.

[ Dmitrijs Ledkovs ]
* debian/rules: Added utils.mk to use missing-files target and call it on
  each build.
* debian/libsword-dev.install: Added libsword.la, previously missing.
* debian/libsword7.install: Added missing libicu translit files.
* debian/control:
  - Updated all uses of SWORD version to 1.6
  - Added libsword-dbg package
* debian/watch: Fixed a small mistake which was resulting in an extra "."
  in the final version name.
* debian/rules: simplified manpage processing.
* debian/libsword8.lintian-overrides: added override for module
  installation directory.
* debian/copyright: Updated with information about every file.
  Closes: #513448 LP: #322638
* debian/diatheke.examples: moved examples here from the diatheke.install
* debian/rules:
  - enabled shell script based testsuite
  - added commented out cppunit testsuite
* debian/patches/40_missing_includes.diff:
  - added several missing stdio.h includes to prevent FTBFS of testsuite.

[ Closed Bugs ]
* FTBFS on intrepid (LP: #305172)

files added:
AUTHORS

CODINGSTYLE

COPYING

ChangeLog

INSTALL

LICENSE

Makefile.am

Makefile.cvs

Makefile.in

NEWS

README

README.svn

aclocal.m4

arminst.sh

autogen.sh

bindings

bindings/Makefile

bindings/Makefile.am

bindings/README

bindings/autogen.sh

bindings/bcppmake

bindings/bcppmake/MainCLXTest.cpp

bindings/bcppmake/MainCLXTest.dfm

bindings/bcppmake/MainCLXTest.h

bindings/bcppmake/MainTest.cpp

bindings/bcppmake/MainTest.dfm

bindings/bcppmake/MainTest.h

bindings/bcppmake/Makefile.am

bindings/bcppmake/clxtest.bpr

bindings/bcppmake/clxtest.cpp

bindings/bcppmake/sword.bpf

bindings/bcppmake/sword.bpr

bindings/bcppmake/sword.c

bindings/bcppmake/sworddll.bpg

bindings/bcppmake/test.cpp

bindings/clx

bindings/clx/Sword.pas

bindings/clx/test1

bindings/clx/test1/MainFrm.pas

bindings/clx/test1/MainFrm.xfm

bindings/clx/test1/test1.conf

bindings/clx/test1/test1.dpr

bindings/clx/test1/test1.kof

bindings/clx/test1/test1.res

bindings/clx/test1/test1g.bpg

bindings/clx/test2

bindings/clx/test2/MainFrm.pas

bindings/clx/test2/MainFrm.xfm

bindings/clx/test2/test2.conf

bindings/clx/test2/test2.dpr

bindings/clx/test2/test2.kof

bindings/clx/test2/test2.res

bindings/configure.ac

bindings/corba

bindings/corba/Makefile.am

bindings/corba/java

bindings/corba/java/Makefile

bindings/corba/java/Makefile.in

bindings/corba/java/classes

bindings/corba/java/src

bindings/corba/java/src/org

bindings/corba/java/src/org/crosswire

bindings/corba/java/src/org/crosswire/sword

bindings/corba/java/src/org/crosswire/sword/orb

bindings/corba/java/src/org/crosswire/sword/orb/SwordOrb.java

bindings/corba/java/src/org/crosswire/util

bindings/corba/java/src/org/crosswire/util/Base64.java

bindings/corba/java/swordorb.jpx

bindings/corba/java/swordorb.jpx.local

bindings/corba/java/testclient

bindings/corba/orbitcpp

bindings/corba/orbitcpp/Makefile

bindings/corba/orbitcpp/Makefile.am

bindings/corba/orbitcpp/server.cpp

bindings/corba/orbitcpp/swordorb-impl.cpp

bindings/corba/orbitcpp/swordorb-impl.hpp

bindings/corba/orbitcpp/testclient.cpp

bindings/corba/orbitcpp/webmgr.hpp

bindings/corba/swordorb.idl

bindings/flatapi.cpp

bindings/gsoap

bindings/gsoap/Makefile

bindings/gsoap/Makefile.am

bindings/gsoap/gsoapsword.cpp

bindings/gsoap/gsoapsword.h

bindings/gsoap/include

bindings/gsoap/testclient.cpp

bindings/swig

bindings/swig/README

bindings/swig/bases.i

bindings/swig/defs.i

bindings/swig/directors.i

bindings/swig/encfiltmgr.i

bindings/swig/examples

bindings/swig/examples/mod2zmod.pl

bindings/swig/extras.i

bindings/swig/filemgr.i

bindings/swig/ftptrans.i

bindings/swig/installmgr.i

bindings/swig/listkey.i

bindings/swig/localemgr.i

bindings/swig/lzsscomprs.i

bindings/swig/markupcallback.h

bindings/swig/markupfiltmgr.i

bindings/swig/oldmake

bindings/swig/oldmake/Makefile.am

bindings/swig/oldmake/Makefile.oth

bindings/swig/oldmake/Makefile.swig

bindings/swig/osishtmlhref.i

bindings/swig/package

bindings/swig/package/Makefile.am

bindings/swig/package/Makefile.in

bindings/swig/package/README.cvs

bindings/swig/package/aclocal.m4

bindings/swig/package/autogen.sh

bindings/swig/package/bases.i

bindings/swig/package/config.guess

bindings/swig/package/config.sub

bindings/swig/package/configure

bindings/swig/package/configure.ac

bindings/swig/package/defs.i

bindings/swig/package/depcomp

bindings/swig/package/directors.i

bindings/swig/package/encfiltmgr.i

bindings/swig/package/extras.i

bindings/swig/package/filemgr.i

bindings/swig/package/ftptrans.i

bindings/swig/package/install-sh

bindings/swig/package/installmgr.i

bindings/swig/package/listkey.i

bindings/swig/package/localemgr.i

bindings/swig/package/ltmain.sh

bindings/swig/package/lzsscomprs.i

bindings/swig/package/markupcallback.h

bindings/swig/package/markupfiltmgr.i

bindings/swig/package/missing

bindings/swig/package/osishtmlhref.i

bindings/swig/package/perl.m4

bindings/swig/package/php4.m4

bindings/swig/package/python.m4

bindings/swig/package/rawcom.i

bindings/swig/package/rawgenbook.i

bindings/swig/package/rawld.i

bindings/swig/package/rawld4.i

bindings/swig/package/rawtext.i

bindings/swig/package/rendercallback.h

bindings/swig/package/searcher.h

bindings/swig/package/stringmgr.i

bindings/swig/package/swbuf.i

bindings/swig/package/swcacher.i

bindings/swig/package/swcom.i

bindings/swig/package/swcomprs.i

bindings/swig/package/swconfig.i

bindings/swig/package/swdisp.i

bindings/swig/package/swfilter.i

bindings/swig/package/swfiltermgr.i

bindings/swig/package/swgenbook.i

bindings/swig/package/swig.m4

bindings/swig/package/swkey.i

bindings/swig/package/swld.i

bindings/swig/package/swlocale.i

bindings/swig/package/swlog.i

bindings/swig/package/swmgr.i

bindings/swig/package/swmodule.i

bindings/swig/package/swobject.i

bindings/swig/package/swoptfilter.i

bindings/swig/package/sword.i

bindings/swig/package/sword.m4

bindings/swig/package/swsearchable.i

bindings/swig/package/swtext.i

bindings/swig/package/swversion.i

bindings/swig/package/tcl.m4

bindings/swig/package/templates.i

bindings/swig/package/treekey.i

bindings/swig/package/treekeyidx.i

bindings/swig/package/url.i

bindings/swig/package/utilxml.i

bindings/swig/package/versekey.i

bindings/swig/package/versetreekey.i

bindings/swig/package/zcom.i

bindings/swig/package/zipcomprs.i

bindings/swig/package/zld.i

bindings/swig/package/zlib.m4

bindings/swig/package/ztext.i

bindings/swig/rawcom.i

bindings/swig/rawgenbook.i

bindings/swig/rawld.i

bindings/swig/rawld4.i

bindings/swig/rawtext.i

bindings/swig/rendercallback.h

bindings/swig/searcher.h

bindings/swig/stringmgr.i

bindings/swig/swbuf.i

bindings/swig/swcacher.i

bindings/swig/swcom.i

bindings/swig/swcomprs.i

bindings/swig/swconfig.i

bindings/swig/swdisp.i

bindings/swig/swfilter.i

bindings/swig/swfiltermgr.i

bindings/swig/swgenbook.i

bindings/swig/swig-perl.doxygen

bindings/swig/swkey.i

bindings/swig/swld.i

bindings/swig/swlocale.i

bindings/swig/swlog.i

bindings/swig/swmgr.i

bindings/swig/swmodule.i

bindings/swig/swobject.i

bindings/swig/swoptfilter.i

bindings/swig/sword.i

bindings/swig/sword.pl

bindings/swig/swsearchable.i

bindings/swig/swtext.i

bindings/swig/swversion.i

bindings/swig/templates.i

bindings/swig/treekey.i

bindings/swig/treekeyidx.i

bindings/swig/url.i

bindings/swig/utilxml.i

bindings/swig/versekey.i

bindings/swig/versetreekey.i

bindings/swig/vstudio

bindings/swig/vstudio/SwigSword.csproj

bindings/swig/vstudio/libsword-csharpbindings.sln

bindings/swig/vstudio/libsword_csharpsword.vcproj

bindings/swig/zcom.i

bindings/swig/zipcomprs.i

bindings/swig/zld.i

bindings/swig/ztext.i

bindings/usrinst.sh

buildtest.cpp

config.guess

config.h.in

config.sub

configure

configure.ac

debian/addld.1.pod

debian/diatheke.1

debian/diatheke.examples

debian/diatheke.manpages

debian/imp2gbs.1.pod

debian/imp2ld.1.pod

debian/imp2vs.1.pod

debian/installmgr.1.pod

debian/libsword8.dirs

debian/libsword8.docs

debian/libsword8.install

debian/libsword8.links

debian/libsword8.lintian-overrides

debian/libsword8.manpages

debian/mkfastmod.1.pod

debian/mod2imp.1.pod

debian/osis2mod.1.pod

debian/patches/11_regex_only_when_needed.diff

debian/patches/12_fix_compiler_warnings.diff

debian/patches/13_fix_osis2mod_compression_default.diff

debian/patches/14_closing_section_not_chapter.diff

debian/patches/40_missing_includes.diff

debian/tei2mod.1.pod

debian/vpl2mod.1.pod

debian/vs2osisref.1.pod

debian/watch

debian/xml2gbs.1.pod

depcomp

distignore

doc/Doxyfile

doc/Makefile.am

doc/README

doc/greektrans.txt

doc/translation-template.conf

examples

examples/Makefile.am

examples/Makefile.in

examples/classes

examples/classes/Makefile

examples/classes/ciphercng.cpp

examples/classes/swmgrex.cpp

examples/cmdline

examples/cmdline/Makefile.am

examples/cmdline/Makefile.in

examples/cmdline/bcppmake

examples/cmdline/bcppmake/cmdline.bpg

examples/cmdline/bcppmake/listoptions.bpf

examples/cmdline/bcppmake/listoptions.bpr

examples/cmdline/bcppmake/lookup.bpf

examples/cmdline/bcppmake/lookup.bpr

examples/cmdline/bcppmake/outplain.bpf

examples/cmdline/bcppmake/outplain.bpr

examples/cmdline/bcppmake/outrender.bpf

examples/cmdline/bcppmake/outrender.bpr

examples/cmdline/bcppmake/search.bpf

examples/cmdline/bcppmake/search.bpr

examples/cmdline/bcppmake/threaded_search.bpf

examples/cmdline/bcppmake/threaded_search.bpr

examples/cmdline/bcppmake/verserangeparse.bpf

examples/cmdline/bcppmake/verserangeparse.bpr

examples/cmdline/listoptions.cpp

examples/cmdline/lookup.cpp

examples/cmdline/outplain.cpp

examples/cmdline/outrender.cpp

examples/cmdline/search.cpp

examples/cmdline/threaded_search.cpp

examples/cmdline/verserangeparse.cpp

examples/simple.cpp

icu/Makefile.am

icu/Makefile.in

icu/translit_Any_Latex.txt

icu/translit_Any_Latin1.txt

icu/translit_BETA_Greek.txt

icu/translit_BGreek_Greek.txt

icu/translit_CCAT_Hebrew.txt

icu/translit_CCAT_Syriac.txt

icu/translit_Latin_Arabic.txt

icu/translit_Latin_Armenian.txt

icu/translit_Latin_Coptic.txt

icu/translit_Latin_Ethiopic.txt

icu/translit_Latin_Georgian.txt

icu/translit_Latin_Gothic.txt

icu/translit_Latin_Hebrew.txt

icu/translit_Latin_Syriac.txt

icu/translit_Latin_Thai.txt

icu/translit_Latin_Ugaritic.txt

icu/translit_swordindex.txt

include

include/Greek2Greek.h

include/GreekChars.h

include/Makefile

include/Makefile.am

include/SwordAPI.pas

include/canon.h

include/canon_abbrevs.h

include/canon_kjva.h

include/canon_leningrad.h

include/canon_mt.h

include/canon_nrsv.h

include/canon_nrsva.h

include/canon_null.h

include/cipherfil.h

include/config.h

include/config.h.in

include/curlftpt.h

include/curlhttpt.h

include/defs.h

include/echomod.h

include/encfiltmgr.h

include/entriesblk.h

include/femain.h

include/filemgr.h

include/flatapi.h

include/ftplib.h

include/ftplibftpt.h

include/ftpparse.h

include/ftptrans.h

include/gbffootnotes.h

include/gbfheadings.h

include/gbfhtml.h

include/gbfhtmlhref.h

include/gbfmorph.h

include/gbfosis.h

include/gbfplain.h

include/gbfredletterwords.h

include/gbfrtf.h

include/gbfstrongs.h

include/gbfthml.h

include/gbfwebif.h

include/gbfwordjs.h

include/greeklexattribs.h

include/hebrewmcim.h

include/hrefcom.h

include/installmgr.h

include/latin1utf16.h

include/latin1utf8.h

include/listkey.h

include/localemgr.h

include/lzsscomprs.h

include/markupfiltmgr.h

include/multimapwdef.h

include/nullim.h

include/osisfootnotes.h

include/osisheadings.h

include/osishtmlhref.h

include/osislemma.h

include/osismorph.h

include/osismorphsegmentation.h

include/osisosis.h

include/osisplain.h

include/osisredletterwords.h

include/osisrtf.h

include/osisruby.h

include/osisscripref.h

include/osisstrongs.h

include/osisvariants.h

include/osiswebif.h

include/osiswordjs.h

include/papyriplain.h

include/plainfootnotes.h

include/plainhtml.h

include/rawcom.h

include/rawcom4.h

include/rawfiles.h

include/rawgenbook.h

include/rawld.h

include/rawld4.h

include/rawstr.h

include/rawstr4.h

include/rawtext.h

include/rawtext4.h

include/rawverse.h

include/rawverse4.h

include/roman.h

include/rtfhtml.h

include/sapphire.h

include/stringmgr.h

include/strkey.h

include/swbasicfilter.h

include/swbuf.h

include/swcacher.h

include/swcipher.h

include/swcom.h

include/swcomprs.h

include/swconfig.h

include/swdisp.h

include/swfilter.h

include/swfiltermgr.h

include/swgenbook.h

include/swinputmeth.h

include/swkey.h

include/swld.h

include/swlocale.h

include/swlog.h

include/swmacs.h

include/swmgr.h

include/swmodule.h

include/swobject.h

include/swoptfilter.h

include/swsearchable.h

include/swtext.h

include/swunicod.h

include/swversion.h

include/sysdata.h

include/teihtmlhref.h

include/teiplain.h

include/teirtf.h

include/thmlfootnotes.h

include/thmlgbf.h

include/thmlheadings.h

include/thmlhtml.h

include/thmlhtmlhref.h

include/thmllemma.h

include/thmlmorph.h

include/thmlosis.h

include/thmlplain.h

include/thmlrtf.h

include/thmlscripref.h

include/thmlstrongs.h

include/thmlvariants.h

include/thmlwebif.h

include/thmlwordjs.h

include/treekey.h

include/treekeyidx.h

include/unicodertf.h

include/untgz.h

include/url.h

include/utf16utf8.h

include/utf8arabicpoints.h

include/utf8arshaping.h

include/utf8bidireorder.h

include/utf8cantillation.h

include/utf8greekaccents.h

include/utf8hebrewpoints.h

include/utf8html.h

include/utf8latin1.h

include/utf8nfc.h

include/utf8nfkd.h

include/utf8transliterator.h

include/utf8utf16.h

include/utilstr.h

include/utilxml.h

include/versekey.h

include/versemgr.h

include/versetreekey.h

include/zcom.h

include/zconf.h

include/zipcomprs.h

include/zld.h

include/zstr.h

include/ztext.h

include/zverse.h

install-sh

lib/Makefile.am

lib/Makefile.in

lib/README

lib/bcppmake

lib/bcppmake/libsword.bdsproj

lib/bcppmake/libsword.bpf

lib/bcppmake/libsword.bpr

lib/bcppmake/libsword6icu.bpf

lib/bcppmake/libsword6icu.bpr

lib/vcppmake

lib/vcppmake/vc8

lib/vcppmake/vc8/libsword.vcproj

locales.d

locales.d/Makefile.am

locales.d/abbr.conf

locales.d/af-utf8.conf

locales.d/af.conf

locales.d/ar_EG-cp1256.conf

locales.d/ar_EG-utf8.conf

locales.d/bg_BG-cp1251.conf

locales.d/bg_BG-utf8.conf

locales.d/cs-utf8.conf

locales.d/cs.conf

locales.d/cy-utf8.conf

locales.d/cy.conf

locales.d/da-utf8.conf

locales.d/da.conf

locales.d/de-utf8.conf

locales.d/de.conf

locales.d/de_abbrev-utf8.conf

locales.d/de_abbrev.conf

locales.d/en_GB.conf

locales.d/es-utf8.conf

locales.d/es.conf

locales.d/et-utf8.conf

locales.d/et.conf

locales.d/et_abbr-utf8.conf

locales.d/et_abbr.conf

locales.d/fa-utf8.conf

locales.d/fi-utf8.conf

locales.d/fi.conf

locales.d/fr-utf8.conf

locales.d/fr.conf

locales.d/fr_abbrev-utf8.conf

locales.d/fr_abbrev.conf

locales.d/ga-utf8.conf

locales.d/he-utf8.conf

locales.d/hu-utf8.conf

locales.d/hu.conf

locales.d/id-utf8.conf

locales.d/id.conf

locales.d/it-utf8.conf

locales.d/it.conf

locales.d/ja-utf8.conf

locales.d/ko-utf8.conf

locales.d/ko.conf

locales.d/ko_abbrev-utf8.conf

locales.d/ko_abbrev.conf

locales.d/la-utf8.conf

locales.d/la.conf

locales.d/lt-utf8.conf

locales.d/mt-utf8.conf

locales.d/nb-utf8.conf

locales.d/nb.conf

locales.d/nl-utf8.conf

locales.d/nl.conf

locales.d/no-utf8.conf

locales.d/no.conf

locales.d/pl-utf8.conf

locales.d/pl.conf

locales.d/pt-utf8.conf

locales.d/pt.conf

locales.d/pt_BR-utf8.conf

locales.d/pt_BR.conf

locales.d/ro-utf8.conf

locales.d/ro.conf

locales.d/ru_RU-cp1251.conf

locales.d/ru_RU-koi8-r.conf

locales.d/ru_RU-utf8.conf

locales.d/sk-utf8.conf

locales.d/sk.conf

locales.d/sl-utf8.conf

locales.d/sl.conf

locales.d/sv-utf8.conf

locales.d/sv.conf

locales.d/th-utf8.conf

locales.d/uk_UA-cp1251.conf

locales.d/uk_UA-koi8-u.conf

locales.d/uk_UA-utf8.conf

locales.d/vi-utf8.conf

locales.d/zh_TW-utf8.conf

locales.d/zh_english-utf8.conf

ltmain.sh

m4/acx_clucene.m4

m4/cppunit.m4

m4/libtool.m4

m4/ltoptions.m4

m4/ltsugar.m4

m4/ltversion.m4

m4/lt~obsolete.m4

missing

obj/Makefile

olb/Convert.bpr

olb/Convert.cpp

olb/Doinit.c

olb/Getstrng.c

olb/Getvrsn.c

olb/Mainfrm.cpp

olb/Mainfrm.dfm

olb/Mainfrm.h

olb/Online.c

olb/addstrongs.cpp

olb/dumpav.cpp

olb/olb.bpg

olb/olb2sword.bpr

olb/olb2sword.cpp

olb/online.ide

olb/online.prj

olb/prn2sword.bpr

olb/prn2sword.cpp

olb/prn2swordfrm.cpp

olb/prn2swordfrm.dfm

olb/prn2swordfrm.h

pix/sword.gif

samples

samples/Makefile.am

samples/mods.conf.large

samples/mods.conf.small

samples/mods.d

samples/mods.d/globals.conf

samples/mods.d/rwp.conf

samples/mods.d/strongsnt.conf

samples/mods.d/strongsot.conf

samples/mods.d/vines.conf

samples/mods.d/web.conf

samples/mods.d/websters.conf

samples/recommended

samples/recommended/README

samples/recommended/sword.conf

scripts

scripts/burncd

scripts/demotar

scripts/disttar

scripts/dlltar

scripts/eastonstar

scripts/mhctar

scripts/mkcd

scripts/mkswordbase

scripts/mkswordbase2

scripts/mkswordtar

scripts/svetar

scripts/swordenv

scripts/swtxtdsp.bat

scripts/vinestar

scripts/webtar

src/Makefile

src/frontend

src/frontend/Makefile

src/frontend/Makefile.am

src/frontend/X11

src/frontend/X11/Makefile

src/frontend/framework

src/frontend/framework/Makefile

src/frontend/framework/femain.cpp

src/frontend/im

src/frontend/im/Makefile

src/frontend/im/hebrewmcim.cpp

src/frontend/im/nullim.cpp

src/frontend/im/swinputmeth.cpp

src/frontend/swdisp.cpp

src/frontend/swlog.cpp

src/frontend/windoze

src/frontend/windoze/Makefile

src/keys

src/keys/Makefile

src/keys/Makefile.am

src/keys/genarray.c

src/keys/listkey.cpp

src/keys/nt.bks

src/keys/nt.cps

src/keys/ot.bks

src/keys/ot.cps

src/keys/strkey.cpp

src/keys/swkey.cpp

src/keys/treekey.cpp

src/keys/treekeyidx.cpp

src/keys/versekey.cpp

src/keys/versetreekey.cpp

src/mgr

src/mgr/Makefile

src/mgr/Makefile.am

src/mgr/curlftpt.cpp

src/mgr/curlhttpt.cpp

src/mgr/encfiltmgr.cpp

src/mgr/filemgr.cpp

src/mgr/ftplibftpt.cpp

src/mgr/ftptrans.cpp

src/mgr/installmgr.cpp

src/mgr/localemgr.cpp

src/mgr/markupfiltmgr.cpp

src/mgr/stringmgr.cpp

src/mgr/swcacher.cpp

src/mgr/swconfig.cpp

src/mgr/swfiltermgr.cpp

src/mgr/swlocale.cpp

src/mgr/swmgr.cpp

src/mgr/swsearchable.cpp

src/mgr/versemgr.cpp

src/modules

src/modules/Makefile

src/modules/Makefile.am

src/modules/comments

src/modules/comments/Makefile

src/modules/comments/Makefile.am

src/modules/comments/hrefcom

src/modules/comments/hrefcom/Makefile

src/modules/comments/hrefcom/Makefile.am

src/modules/comments/hrefcom/hrefcom.cpp

src/modules/comments/rawcom

src/modules/comments/rawcom/Makefile

src/modules/comments/rawcom/Makefile.am

src/modules/comments/rawcom/rawcom.cpp

src/modules/comments/rawcom4

src/modules/comments/rawcom4/Makefile.am

src/modules/comments/rawcom4/rawcom4.cpp

src/modules/comments/rawfiles

src/modules/comments/rawfiles/Makefile

src/modules/comments/rawfiles/Makefile.am

src/modules/comments/rawfiles/rawfiles.cpp

src/modules/comments/swcom.cpp

src/modules/comments/zcom

src/modules/comments/zcom/Makefile

src/modules/comments/zcom/Makefile.am

src/modules/comments/zcom/zcom.cpp

src/modules/common

src/modules/common/Makefile

src/modules/common/Makefile.am

src/modules/common/compress.cpp.txt

src/modules/common/entriesblk.cpp

src/modules/common/lzsscomprs.cpp

src/modules/common/rawstr.cpp

src/modules/common/rawstr4.cpp

src/modules/common/rawverse.cpp

src/modules/common/rawverse4.cpp

src/modules/common/sapphire.cpp

src/modules/common/swcipher.cpp

src/modules/common/swcomprs.cpp

src/modules/common/swcomprs.doc

src/modules/common/zipcomprs.cpp

src/modules/common/zstr.cpp

src/modules/common/zverse.cpp

src/modules/filters

src/modules/filters/Makefile

src/modules/filters/Makefile.am

src/modules/filters/cipherfil.cpp

src/modules/filters/gbffootnotes.cpp

src/modules/filters/gbfheadings.cpp

src/modules/filters/gbfhtml.cpp

src/modules/filters/gbfhtmlhref.cpp

src/modules/filters/gbfmorph.cpp

src/modules/filters/gbfosis.cpp

src/modules/filters/gbfplain.cpp

src/modules/filters/gbfredletterwords.cpp

src/modules/filters/gbfrtf.cpp

src/modules/filters/gbfstrongs.cpp

src/modules/filters/gbfthml.cpp

src/modules/filters/gbfwebif.cpp

src/modules/filters/gbfwordjs.cpp

src/modules/filters/greeklexattribs.cpp

src/modules/filters/latin1utf16.cpp

src/modules/filters/latin1utf8.cpp

src/modules/filters/osisfootnotes.cpp

src/modules/filters/osisheadings.cpp

src/modules/filters/osishtmlhref.cpp

src/modules/filters/osislemma.cpp

src/modules/filters/osismorph.cpp

src/modules/filters/osismorphsegmentation.cpp

src/modules/filters/osisosis.cpp

src/modules/filters/osisplain.cpp

src/modules/filters/osisredletterwords.cpp

src/modules/filters/osisrtf.cpp

src/modules/filters/osisruby.cpp

src/modules/filters/osisscripref.cpp

src/modules/filters/osisstrongs.cpp

src/modules/filters/osisvariants.cpp

src/modules/filters/osiswebif.cpp

src/modules/filters/osiswordjs.cpp

src/modules/filters/papyriplain.cpp

src/modules/filters/plainfootnotes.cpp

src/modules/filters/plainhtml.cpp

src/modules/filters/rtfhtml.cpp

src/modules/filters/swbasicfilter.cpp

src/modules/filters/swoptfilter.cpp

src/modules/filters/teihtmlhref.cpp

src/modules/filters/teiplain.cpp

src/modules/filters/teirtf.cpp

src/modules/filters/thmlfootnotes.cpp

src/modules/filters/thmlgbf.cpp

src/modules/filters/thmlheadings.cpp

src/modules/filters/thmlhtml.cpp

src/modules/filters/thmlhtmlhref.cpp

src/modules/filters/thmllemma.cpp

src/modules/filters/thmlmorph.cpp

src/modules/filters/thmlosis.cpp

src/modules/filters/thmlplain.cpp

src/modules/filters/thmlrtf.cpp

src/modules/filters/thmlscripref.cpp

src/modules/filters/thmlstrongs.cpp

src/modules/filters/thmlvariants.cpp

src/modules/filters/thmlwebif.cpp

src/modules/filters/thmlwordjs.cpp

src/modules/filters/unicodertf.cpp

src/modules/filters/utf16utf8.cpp

src/modules/filters/utf8arabicpoints.cpp

src/modules/filters/utf8arshaping.cpp

src/modules/filters/utf8bidireorder.cpp

src/modules/filters/utf8cantillation.cpp

src/modules/filters/utf8greekaccents.cpp

src/modules/filters/utf8hebrewpoints.cpp

src/modules/filters/utf8html.cpp

src/modules/filters/utf8latin1.cpp

src/modules/filters/utf8nfc.cpp

src/modules/filters/utf8nfkd.cpp

src/modules/filters/utf8transliterator.cpp

src/modules/filters/utf8utf16.cpp

src/modules/genbook

src/modules/genbook/Makefile

src/modules/genbook/Makefile.am

src/modules/genbook/rawgenbook

src/modules/genbook/rawgenbook/Makefile

src/modules/genbook/rawgenbook/Makefile.am

src/modules/genbook/rawgenbook/rawgenbook.cpp

src/modules/genbook/swgenbook.cpp

src/modules/lexdict

src/modules/lexdict/Makefile

src/modules/lexdict/Makefile.am

src/modules/lexdict/rawld

src/modules/lexdict/rawld/Makefile

src/modules/lexdict/rawld/Makefile.am

src/modules/lexdict/rawld/rawld.cpp

src/modules/lexdict/rawld4

src/modules/lexdict/rawld4/Makefile

src/modules/lexdict/rawld4/Makefile.am

src/modules/lexdict/rawld4/rawld4.cpp

src/modules/lexdict/swld.cpp

src/modules/lexdict/zld

src/modules/lexdict/zld/Makefile

src/modules/lexdict/zld/Makefile.am

src/modules/lexdict/zld/zld.cpp

src/modules/readme

src/modules/swmodule.cpp

src/modules/tests

src/modules/tests/Makefile

src/modules/tests/echomod.cpp

src/modules/texts

src/modules/texts/Makefile

src/modules/texts/Makefile.am

src/modules/texts/rawtext

src/modules/texts/rawtext/Makefile

src/modules/texts/rawtext/Makefile.am

src/modules/texts/rawtext/rawtext.cpp

src/modules/texts/rawtext4

src/modules/texts/rawtext4/Makefile.am

src/modules/texts/rawtext4/rawtext4.cpp

src/modules/texts/swtext.cpp

src/modules/texts/ztext

src/modules/texts/ztext/Makefile

src/modules/texts/ztext/Makefile.am

src/modules/texts/ztext/ztext.cpp

src/utilfuns

src/utilfuns/Makefile

src/utilfuns/Makefile.am

src/utilfuns/ftplib.c

src/utilfuns/ftpparse.c

src/utilfuns/roman.cpp

src/utilfuns/swbuf.cpp

src/utilfuns/swobject.cpp

src/utilfuns/swunicod.cpp

src/utilfuns/swversion.cpp

src/utilfuns/url.cpp

src/utilfuns/utilstr.cpp

src/utilfuns/utilxml.cpp

src/utilfuns/zlib

src/utilfuns/zlib/untgz.c

stamp-h.in

sword.bmp

sword.kdevprj

sword.pc.in

sword.spec.in

tests

tests/Makefile.am

tests/Makefile.in

tests/bcppmake

tests/bcppmake/Makefile.am

tests/bcppmake/filtertest.bpf

tests/bcppmake/filtertest.bpr

tests/bcppmake/libsword.bpf

tests/bcppmake/libsword.bpr

tests/bcppmake/mgrtest.bpf

tests/bcppmake/mgrtest.bpr

tests/bcppmake/parsekey.bpf

tests/bcppmake/parsekey.bpr

tests/bcppmake/tests.bpg

tests/casttest.cpp

tests/ciphertest.cpp

tests/complzss.cpp

tests/compnone.cpp

tests/compzip.cpp

tests/configtest.cpp

tests/cppunit

tests/cppunit/Makefile.am

tests/cppunit/Makefile.in

tests/cppunit/main.cpp

tests/cppunit/stringmgr_test.cpp

tests/cppunit/swbuf_test.cpp

tests/cppunit/url_test.cpp

tests/cppunit/versekey_test.cpp

tests/filtertest.cpp

tests/icutest.cpp

tests/indextest.cpp

tests/installmgrtest.cpp

tests/introtest.cpp

tests/keycast.cpp

tests/keytest.cpp

tests/lextest.cpp

tests/listtest.cpp

tests/localetest.cpp

tests/mgrtest.cpp

tests/modtest.cpp

tests/outputcps.cpp

tests/parsekey.cpp

tests/rawldidxtest.cpp

tests/refsystest.cpp

tests/romantest.cpp

tests/swaptest.cpp

tests/swbuftest.cpp

tests/testblocks.cpp

tests/testsuite

tests/testsuite/Makefile.am

tests/testsuite/listtest.good

tests/testsuite/listtest.sh

tests/testsuite/runall.sh

tests/testsuite/runtest.sh

tests/testsuite/tmp

tests/testsuite/versekeytest.good

tests/testsuite/versekeytest.sh

tests/testsuite/versemgrtest.good

tests/testsuite/versemgrtest.sh

tests/testsuite/verseparsing-utf8.good

tests/testsuite/verseparsing-utf8.sh

tests/testsuite/verseparsing.good

tests/testsuite/verseparsing.sh

tests/testsuite/xmltag.good

tests/testsuite/xmltag.sh

tests/tlitmgrtest.cpp

tests/tmp

tests/tmp/Makefile.am

tests/tmp/README

tests/translittest.cpp

tests/versekeytest.cpp

tests/versemgrtest.cpp

tests/vtreekeytest.cpp

tests/webiftest.cpp

tests/xmltest.cpp

usrinst.sh

utilities

utilities/Makefile.am

utilities/Makefile.in

utilities/addcomment.cpp

utilities/addgb.cpp

utilities/addld.cpp

utilities/addvs.cpp

utilities/bcpp6make

utilities/bcpp6make/cipherraw.bpf

utilities/bcpp6make/cipherraw.bpr

utilities/bcpp6make/diatheke.bpf

utilities/bcpp6make/diatheke.bpr

utilities/bcpp6make/imp2gbs.bpf

utilities/bcpp6make/imp2gbs.bpr

utilities/bcpp6make/imp2ld.bpf

utilities/bcpp6make/imp2ld.bpr

utilities/bcpp6make/imp2vs.bpf

utilities/bcpp6make/imp2vs.bpr

utilities/bcpp6make/mkfastmod.bpf

utilities/bcpp6make/mkfastmod.bpr

utilities/bcpp6make/mod2imp.bpf

utilities/bcpp6make/mod2imp.bpr

utilities/bcpp6make/mod2osis.bpf

utilities/bcpp6make/mod2osis.bpr

utilities/bcpp6make/mod2vpl.bpf

utilities/bcpp6make/mod2vpl.bpr

utilities/bcpp6make/mod2zmod.bpf

utilities/bcpp6make/mod2zmod.bpr

utilities/bcpp6make/obj

utilities/bcpp6make/obj/dummy

utilities/bcpp6make/osis2mod.bpf

utilities/bcpp6make/osis2mod.bpr

utilities/bcpp6make/stage

utilities/bcpp6make/stage/dummy

utilities/bcpp6make/step2vpl.bpf

utilities/bcpp6make/step2vpl.bpr

utilities/bcpp6make/stepdump.bpf

utilities/bcpp6make/stepdump.bpr

utilities/bcpp6make/utils.bpg

utilities/bcpp6make/vpl2mod.bpf

utilities/bcpp6make/vpl2mod.bpr

utilities/bcpp6make/vs2osisref.bpf

utilities/bcpp6make/vs2osisref.bpr

utilities/bcpp6make/xml2gbs.bpf

utilities/bcpp6make/xml2gbs.bpr

utilities/bcppmake

utilities/bcppmake/Makefile.am

utilities/bcppmake/addgb.bpf

utilities/bcppmake/addgb.bpr

utilities/bcppmake/addld.bpf

utilities/bcppmake/addld.bpr

utilities/bcppmake/addvs.bpf

utilities/bcppmake/addvs.bpr

utilities/bcppmake/cipherraw.bdsproj

utilities/bcppmake/cipherraw.bpf

utilities/bcppmake/cipherraw.bpr

utilities/bcppmake/diatheke.bdsproj

utilities/bcppmake/diatheke.bpf

utilities/bcppmake/diatheke.bpr

utilities/bcppmake/imp2gbs.bdsproj

utilities/bcppmake/imp2gbs.bpf

utilities/bcppmake/imp2gbs.bpr

utilities/bcppmake/imp2ld.bdsproj

utilities/bcppmake/imp2ld.bpf

utilities/bcppmake/imp2ld.bpr

utilities/bcppmake/imp2vs.bdsproj

utilities/bcppmake/imp2vs.bpf

utilities/bcppmake/imp2vs.bpr

utilities/bcppmake/installmgr.bdsproj

utilities/bcppmake/installmgr.bpf

utilities/bcppmake/installmgr.bpr

utilities/bcppmake/libsword.bpf

utilities/bcppmake/libsword.bpr

utilities/bcppmake/mkfastmod.bdsproj

utilities/bcppmake/mkfastmod.bpf

utilities/bcppmake/mkfastmod.bpr

utilities/bcppmake/mod2imp.bdsproj

utilities/bcppmake/mod2imp.bpf

utilities/bcppmake/mod2imp.bpr

utilities/bcppmake/mod2osis.bdsproj

utilities/bcppmake/mod2osis.bpf

utilities/bcppmake/mod2osis.bpr

utilities/bcppmake/mod2vpl.bdsproj

utilities/bcppmake/mod2vpl.bpf

utilities/bcppmake/mod2vpl.bpr

utilities/bcppmake/mod2zmod.bdsproj

utilities/bcppmake/mod2zmod.bpf

utilities/bcppmake/mod2zmod.bpr

utilities/bcppmake/osis2mod.bdsproj

utilities/bcppmake/osis2mod.bpf

utilities/bcppmake/osis2mod.bpr

utilities/bcppmake/step2vpl.bdsproj

utilities/bcppmake/step2vpl.bpf

utilities/bcppmake/step2vpl.bpr

utilities/bcppmake/stepdump.bdsproj

utilities/bcppmake/stepdump.bpf

utilities/bcppmake/stepdump.bpr

utilities/bcppmake/tei2mod.bpf

utilities/bcppmake/tei2mod.bpr

utilities/bcppmake/treeidxutil.bpf

utilities/bcppmake/treeidxutil.bpr

utilities/bcppmake/utilities.bdsgroup

utilities/bcppmake/utilities.bpg

utilities/bcppmake/vpl2mod.bdsproj

utilities/bcppmake/vpl2mod.bpf

utilities/bcppmake/vpl2mod.bpr

utilities/bcppmake/vs2osisref.bdsproj

utilities/bcppmake/vs2osisref.bpf

utilities/bcppmake/vs2osisref.bpr

utilities/bcppmake/vs2osisreftxt.bpf

utilities/bcppmake/vs2osisreftxt.bpr

utilities/bcppmake/xml2gbs.bdsproj

utilities/bcppmake/xml2gbs.bpf

utilities/bcppmake/xml2gbs.bpr

utilities/cipherraw.cpp

utilities/diatheke

utilities/diatheke/Makefile.am

utilities/diatheke/Makefile.in

utilities/diatheke/README

utilities/diatheke/cgi

utilities/diatheke/cgi/Makefile.am

utilities/diatheke/cgi/dia-def.pl

utilities/diatheke/cgi/diatheke.pl

utilities/diatheke/cgi/index-private.html

utilities/diatheke/cgi/index-public.html

utilities/diatheke/corediatheke.cpp

utilities/diatheke/corediatheke.h

utilities/diatheke/diafiltmgr.cpp

utilities/diatheke/diafiltmgr.h

utilities/diatheke/diatheke.cpp

utilities/diatheke/diatheke.vcproj

utilities/diatheke/diathekemgr.cpp

utilities/diatheke/diathekemgr.h

utilities/diatheke/gbfcgi.cpp

utilities/diatheke/gbfcgi.h

utilities/diatheke/osiscgi.cpp

utilities/diatheke/osiscgi.h

utilities/diatheke/pqa

utilities/diatheke/pqa/Diatheke.pqa

utilities/diatheke/pqa/src

utilities/diatheke/pqa/src/README

utilities/diatheke/pqa/src/all.html

utilities/diatheke/pqa/src/ancient.html

utilities/diatheke/pqa/src/dict.html

utilities/diatheke/pqa/src/english.html

utilities/diatheke/pqa/src/french.html

utilities/diatheke/pqa/src/german.html

utilities/diatheke/pqa/src/index.html

utilities/diatheke/pqa/src/lex.html

utilities/diatheke/pqa/src/other.html

utilities/diatheke/pqa/src/spanish.html

utilities/diatheke/soap

utilities/diatheke/soap/sapouni.cgi

utilities/diatheke/soap/soapatheke.pl

utilities/diatheke/tcl

utilities/diatheke/tcl/biblebot-diatheke.tcl

utilities/diatheke/thmlcgi.cpp

utilities/diatheke/thmlcgi.h

utilities/emptyvss.cpp

utilities/gbfidx.cpp

utilities/genbookutil.cpp

utilities/imp2gbs.cpp

utilities/imp2ld.cpp

utilities/imp2vs.cpp

utilities/installmgr.cpp

utilities/kylixmake

utilities/kylixmake/Makefile.am

utilities/kylixmake/libsword.bpf

utilities/kylixmake/libsword.bpr

utilities/kylixmake/mod2zmod.bpf

utilities/kylixmake/mod2zmod.bpr

utilities/kylixmake/mod2zmod.res

utilities/kylixmake/utilities.bpg

utilities/lexdump.c

utilities/mkfastmod.cpp

utilities/mod2imp.cpp

utilities/mod2osis.cpp

utilities/mod2vpl.cpp

utilities/mod2zmod.cpp

utilities/modwrite.cpp

utilities/no13.c

utilities/osis2mod.cpp

utilities/perl

utilities/perl/Makefile.am

utilities/perl/cipherkeygen.pl

utilities/perl/linkvers.pl

utilities/perl/localecap.pl

utilities/perl/mkvsmod.pl

utilities/step2vpl.cpp

utilities/stepdump.cpp

utilities/sub.c

utilities/tei2mod.cpp

utilities/treeidxutil.cpp

utilities/vcppmake

utilities/vcppmake/addgb.vcproj

utilities/vcppmake/addld.vcproj

utilities/vcppmake/addvs.vcproj

utilities/vcppmake/cipherraw.vcproj

utilities/vcppmake/emptyvss.vcproj

utilities/vcppmake/imp2gbs.vcproj

utilities/vcppmake/imp2ld.vcproj

utilities/vcppmake/imp2vs.vcproj

utilities/vcppmake/installmgr.vcproj

utilities/vcppmake/mkfastmod.vcproj

utilities/vcppmake/mod2imp.vcproj

utilities/vcppmake/mod2osis.vcproj

utilities/vcppmake/mod2vpl.vcproj

utilities/vcppmake/mod2zmod.vcproj

utilities/vcppmake/osis2mod.vcproj

utilities/vcppmake/step2vpl.vcproj

utilities/vcppmake/stepdump.vcproj

utilities/vcppmake/tei2mod.vcproj

utilities/vcppmake/treeidxutil.vcproj

utilities/vcppmake/utilities.sln

utilities/vcppmake/vs2osisref.vcproj

utilities/vcppmake/vs2osisreftxt.vcproj

utilities/vcppmake/xml2gbs.vcproj

utilities/vpl2mod.cpp

utilities/vs2osisref.cpp

utilities/vs2osisreftxt.cpp

utilities/xml2gbs.cpp

files removed:
debian/diatheke.dirs

debian/libsword-dev.dirs

debian/libsword6.dirs

debian/libsword6.docs

debian/libsword6.install

debian/libsword6.shlibs

debian/patches/01_sword_c++.diff

debian/patches/03_clucene.diff

debian/patches/04_ziplock.diff

debian/patches/05_getline.diff

debian/patches/06_warnings.diff

debian/patches/07_warn_tools.diff

debian/patches/08_gcc_43.diff

debian/patches/09_pcfile.diff

sword-1.5.9.tar.gz

sword-1.5.9.tar.gz.cdbs-config_list

files modified:
debian/changelog

debian/compat

debian/control

debian/copyright

debian/diatheke.docs

debian/diatheke.install

debian/libsword-dev.install

debian/patches/02_libver.diff

debian/patches/10_diatheke.diff

debian/patches/series

debian/rules

Show diffs side-by-side

added added

removed removed

utilities/osis2mod.cpp

* CrossWire Bible Society

* P. O. Box 2528

* Tempe, AZ 85280-2528

* This program is free software; you can redistribute it and/or modify it

* under the terms of the GNU General Public License as published by the

* Free Software Foundation version 2.

* This program is distributed in the hope that it will be useful, but

* WITHOUT ANY WARRANTY; without even the implied warranty of

* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU

* General Public License for more details.

#include <ctype.h>

#include <stdio.h>

#include <fcntl.h>

#include <errno.h>

#include <stdlib.h>

#include <stack>

#include <vector>

#include <iostream>

#include <fstream>

#include <utilstr.h>

#include <swmgr.h>

#include <rawtext.h>

#include <rawtext4.h>

#include <swbuf.h>

#include <utilxml.h>

#include <listkey.h>

#include <versekey.h>

#include <ztext.h>

#include <lzsscomprs.h>

#include <zipcomprs.h>

#include <cipherfil.h>

#ifdef _ICU_

#include <utf8nfc.h>

#include <latin1utf8.h>

#endif

#ifndef NO_SWORD_NAMESPACE

using namespace sword;

#endif

using namespace std;

// Turn debugging on and off

// Debug output is compiled in only when DEBUG is defined; uncomment to enable.

//#define DEBUG

// Bitmask of the DEBUG_* categories below; each debug site tests (debug & DEBUG_xxx).

int debug = 0;

const int DEBUG_WRITE = 1; // writing to module

const int DEBUG_VERSE = 2; // verse start and end

const int DEBUG_QUOTE = 4; // quotes, especially Words of Christ (WOC)

const int DEBUG_TITLE = 8; // titles

const int DEBUG_INTERVERSE = 16; // inter-verse material

const int DEBUG_XFORM = 32; // transformations

const int DEBUG_REV11N = 64; // versification

const int DEBUG_REF = 128; // parsing of osisID and osisRef

const int DEBUG_STACK = 256; // cleanup of references

const int DEBUG_OTHER = 512; // ins and outs of books, chapters and verses

// Exit codes

const int EXIT_BAD_ARG = 1; // Bad parameter given for program

const int EXIT_NO_WRITE = 2; // Could not open the module for writing

const int EXIT_NO_CREATE = 3; // Could not create the module

const int EXIT_NO_READ = 4; // Could not open the input file for reading.

const int EXIT_BAD_NESTING = 5; // BSP or BCV nesting is bad

#ifdef _ICU_

// Filters used by prepareSWText(): normalizer is applied to text detected as UTF-8,

// converter is applied to text that is not valid UTF-8 (assumed to be Latin1/cp1252).

UTF8NFC normalizer;

Latin1UTF8 converter;

#endif

// Number of entries whose text was changed by the normalizer (see prepareSWText).

int normalized = 0;

// Number of entries that were passed through the converter (see prepareSWText).

int converted = 0;

// The module that writeEntry() and linkToEntry() write to.

SWText *module = 0;

// The verse currently being processed. writeEntry() and linkToEntry() temporarily

// point it at the entry to be written and restore it afterwards.

// NOTE(review): presumably this is the key the module is positioned by -- confirm where module is created.

VerseKey currentVerse;

// Name of the versification; printed in the "not in ... versification" warning.

SWBuf v11n = "KJV";

// osisID that the text accumulated in activeVerseText belongs to (maintained by writeEntry).

char activeOsisID[255];

// osisID of the book, chapter or verse most recently started (maintained by handleToken).

char currentOsisID[255];

// Text collected for activeOsisID that has not yet been written to the module.

SWBuf activeVerseText;

ListKey currentKeyIDs = ListKey();

// Verse lists from osisIDs/annotateRefs that cover more than one verse;

// saved so that links can be written after all verses have been seen.

std::vector<ListKey> linkedVerses;

static bool inCanonicalOSISBook = true; // true while the current book's osisID is a book of the chosen versification; writeEntry() discards text when false

static bool normalize = true; // Whether to normalize UTF-8 to NFC

/**
 * Determine whether a string is the OSIS name of a book in the
 * versification currently used by currentVerse.
 *
 * param buf the candidate OSIS book name
 * return true if the versification reports a book number >= 0 for buf,
 *        false otherwise (including when buf is null or the
 *        versification system cannot be obtained)
 */
bool isOSISAbbrev(const char *buf) {
	if (!buf) {
		return false;
	}

	VerseMgr *vmgr = VerseMgr::getSystemVerseMgr();
	const VerseMgr::System *av11n = vmgr->getVersificationSystem(currentVerse.getVersificationSystem());

	// Do not dereference a missing versification system; treat it as "no such book".
	return av11n && av11n->getBookNumberByOSISName(buf) >= 0;
}

101

102

/**
 * Determine whether the string contains a valid unicode sequence.
 * The following table give the pattern of a valid UTF-8 character.
 *
 * Unicode Range               1st       2nd       3rd       4th
 * U-00000000 - U-0000007F  0nnnnnnn
 * U-00000080 - U-000007FF  110nnnnn  10nnnnnn
 * U-00000800 - U-0000FFFF  1110nnnn  10nnnnnn  10nnnnnn
 * U-00010000 - U-0010FFFF  11110nnn  10nnnnnn  10nnnnnn  10nnnnnn
 *
 * Note:
 *   1. The latest UTF-8 RFC allows for a max of 4 bytes.
 *      Earlier allowed 6.
 *   2. The number of bits of the leading byte before the first 0
 *      is the total number of bytes.
 *   3. The "n" are the bits of the unicode codepoint.
 *
 * Besides the byte patterns, the decoded code point is checked:
 * overlong encodings (a code point stored in more bytes than needed),
 * the UTF-16 surrogates U+D800 - U+DFFF and values above U+10FFFF
 * are rejected.
 *
 * param  txt the NUL terminated text to check
 * return   1 if all high order characters form a valid unicode sequence
 *         -1 if there are no high order characters.
 *            Note: this is also a valid unicode sequence
 *          0 if there are high order characters that do not form
 *            a valid unicode sequence
 * author DM Smith
 */
int detectUTF8(const char *txt) {
	// Smallest code point that legitimately needs a sequence of the given length.
	// Anything smaller is an overlong encoding. Index is the sequence length.
	static const unsigned long minCodePoint[] = { 0, 0, 0x80, 0x800, 0x10000 };

	unsigned int countUTF8 = 0;

	// Cast it to make masking and shifting easier
	const unsigned char *p = (const unsigned char*) txt;
	while (*p) {
		// Is the high order bit set?
		if (*p & 0x80) {
			// Then count the number of high order bits that are set.
			// This determines the total number of bytes
			// that are a part of the unicode character
			int count = 0;
			for (unsigned char lead = *p; lead & 0x80; lead <<= 1) {
				count++;
			}

			// Validate count:
			// Count 1: is a pattern of 10nnnnnn,
			//          which does not signal the start of a unicode character
			// Count 5 to 8: 111110nn, 1111110n and 11111110 and 11111111
			//          are not legal starts, either
			if (count < 2 || count > 4) return 0;

			// The payload bits of the leading byte are those after the first 0 bit.
			unsigned long codePoint = *p & (0xff >> (count + 1));

			// At this point we expect (count - 1) following characters
			// of the pattern 10nnnnnn
			for (int following = 1; following < count; following++) {
				++p;
				// The top 2 bits must be 10. The terminating NUL fails this
				// test as well, so a truncated character is caught here
				// and p never moves past the end of the text.
				if ((0xc0 & *p) != 0x80) return 0;
				codePoint = (codePoint << 6) | (*p & 0x3f);
			}

			// Well formed bytes, but is the value one that UTF-8 may carry?
			if (codePoint < minCodePoint[count]) return 0;                // overlong
			if (codePoint >= 0xD800 && codePoint <= 0xDFFF) return 0;     // surrogate
			if (codePoint > 0x10FFFF) return 0;                           // out of range

			// We have a valid UTF-8 character, so count it
			countUTF8++;
		}

		// Advance to the next character to examine.
		p++;
	}

	// At this point it is either UTF-8 or 7-bit ascii
	return countUTF8 ? 1 : -1;
}

174

175

void prepareSWText(const char *osisID, SWBuf &text)

176

{

177

// Always check on UTF8 and report on non-UTF8 entries

178

int utf8State = detectUTF8(text.c_str());

179

180

// Trust, but verify.

181

if (!normalize && !utf8State) {

182

cout << "WARNING(UTF8): " << osisID << ": Should be converted to UTF-8 (" << text << ")" << endl;

183

}

184

185

#ifdef _ICU_

186

if (normalize) {

187

// Don't need to normalize text that is ASCII

188

// But assume other non-UTF-8 text is Latin1 (cp1252) and convert it to UTF-8

189

if (!utf8State) {

190

cout << "INFO(UTF8): " << osisID << ": Converting to UTF-8 (" << text << ")" << endl;

191

converter.processText(text, (SWKey *)2); // note the hack of 2 to mimic a real key. TODO: remove all hacks

192

converted++;

193

194

// Prepare for double check. This probably can be removed.

195

// But for now we are running the check again.

196

// This is to determine whether we need to normalize output of the conversion.

197

utf8State = detectUTF8(text.c_str());

198

}

199

200

// Double check. This probably can be removed.

201

if (!utf8State) {

202

cout << "ERROR(UTF8): " << osisID << ": Converting to UTF-8 (" << text << ")" << endl;

203

}

204

205

if (utf8State > 0) {

206

SWBuf before = text;

207

normalizer.processText(text, (SWKey *)2); // note the hack of 2 to mimic a real key. TODO: remove all hacks

208

if (before != text) {

209

normalized++;

210

}

211

}

212

}

213

#endif

214

}

215

216

// This routine converts an osisID or osisRef into one that SWORD can parse into a verse list

217

// An osisRef is made up of:

218

// a single osisID

219

// an osisID-osisID

220

// or

221

// an osisRef osisRef

222

223

// An osisID can have a work prefix which is terminated by a : and may have a grain

224

// which is started by a !

225

226

// However, SWORD cannot handle work prefixes or grains and expects ranges to be

227

// separated with a single;

228

void prepareSWVerseKey(SWBuf &buf) {

229

// This routine modifies the buf in place

230

char* s = buf.getRawData();

231

char* p = s;

232

bool inRange = false;

233

while (*p) {

234

if (inRange) {

235

#ifdef DEBUG

236

if (debug & DEBUG_REF) {

237

cout << "DEBUG(REF): Copy range marker:" << *p << endl;;

238

}

239

#endif

240

// Range markers are copied as is

241

*s++ = *p++;

242

}

243

244

// Look ahead to see if we are in a work prefix

245

// but don't look past an osisID

246

char *n = p;

247

while (*n && *n != ':' && *n != ' ' && *n != '-') {

248

n++;

249

}

250

251

// We have found a work prefix

252

if (*n == ':') {

253

// set p to skip the work prefix

254

p = n + 1;

255

#ifdef DEBUG

256

if (debug & DEBUG_REF) {

257

cout << "DEBUG(REF): Found a work prefix ";

258

for (char *x = s; x <= n; x++) {

259

cout << *x;

260

}

261

cout << endl;

262

}

263

#endif

264

}

265

266

// Now we are in the meat of an osisID.

267

// Copy it to its end but stop on a grain marker of '!'

268

#ifdef DEBUG

269

if (debug & DEBUG_REF) {

270

cout << "DEBUG(REF): Copy osisID:";

271

}

272

#endif

273

while (*p && *p != '!' && *p != ' ' && *p != '-') {

274

#ifdef DEBUG

275

if (debug & DEBUG_REF) {

276

cout << *p;

277

}

278

#endif

279

*s++ = *p++;

280

}

281

#ifdef DEBUG

282

if (debug & DEBUG_REF) {

283

cout << endl;

284

}

285

#endif

286

287

// The ! and everything following until we hit

288

// the end of the osisID is part of the grain reference

289

if (*p == '!') {

290

n = p;

291

while (*n && *n != ' ' && *n != '-') {

292

n++;

293

}

294

#ifdef DEBUG

295

if (debug & DEBUG_REF) {

296

cout << "DEBUG(REF): Found a grain suffix ";

297

for (char *x = p; x < n; x++) {

298

cout << *x;

299

}

300

cout << endl;

301

}

302

#endif

303

p = n;

304

}

305

306

// At this point we have processed an osisID

307

308

// if we are not in a range and the next characer is a -

309

// then we are entering a range

310

inRange = !inRange && *p == '-';

311

312

#ifdef DEBUG

313

if (debug & DEBUG_REF) {

314

if (inRange) {

315

cout << "DEBUG(REF): Found a range" << endl;

316

}

317

}

318

#endif

319

320

// between ranges and stand alone osisIDs we might have whitespace

321

if (!inRange && *p == ' ') {

322

// skip this and subsequent spaces

323

while (*p == ' ') {

324

p++;

325

}

326

// replacing them all with a ';'

327

*s++ = ';';

328

#ifdef DEBUG

329

if (debug & DEBUG_REF) {

330

cout << "DEBUG(REF): replacing space with ;. Remaining: " << p << endl;

331

}

332

#endif

333

}

334

}

335

336

// Determine whether we have modified the buffer

337

// We have modified the buffer if s is not sitting on the null byte of the original

338

if (*s) {

339

// null terminate the reference

340

*s = '\0';

341

// Since we modified the swbuf, we need to tell it what we have done

342

buf.setSize(s - buf.c_str());

343

#ifdef DEBUG

344

if (debug & DEBUG_REF) {

345

cout << "DEBUG(REF): shortended keyVal to`" << buf.c_str() << "`"<< endl;

346

}

347

#endif

348

}

349

}

350

351

/**

352

* Determine whether a verse as given is valid for the versification.

353

* This is done by comparing the before and after of normalization.

354

355

bool isValidRef(const char *buf) {

356

// Create a VerseKey that does not do auto normalization

357

// Note: need to turn on headings so that a heading does not get normalized anyway

358

// And set it to the reference under question

359

VerseKey before;

360

before.setVersificationSystem(currentVerse.getVersificationSystem());

361

before.AutoNormalize(0);

362

before.Headings(1);

363

before.setText(buf);

364

365

// If we are a heading we must bail

366

// These will autonormalize to the last verse of the prior chapter

367

if (!before.Testament() || !before.Book() || !before.Chapter() || !before.Verse()) {

368

return true;

369

}

370

371

// Create a VerseKey that does do auto normalization

372

// And set it to the reference under question

373

VerseKey after;

374

after.setVersificationSystem(currentVerse.getVersificationSystem());

375

after.AutoNormalize(1);

376

after.setText(buf);

377

378

if (before == after)

379

{

380

return true;

381

}

382

383

// If we have gotten here the reference is not in the selected versification.

384

cout << "INFO(V11N): " << before << " is not in the " << currentVerse.getVersificationSystem() << " versification." << endl;

385

386

#ifdef DEBUG

387

if (debug & DEBUG_REV11N) {

388

cout << "DEBUG(V11N): " << before << " normalizes to " << after << endl;

389

}

390

#endif

391

392

return false;

393

}

394

395

/**

396

* This routine is used to ensure that all the text in the input is saved to the module.

397

* Assumption: The input orders all the verses for a chapter in numerical order. Thus, any

398

* verses that are not in the chosen versification (v11n) follow those that are.

399

400

* The prior implementation of this adjusted the verse to the last one that is in the chosen v11n.

401

* If it the chapter were extra, then it is appended to the last verse of the last

402

* chapter in the chosen v11n for that book. If it is just extra verses for a chapter, then it is

403

* appended to the last verse of the chapter.

404

405

* The problem with this is when a OSIS verse refers to more than one verse, e.g.

406

* osisID="Gen.1.29 Gen.1.30 Gen.1.31" (Gen.1.31 is the last verse of the chapter in the chosen v11n)

407

* and then it is followed by Gen.1.32.

408

409

* This routine assumes that linking is postponed to the end so that in the example Gen.1.30-31

410

* are not linked but rather empty. This routine will then find the last verse in the computed

411

* chapter that has content.

412

413

* Alternative, we could have done linking as we went, but this routine would have needed

414

* to find the first entry in the link set and elsewhere in the code when appending to a

415

* verse, it would need to be checked for adjacent links and those would have needed to be adjusted.

416

417

* param key the key that may need to be adjusted

418

419

void makeValidRef(VerseKey &key) {

420

421

int chapterMax = key.getChapterMax();

422

int verseMax = key.getVerseMax();

423

424

#ifdef DEBUG

425

if (debug & DEBUG_REV11N) {

426

cout << "DEBUG(V11N) Chapter max:" << chapterMax << ", Verse Max:" << verseMax << endl;

427

}

428

#endif

429

430

cout << "INFO(V11N): " << key.getOSISRef() << " is not in the " << key.getVersificationSystem() << " versification.";

431

// Since isValidRef returned false constrain the key to the nearest prior reference.

432

// If we are past the last chapter set the reference to the last chapter

433

if (key.Chapter() > chapterMax) {

434

key.Chapter(chapterMax);

435

}

436

437

// Either we set the chapter to the last chapter and now need to set to the last verse in the chapter

438

// Or the verse is beyond the end of the chapter.

439

// In any case we need to constrain the verse to it's chapter.

440

key.Verse(verseMax);

441

442

// There are three cases we want to handle:

443

// In the examples we are using the KJV versification where the last verse of Matt.7 is Matt.7.29.

444

// In each of these cases the out-of-versification, extra verse is Matt.7.30.

445

// 1) The "extra" verse follows the last verse in the chapter.

446

// <verse osisID="Matt.7.29">...</verse><verse osisID="Matt.7.30">...</verse>

447

// In this case re-versify Matt.7.30 as Matt.7.29.

448

449

// 2) The "extra" verse follows a range (a set of linked verses).

450

// <verse osisID="Matt.7.28-Matt.7.29">...</verse><verse osisID="Matt.7.30">...</verse>

451

// In this case, re-versify Matt.7.30 as Matt.7.28, the first verse in the linked set.

452

// Since we are post-poning linking, we want to re-reversify to the last entry in the module.

453

454

// 3) The last verse in the chapter is not in the input. There may be other verses missing as well.

455

// <verse osisID="Matt.7.8">...</verse><verse osisID="Matt.7.30">...</verse>

456

// In this case we should re-versify Matt.7.30 as Matt.7.29.

457

// However, since this and 2) are ambiguous, we'll re-reversify to the last entry in the module.

458

459

while (!key.Error() && !module->hasEntry(&key)) {

460

key.decrement(1);

461

}

462

463

cout << " Appending content to " << key.getOSISRef() << endl;

464

}

465

466

/**
 * Collect text for the current verse and write the previously collected
 * verse to the module once a different verse (or a forced flush) arrives.
 *
 * Text is accumulated in activeVerseText under activeOsisID. When the
 * reference of currentVerse differs from activeOsisID, the accumulated text
 * is encoding-checked with prepareSWText() and written at the reference that
 * was current on the previous call, re-versified by makeValidRef() if it is
 * not in the versification. Text already stored at that reference is kept
 * and the new text is appended to it. The first write into each testament
 * is preceded by a revision milestone written with book, chapter and
 * verse set to 0.
 *
 * Nothing happens while the current book is not in the versification.
 *
 * param text  the text to add to the current verse; emptied on return
 * param force when true, whatever is accumulated is written even if the
 *             reference has not changed
 */
void writeEntry(SWBuf &text, bool force = false) {
	char keyOsisID[255];

	static const char* revision = "<milestone type=\"x-importer\" subType=\"x-osis2mod\" n=\"$Rev: 2400 $\"/>";
	static bool firstOT = true;
	static bool firstNT = true;

	if (!inCanonicalOSISBook) {
		return;
	}

	strcpy(keyOsisID, currentVerse.getOSISRef());

	// set keyOsisID to anything that an osisID cannot be.
	// It then compares as different from any active osisID, which forces the write below.
	if (force) {
		strcpy(keyOsisID, "-force");
	}

	// The reference that was current on the previous call, i.e. where the accumulated text belongs.
	static VerseKey lastKey;
	lastKey.setVersificationSystem(currentVerse.getVersificationSystem());
	lastKey.AutoNormalize(0);
	lastKey.Headings(1);

	// currentVerse is repositioned while writing; this is what it is restored from.
	VerseKey saveKey;
	saveKey.setVersificationSystem(currentVerse.getVersificationSystem());
	saveKey.AutoNormalize(0);
	saveKey.Headings(1);
	saveKey = currentVerse;

	// If we have seen a verse and the supplied one is different then we output the collected one.
	if (*activeOsisID && strcmp(activeOsisID, keyOsisID)) {

		if (!isValidRef(lastKey)) {
			makeValidRef(lastKey);
		}

		// NOTE(review): the module calls below take no key; presumably the module is
		// positioned through currentVerse -- confirm where module is created.
		currentVerse = lastKey;

		prepareSWText(activeOsisID, activeVerseText);

		// Put the revision into the module
		int testmt = currentVerse.Testament();
		if ((testmt == 1 && firstOT) || (testmt == 2 && firstNT)) {
			VerseKey t;
			t.setVersificationSystem(currentVerse.getVersificationSystem());
			t.AutoNormalize(0);
			t.Headings(1);
			t = currentVerse;
			currentVerse.Book(0);
			currentVerse.Chapter(0);
			currentVerse.Verse(0);
			module->setEntry(revision);
			currentVerse = t;
			switch (testmt) {
			case 1:
				firstOT = false;
				break;
			case 2:
				firstNT = false;
				break;
			}
		}

		// If the entry already exists, then append this entry to the text.
		// This is for verses that are outside the chosen versification. They are appended to the prior verse.
		// The space should not be needed if we retained verse tags.
		SWBuf currentText = module->getRawEntry();
		if (currentText.length()) {
			cout << "INFO(WRITE): Appending entry: " << currentVerse.getOSISRef() << ": " << activeVerseText << endl;
			activeVerseText = currentText + " " + activeVerseText;
		}

#ifdef DEBUG
		if (debug & DEBUG_WRITE) {
			cout << "DEBUG(WRITE): " << activeOsisID << ":" << currentVerse.getOSISRef() << ": " << activeVerseText << endl;
		}
#endif

		module->setEntry(activeVerseText);
		activeVerseText = "";
	}

	// The following is for initial verse content and for appending interverse content.
	// Eliminate leading whitespace on the beginning of each verse and
	// before we append to current content, since we just added one
	text.trimStart();
	if (activeVerseText.length()) {
		activeVerseText += " ";
		activeVerseText += text;
	}
	else {
		activeVerseText = text;
	}
	// text has been consumed so clear it out.
	text = "";

	// Put currentVerse back and remember it as the owner of the accumulated text.
	currentVerse = saveKey;
	lastKey = currentVerse;
	strcpy(activeOsisID, keyOsisID);
}

566

567

/**
 * Make one verse a link to another verse's entry in the module.
 * References that are not in the versification are silently skipped
 * (isValidRef reports them).
 *
 * param linkKey the verse that is to become a link
 * param dest    the verse whose entry is linked to
 */
void linkToEntry(VerseKey &linkKey, VerseKey &dest) {

	// Only link verses that are in the versification.
	if (!isValidRef(linkKey)) {
		return;
	}

	// currentVerse is pointed at the link for the duration of the call; remember it.
	VerseKey saveKey;
	saveKey.setVersificationSystem(currentVerse.getVersificationSystem());
	saveKey.AutoNormalize(0);
	saveKey.Headings(1);
	saveKey = currentVerse;
	currentVerse = linkKey;

	cout << "INFO(LINK): Linking " << currentVerse.getOSISRef() << " to " << dest.getOSISRef() << "\n";
	module->linkEntry(&dest);

	currentVerse = saveKey;
}

586

587

// Return true if the content was handled or is to be ignored.

588

// false if the what has been seen is to be accumulated and considered later.

589

bool handleToken(SWBuf &text, XMLTag token) {

590

591

// Everything between the begin book tag and the first begin chapter tag is inBookHeader

592

static bool inBookHeader = false;

593

594

// Everything between the begin chapter tag and the first begin verse tag is inChapterHeader

595

static bool inChapterHeader = false;

596

597

// Flags indicating whether we are processing the content of a chapter

598

static bool inChapter = false;

599

600

// Flags indicating whether we are processing the content of a verse

601

static bool inVerse = false;

602

603

// Flags indicating whether we are processing the content of to be prepended to a verse

604

static bool inPreVerse = false;

605

static int genID = 1;

606

607

// Flag indicating whether we are in "Words of Christ"

608

static bool inWOC = false;

609

// Tag for WOC quotes within a verse

610

static XMLTag wocTag = "<q who=\"Jesus\" marker=\"\">";

611

612

// Flag used to indicate where useful text begins

613

static bool firstDiv = false;

614

615

// Stack of quote elements used to handle Words of Christ

616

static std::stack<XMLTag> quoteStack;

617

618

// Stack of elements used to validate that books, chapters and verses are well-formed

619

// This goes beyond simple xml well-formed and also considers milestoned div, chapter and verse

620

// to be begin and end tags, too.

621

// It is an error if books and chapters are not well formed (though not required by OSIS)

622

// It is a warning that verses are not well formed (because some clients are not ready)

623

static std::stack<XMLTag> tagStack;

624

625

// The following are used to validate well-formedness

626

static int chapterDepth = 0;

627

static int bookDepth = 0;

628

static int verseDepth = 0;

629

630

int tagDepth = tagStack.size();

631

const char *tokenName = token.getName();

632

bool isEndTag = token.isEndTag() || token.getAttribute("eID");

633

const char *typeAttr = token.getAttribute("type");

634

635

// process start tags

636

if (!isEndTag) {

637

638

// Remember non-empty start tags

639

if (!token.isEmpty()) {

640

tagStack.push(token);

641

#ifdef DEBUG

642

if (debug & DEBUG_STACK) {

643

cout << "DEBUG(STACK): " << currentOsisID << ": push (" << tagStack.size() << ") " << token.getName() << endl;

644

}

645

#endif

646

}

647

648

// throw away everything up to the first div

649

if (!firstDiv) {

650

if (!strcmp(tokenName, "div")) {

651

#ifdef DEBUG

652

if (debug & DEBUG_OTHER) {

653

cout << "DEBUG(FOUND): Found first div and pitching prior material: " << text << endl;

654

}

655

#endif

656

// TODO: Save off the content to use it to suggest the module's conf.

657

firstDiv = true;

658

text = "";

659

}

660

else {

661

// Collect the content so it can be used to suggest the module's conf.

662

return false;

663

}

664

}

665

666

//-- WITH osisID OR annotateRef -------------------------------------------------------------------------

667

// Handle Book, Chapter, and Verse (or commentary equivalent)

668

if (token.getAttribute("osisID") || token.getAttribute("annotateRef")) {

669

670

// BOOK START, <div type="book" ...>

671

if ((!strcmp(tokenName, "div")) && (typeAttr && !strcmp(typeAttr, "book"))) {

672

if (inBookHeader || inChapterHeader) { // this one should never happen, but just in case

673

#ifdef DEBUG

674

if (debug & DEBUG_TITLE) {

675

cout << "DEBUG(TITLE): " << currentOsisID << ": OOPS HEADING " << endl;

676

cout << "\tinChapterHeader = " << inChapterHeader << endl;

677

cout << "\tinBookHeader = " << inBookHeader << endl;

678

}

679

#endif

680

currentVerse.Testament(0);

681

currentVerse.Book(0);

682

currentVerse.Chapter(0);

683

currentVerse.Verse(0);

684

writeEntry(text);

685

}

686

currentVerse = token.getAttribute("osisID");

687

currentVerse.Chapter(0);

688

currentVerse.Verse(0);

689

strcpy(currentOsisID, currentVerse.getOSISRef());

690

691

inChapter = false;

692

inVerse = false;

693

inPreVerse = false;

694

inBookHeader = true;

695

inChapterHeader = false;

696

697

bookDepth = tagStack.size();

698

chapterDepth = 0;

699

verseDepth = 0;

700

701

inCanonicalOSISBook = isOSISAbbrev(token.getAttribute("osisID"));

702

if (!inCanonicalOSISBook) {

703

cout << "WARNING(V11N): New book is " << token.getAttribute("osisID") << " and is not in " << v11n << " versification, ignoring" << endl;

704

}

705

#ifdef DEBUG

706

else if (debug & DEBUG_OTHER) {

707

cout << "DEBUG(FOUND): New book is " << currentVerse.getOSISRef() << endl;

708

}

709

#endif

710

711

return false;

712

}

713

714

// CHAPTER START, <div type="chapter" ...> or <chapter ...>

715

if (((!strcmp(tokenName, "div")) && (typeAttr && !strcmp(typeAttr, "chapter"))) ||

716

(!strcmp(tokenName, "chapter"))

717

) {

718

if (inBookHeader) {

719

#ifdef DEBUG

720

if (debug & DEBUG_TITLE) {

721

cout << "DEBUG(TITLE): " << currentOsisID << ": BOOK HEADING "<< text.c_str() << endl;

722

}

723

#endif

724

writeEntry(text);

725

}

726

727

currentVerse = token.getAttribute("osisID");

728

currentVerse.Verse(0);

729

#ifdef DEBUG

730

if (debug & DEBUG_OTHER) {

731

cout << "DEBUG(FOUND): Current chapter is " << currentVerse.getOSISRef() << " (" << token.getAttribute("osisID") << ")" << endl;

732

}

733

#endif

734

strcpy(currentOsisID, currentVerse.getOSISRef());

735

736

inChapter = true;

737

inVerse = false;

738

inPreVerse = false;

739

inBookHeader = false;

740

inChapterHeader = true;

741

742

chapterDepth = tagStack.size();

743

verseDepth = 0;

744

745

return false;

746

}

747

748

// VERSE, <verse ...> OR COMMENTARY START, <div annotateType="xxx" ...>

749

if (!strcmp(tokenName, "verse") ||

750

(!strcmp(tokenName, "div") && token.getAttribute("annotateType"))) {

751

#ifdef DEBUG

752

if (debug & DEBUG_OTHER) {

753

cout << "DEBUG(FOUND): Entering verse" << endl;

754

}

755

#endif

756

if (inChapterHeader) {

757

SWBuf heading = text;

758

text = "";

759

760

if (heading.length()) {

761

#ifdef DEBUG

762

if (debug & DEBUG_TITLE) {

763

cout << "DEBUG(TITLE): " << currentOsisID << ": CHAPTER HEADING "<< heading.c_str() << endl;

764

}

765

#endif

766

writeEntry(heading);

767

}

768

769

inChapterHeader = false;

770

}

771

772

// Did we have pre-verse material that needs to be marked?

773

if (inPreVerse) {

774

char genBuf[200];

775

sprintf(genBuf, "<div type=\"x-milestone\" subType=\"x-preverse\" eID=\"pv%d\"/>", genID++);

776

text.append(genBuf);

777

}

778

779

// Get osisID for verse or annotateRef for commentary

780

SWBuf keyVal = token.getAttribute(strcmp(tokenName, "verse") ? "annotateRef" : "osisID");

781

782

// Massage the key into a form that ParseVerseList can accept

783

prepareSWVerseKey(keyVal);

784

785

// The osisID or annotateRef can be more than a single verse

786

// The first or only one is the currentVerse

787

// Use the last verse seen (i.e. the currentVerse) as the basis for recovering from bad parsing.

788

// This should never happen if the references are valid OSIS references

789

ListKey verseKeys = currentVerse.ParseVerseList(keyVal, currentVerse, true);

790

int memberKeyCount = verseKeys.Count();

791

if (memberKeyCount) {

792

currentVerse = verseKeys.getElement(0);

793

// See if this osisID or annotateRef refers to more than one verse.

794

// If it does, save it until all verses have been seen.

795

// At that point we will output links.

796

// This can be done by incrementing, which will produce an error

797

// if there is only one verse.

798

verseKeys.setPosition(TOP);

799

verseKeys.increment(1);

800

if (!verseKeys.Error()) {

801

linkedVerses.push_back(verseKeys);

802

}

803

}

804

else {

805

cout << "ERROR(REF): Invalid osisID/annotateRef: " << token.getAttribute(strcmp(tokenName, "verse") ? "annotateRef" : "osisID") << endl;

806

}

807

808

strcpy(currentOsisID, currentVerse.getOSISRef());

809

#ifdef DEBUG

810

if (debug & DEBUG_OTHER) {

811

cout << "DEBUG(FOUND): New current verse is " << currentVerse.getOSISRef() << endl;

812

cout << "DEBUG(FOUND): osisID/annotateRef is adjusted to: " << keyVal << endl;

813

}

814

#endif

815

816

inVerse = true;

817

inPreVerse = false;

818

inBookHeader = false;

819

inChapterHeader = false;

820

verseDepth = tagStack.size();

821

822

// Include the token if it is not a verse

823

if (strcmp(tokenName, "verse")) {

824

text.append(token);

825

}

826

#ifdef DEBUG

827

else if (debug & DEBUG_VERSE)

828

{

829

// transform the verse into a milestone

830

XMLTag t = "<milestone resp=\"v\" />";

831

// copy all the attributes of the verse element to the milestone

832

StringList attrNames = token.getAttributeNames();

833

for (StringList::iterator loop = attrNames.begin(); loop != attrNames.end(); loop++) {

834

const char* attr = (*loop).c_str();

835

t.setAttribute(attr, token.getAttribute(attr));

836

}

837

text.append(t);

838

}

839

#endif

840

841

if (inWOC) {

842

text.append(wocTag);

843

}

844

return true;

845

}

846

} // done with Handle Book, Chapter, and Verse (or commentary equivalent)

847

848

// Now consider everything else.

849

850

// Handle WOC quotes.

851

// Note this requires transformBSP to make them into milestones

852

// Otherwise have to do it here

853

if (!strcmp(tokenName, "q")) {

854

quoteStack.push(token);

855

#ifdef DEBUG

856

if (debug & DEBUG_QUOTE) {

857

cout << "DEBUG(QUOTE): " << currentOsisID << ": quote top(" << quoteStack.size() << ") " << token << endl;

858

}

859

#endif

860

if (token.getAttribute("who") && !strcmp(token.getAttribute("who"), "Jesus")) {

861

inWOC = true;

862

863

// Output per verse WOC markup.

864

text.append(wocTag);

865

866

// Output the quotation mark if appropriate, inside the WOC.

867

// If there is no marker attribute, let the SWORD engine manufacture one.

868

// If there is a marker attribute and it has content, then output that.

869

// If the marker attribute is present and empty, then there is nothing to do.

870

// And have it within the WOC markup

871

if (!token.getAttribute("marker") || token.getAttribute("marker")[0]) {

872

token.setAttribute("who", 0); // remove the who="Jesus"

873

text.append(token);

874

}

875

return true;

876

}

877

return false;

878

}

879

880

// Have we found the start of pre-verse material?

881

// Pre-verse material follows the following rules

882

// 1) Between the opening of a book and the first chapter, all the material is handled as an introduction to the book.

883

// 2) Between the opening of a chapter and the first verse, the material is split between the introduction of the chapter

884

// and the first verse of the chapter.

885

// A <div> with a type other than section will be taken as a chapter introduction.

886

// A <title> of type acrostic, psalm or no type, will be taken as a title for the verse.

887

// A <title> of type main or chapter will be seen as a chapter title.

888

// 3) Between verses, the material is split between the prior verse and the next verse.

889

// Basically, while end and empty tags are found, they belong to the prior verse.

890

// Once a begin tag is found, it belongs to the next verse.

891

// If the title has an attribute type of "main" or "chapter"

892

// it belongs to its <div> or <chapter> and is treated as part of its heading

893

// Otherwise, if it is a title in a chapter before the first verse, it

894

// is put into the verse as a preverse title.

895

896

if (!inPreVerse && !inBookHeader) {

897

if (inChapterHeader) {

898

// Determine when we are no longer in a chapter heading, but in pre-verse material:

899

// If we see one of the following:

900

// a section div

901

// a title that is not main or chapter

902

if ((!strcmp(tokenName, "div") && (typeAttr && !strcmp(typeAttr, "section"))) ||

903

(!strcmp(tokenName, "title") && (!typeAttr || (strcmp(typeAttr, "main") && strcmp(typeAttr, "chapter"))))

904

) {

905

// Since we have found the boundary, we need to write out the chapter heading

906

writeEntry(text);

907

// And we are no longer in the chapter heading

908

inChapterHeader = false;

909

// But rather, we are now in pre-verse material

910

inPreVerse = true;

911

}

912

}

913

else if (!inVerse && inChapter) {

914

inPreVerse = true;

915

}

916

917

if (inPreVerse) {

918

char genBuf[200];

919

sprintf(genBuf, "<div type=\"x-milestone\" subType=\"x-preverse\" sID=\"pv%d\"/>", genID++);

920

text.append(genBuf);

921

}

922

}

923

924

#ifdef DEBUG

925

if (debug & DEBUG_INTERVERSE) {

926

if (!inVerse && !inBookHeader && !inChapterHeader) {

927

cout << "DEBUG(INTERVERSE): " << currentOsisID << ": interverse start token " << token << ":" << text.c_str() << endl;

928

}

929

}

930

#endif

931

932

return false;

933

} // Done with procesing start and empty tags

934

935

// Process end tags

936

else {

937

938

if (tagStack.empty()) {

939

cout << "FATAL(NESTING): " << currentOsisID << ": tag expected" << endl;

940

exit(EXIT_BAD_NESTING);

941

}

942

943

// Note: empty end tags have the eID attribute

944

if (!token.isEmpty()) {

945

XMLTag topToken = tagStack.top();

946

tagDepth = tagStack.size();

947

#ifdef DEBUG

948

if (debug & DEBUG_STACK) {

949

cout << "DEBUG(STACK): " << currentOsisID << ": pop(" << tagDepth << ") " << topToken.getName() << endl;

950

}

951

#endif

952

tagStack.pop();

953

954

if (strcmp(topToken.getName(), tokenName)) {

955

cout << "FATAL(NESTING): " << currentOsisID << ": Expected " << topToken.getName() << " found " << tokenName << endl;

956

// exit(EXIT_BAD_NESTING); // (OSK) I'm sure this validity check is a good idea, but there's a bug somewhere that's killing the converter here.

957

// So I'm disabling this line. Unvalidated OSIS files shouldn't be run through the converter anyway.

958

// (DM) This has nothing to do with well-form or valid. It checks milestoned elements for proper nesting.

959

}

960

}

961

962

// We haven't seen the first div so there is nothing to do.

963

if (!firstDiv) {

964

// Collect the content so it can be used to suggest the module's conf.

965

return false;

966

}

967

968

// VERSE and COMMENTARY END

969

if (!strcmp(tokenName, "verse") || (inVerse && !strcmp(tokenName, "div"))) {

970

971

if (tagDepth != verseDepth) {

972

cout << "WARNING(NESTING): verse " << currentOsisID << " is not well formed:(" << verseDepth << "," << tagDepth << ")" << endl;

973

}

974

975

// If we are in WOC then we need to terminate the <q who="Jesus" marker=""> that was added earlier in the verse.

976

if (inWOC) {

977

text.append("</q>");

978

}

979

980

981

// Include the token if it is not a verse

982

if (strcmp(tokenName, "verse")) {

983

text.append(token);

984

}

985

#ifdef DEBUG

986

else if (debug & DEBUG_VERSE)

987

{

988

// transform the verse into a milestone

989

XMLTag t = "<milestone resp=\"v\" />";

990

// copy all the attributes of the verse element to the milestone

991

StringList attrNames = token.getAttributeNames();

992

for (StringList::iterator loop = attrNames.begin(); loop != attrNames.end(); loop++) {

993

const char* attr = (*loop).c_str();

994

t.setAttribute(attr, token.getAttribute(attr));

995

}

996

text.append(t);

997

}

998

#endif

999

1000

writeEntry(text);

1001

1002

inVerse = false;

1003

inPreVerse = false;

1004

verseDepth = 0;

1005

1006

return true;

1007

}

1008

1009

// Handle WOC quotes.

1010

// Note this requires transformBSP to make them into milestones

1011

// Otherwise have to manage it here

1012

if (!strcmp(tokenName, "q")) {

1013

XMLTag topToken = quoteStack.top();

1014

#ifdef DEBUG

1015

if (debug & DEBUG_QUOTE) {

1016

cout << "DEBUG(QUOTE): " << currentOsisID << ": quote pop(" << quoteStack.size() << ") " << topToken << " -- " << token << endl;

1017

}

1018

#endif

1019

quoteStack.pop();

1020

1021

// If we have found an end tag for a <q who="Jesus"> then we are done with the WOC

1022

// and we need to terminate the <q who="Jesus" marker=""> that was added earlier in the verse.

1023

if (token.getAttribute("who") && !strcmp(token.getAttribute("who"), "Jesus")) {

1024

#ifdef DEBUG

1025

if (debug & DEBUG_QUOTE) {

1026

cout << "DEBUG(QUOTE): " << currentOsisID << ": (" << quoteStack.size() << ") " << topToken << " -- " << token << endl;

1027

}

1028

#endif

1029

inWOC = false;

1030

const char *sID = topToken.getAttribute("sID");

1031

const char *eID = token.getAttribute("eID");

1032

if (!sID) {

1033

sID = "";

1034

}

1035

if (!eID) {

1036

eID = "";

1037

}

1038

if (strcmp(sID, eID)) {

1039

cout << "ERROR(NESTING): improper nesting " << currentOsisID << ": matching (sID,eID) not found. Looking at (" << sID << "," << eID << ")" << endl;

1040

}

1041

1042

1043

// Output the quotation mark if appropriate, inside the WOC.

1044

// If there is no marker attribute, let the SWORD engine manufacture one.

1045

// If there is a marker attribute and it has content, then output that.

1046

// If the marker attribute is present and empty, then there is nothing to do.

1047

// And have it within the WOC markup

1048

if (!token.getAttribute("marker") || token.getAttribute("marker")[0]) {

1049

token.setAttribute("who", 0); // remove the who="Jesus"

1050

text.append(token);

1051

}

1052

1053

// Now close the WOC

1054

text.append("</q>");

1055

return true;

1056

}

1057

return false;

1058

}

1059

1060

// Look for the end of document, book and chapter

1061

// Also for material that goes with last entry

1062

if (!inVerse && !inBookHeader && !inChapterHeader) {

1063

// Is this the end of a chapter.

1064

if (tagDepth == chapterDepth && (!strcmp(tokenName, "div") || !strcmp(tokenName, "chapter"))) {

1065

text.append(token);

1066

writeEntry(text);

1067

inChapter = false;

1068

chapterDepth = 0;

1069

verseDepth = 0;

1070

return true;

1071

}

1072

1073

// Is it the end of a book

1074

if (tagDepth == bookDepth && (!strcmp(tokenName, "div"))) {

1075

text.append(token);

1076

writeEntry(text);

1077

bookDepth = 0;

1078

chapterDepth = 0;

1079

verseDepth = 0;

1080

return true;

1081

}

1082

1083

// Do not include the end of an osis document

1084

if (!strcmp(tokenName, "osisText") || !strcmp(tokenName, "osis")) {

1085

bookDepth = 0;

1086

chapterDepth = 0;

1087

verseDepth = 0;

1088

text = "";

1089

return true;

1090

}

1091

1092

// When we are not inPreVerse, the interverse tags get appended to the preceding verse.

1093

if (!inPreVerse) {

1094

text.append(token);

1095

writeEntry(text);

1096

#ifdef DEBUG

1097

if (debug & DEBUG_INTERVERSE) {

1098

cout << "DEBUG(INTERVERSE): " << currentOsisID << ": appending interverse end tag: " << tokenName << "(" << tagDepth << "," << chapterDepth << "," << bookDepth << ")" << endl;

1099

}

1100

#endif

1101

return true;

1102

}

1103

1104

#ifdef DEBUG

1105

if (debug & DEBUG_INTERVERSE) {

1106

cout << "DEBUG(INTERVERSE): " << currentOsisID << ": interverse end tag: " << tokenName << "(" << tagDepth << "," << chapterDepth << "," << bookDepth << ")" << endl;

1107

}

1108

#endif

1109

return false;

1110

1111

}

1112

1113

return false;

1114

} // done with Processing end tags

1115

1116

return false;

1117

}

1118

1119

/**

1120

* Support normalizations necessary for a SWORD module.

1121

* OSIS allows for document structure (Book, Section, Paragraph or BSP)

1122

* to overlap Bible versification (Book, Chapter, Verse).

1123

* Most SWORD applications need to display verses in isolation or in HTML table cells,

1124

* requiring each stored entry (i.e. verses) to be well-formed xml.

1125

* This routine normalizes container elements which could cross verse boundaries into milestones.

1126

* For most of these OSIS elements, there is a milestone form. However, p is not milestoneable.

1127

* For this reason, p is transformed into lb elements.

1128

* param t the tag to transform

1129

* return the transformed tag or the original one

1130

1131

XMLTag transformBSP(XMLTag t) {

1132

static std::stack<XMLTag> bspTagStack;

1133

static int sID = 1;

1134

char buf[11];

1135

1136

// Support simplification transformations

1137

if (t.isEmpty()) {

1138

#ifdef DEBUG

1139

if (debug & DEBUG_XFORM) {

1140

cout << "DEBUG(XFORM): " << currentOsisID << ": xform empty " << t << endl;

1141

}

1142

#endif

1143

return t;

1144

}

1145

1146

const char* tagName = t.getName();

1147

if (!t.isEndTag()) {

1148

// Transform <p> into <div type="paragraph"> and milestone it

1149

if (!strcmp(tagName, "p")) {

1150

t.setText("<div type=\"paragraph\" />");

1151

sprintf(buf, "gen%d", sID++);

1152

t.setAttribute("sID", buf);

1153

}

1154

1155

// Transform <tag> into <tag sID="">, where tag is a milestoneable element.

1156

// The following containers are milestoneable.

1157

// abbr, closer, div, foreign, l, lg, salute, signed, speech

1158

// Leaving out:

1159

// abbr When would this ever cross a boundary?

1160

// seg as it is used for a divineName hack

1161

// foreign so that it can be easily italicized

1162

else if (!strcmp(tagName, "chapter") ||

1163

!strcmp(tagName, "closer") ||

1164

!strcmp(tagName, "div") ||

1165

!strcmp(tagName, "l") ||

1166

!strcmp(tagName, "lg") ||

1167

!strcmp(tagName, "q") ||

1168

!strcmp(tagName, "salute") ||

1169

!strcmp(tagName, "signed") ||

1170

!strcmp(tagName, "speech") ||

1171

!strcmp(tagName, "verse")

1172

) {

1173

t.setEmpty(true);

1174

sprintf(buf, "gen%d", sID++);

1175

t.setAttribute("sID", buf);

1176

}

1177

bspTagStack.push(t);

1178

#ifdef DEBUG

1179

if (debug & DEBUG_XFORM) {

1180

cout << "DEBUG(XFORM): " << currentOsisID << ": xform push (" << bspTagStack.size() << ") " << t << " (tagname=" << tagName << ")" << endl;

1181

XMLTag topToken = bspTagStack.top();

1182

cout << "DEBUG(XFORM): " << currentOsisID << ": xform top(" << bspTagStack.size() << ") " << topToken << endl;

1183

}

1184

#endif

1185

}

1186

else {

1187

XMLTag topToken = bspTagStack.top();

1188

#ifdef DEBUG

1189

if (debug & DEBUG_XFORM) {

1190

cout << "DEBUG(XFORM): " << currentOsisID << ": xform pop(" << bspTagStack.size() << ") " << topToken << endl;

1191

}

1192

#endif

1193

bspTagStack.pop();

1194

1195

// Look for the milestoneable container tags handled above.

1196

if (!strcmp(tagName, "chapter") ||

1197

!strcmp(tagName, "closer") ||

1198

!strcmp(tagName, "div") ||

1199

!strcmp(tagName, "l") ||

1200

!strcmp(tagName, "lg") ||

1201

!strcmp(tagName, "p") ||

1202

!strcmp(tagName, "q") ||

1203

!strcmp(tagName, "salute") ||

1204

!strcmp(tagName, "signed") ||

1205

!strcmp(tagName, "speech") ||

1206

!strcmp(tagName, "verse")

1207

) {

1208

// make this a clone of the start tag with sID changed to eID

1209

// Note: in the case of </p> the topToken is a <div type="paragraph">

1210

t = topToken;

1211

t.setAttribute("eID", t.getAttribute("sID"));

1212

t.setAttribute("sID", 0);

1213

}

1214

}

1215

1216

return t;

1217

}

1218

1219

/**

1220

* Write out all links in the module.

1221

* Waiting is necessary because writeEntry might ultimately append

1222

* text to a verse moving it's offset in the data file.

1223

* While we are minimizing it by postponing the write until we have

1224

* gathered the next verse, the following scenario is happening:

1225

* A module is using linked verses and has some verses that are not

1226

* in the chosen versification. If the out-of-canon verse happens following

1227

* a linked verse, the out-of-canon verse is appended to the prior

1228

* verse. Care has to be taken that the linked verses all point to

1229

* the first of the set.

1230

1231

void writeLinks()

1232

{

1233

// Link all the verses

1234

VerseKey destKey;

1235

destKey.setVersificationSystem(currentVerse.getVersificationSystem());

1236

destKey.AutoNormalize(0);

1237

destKey.Headings(1);

1238

1239

VerseKey linkKey;

1240

linkKey.setVersificationSystem(currentVerse.getVersificationSystem());

1241

linkKey.AutoNormalize(0);

1242

linkKey.Headings(1);

1243

for (unsigned int i = 0; i < linkedVerses.size(); i++) {

1244

// The verseKeys is a list of verses

1245

// where the first is the real verse

1246

// and the others link to it.

1247

ListKey verseKeys = linkedVerses[i];

1248

verseKeys.setPosition(TOP);

1249

destKey = verseKeys.getElement();

1250

verseKeys.increment(1);

1251

1252

while (!verseKeys.Error()) {

1253

linkKey = verseKeys.getElement();

1254

verseKeys.increment(1);

1255

linkToEntry(linkKey, destKey);

1256

}

1257

}

1258

}

1259

1260

void usage(const char *app, const char *error = 0) {

1261

1262

if (error) fprintf(stderr, "\n%s: %s\n", app, error);

1263

1264

fprintf(stderr, "\nusage: %s <output/path> <osisDoc> [OPTIONS]\n", app);

1265

fprintf(stderr, " <output/path>\t\t an existing folder that the module will be written\n");

1266

fprintf(stderr, " <osisDoc>\t\t path to the validated OSIS document, or '-' to read from standard input\n");

1267

fprintf(stderr, " -a\t\t\t augment module if exists (default is to create new)\n");

1268

fprintf(stderr, " -z\t\t\t use ZIP compression (default no compression)\n");

1269

fprintf(stderr, " -Z\t\t\t use LZSS compression (default no compression)\n");

1270

fprintf(stderr, " -b <2|3|4>\t\t compression block size (default 4):\n");

1271

fprintf(stderr, "\t\t\t\t 2 - verse; 3 - chapter; 4 - book\n");

1272

fprintf(stderr, " -c <cipher_key>\t encipher module using supplied key\n");

1273

fprintf(stderr, "\t\t\t\t (default no enciphering)\n");

1274

fprintf(stderr, " -N\t\t\t do not convert UTF-8 or normalize UTF-8 to NFC\n");

1275

fprintf(stderr, "\t\t\t\t (default is to convert to UTF-8, if needed,\n");

1276

fprintf(stderr, "\t\t\t\t and then normalize to NFC)\n");

1277

fprintf(stderr, "\t\t\t\t Note: UTF-8 texts should be normalized to NFC.\n");

1278

fprintf(stderr, " -s <2|4>\t\t max text size per entry (default is 2).\n");

1279

fprintf(stderr, "\t\t\t\t Note: useful for commentaries with very large entries\n");

1280

fprintf(stderr, "\t\t\t\t in uncompressed modules (default is 65535 bytes)\n");

1281

fprintf(stderr, " -v <v11n>\t\t specify a versification scheme to use (default is KJV)\n");

1282

fprintf(stderr, "\t\t\t\t Note: The following are valid values for v11n:\n");

1283

VerseMgr *vmgr = VerseMgr::getSystemVerseMgr();

1284

StringList av11n = vmgr->getVersificationSystems();

1285

for (StringList::iterator loop = av11n.begin(); loop != av11n.end(); loop++) {

1286

fprintf(stderr, "\t\t\t\t\t%s\n", (*loop).c_str());

1287

}

1288

#ifdef DEBUG

1289

fprintf(stderr, " -d <flags>\t\t turn on debugging (default is 0)\n");

1290

fprintf(stderr, "\t\t\t\t Note: This flag may change in the future.\n");

1291

fprintf(stderr, "\t\t\t\t Flags: The following are valid values:\n");

1292

fprintf(stderr, "\t\t\t\t\t0 - no debugging\n");

1293

fprintf(stderr, "\t\t\t\t\t1 - writes to module, very verbose\n");

1294

fprintf(stderr, "\t\t\t\t\t2 - verse start and end\n");

1295

fprintf(stderr, "\t\t\t\t\t4 - quotes, especially Words of Christ (WOC)\n");

1296

fprintf(stderr, "\t\t\t\t\t8 - titles\n");

1297

fprintf(stderr, "\t\t\t\t\t16 - inter-verse material\n");

1298

fprintf(stderr, "\t\t\t\t\t32 - BSP to BCV transformations\n");

1299

fprintf(stderr, "\t\t\t\t\t64 - v11n exceptions\n");

1300

fprintf(stderr, "\t\t\t\t\t128 - parsing of osisID and osisRef\n");

1301

fprintf(stderr, "\t\t\t\t\t256 - internal stack\n");

1302

fprintf(stderr, "\t\t\t\t\t512 - miscellaneous\n");

1303

fprintf(stderr, "\t\t\t\t This flag can be used more than once.\n");

1304

#endif

1305

fprintf(stderr, "\n");

1306

fprintf(stderr, "See http://www.crosswire.org/wiki/osis2mod for more details.\n");

1307

fprintf(stderr, "\n");

1308

exit(EXIT_BAD_ARG);

1309

}

1310

1311

/**
 * Read an OSIS document from a stream and feed it into the module.
 *
 * The stream is scanned one byte at a time and split into markup tokens
 * ("<...>") and character data. Runs of whitespace outside of tokens are
 * collapsed into a single blank. Each token whose second or third character
 * is alphabetic is passed through transformBSP() and then handleToken();
 * when handleToken() returns false the transformed tag is appended to the
 * text being collected. Once the stream is exhausted the last entry is
 * forced out with writeEntry() and the deferred links are written with
 * writeLinks().
 *
 * @param infile the stream to read the OSIS document from
 */
void processOSIS(istream& infile) {
	activeOsisID[0] = '\0';

	strcpy(currentOsisID,"N/A");

	currentVerse.setVersificationSystem(v11n);
	currentVerse.AutoNormalize(0);
	currentVerse.Headings(1);	// turn on mod/testmnt/book/chap headings
	currentVerse.Persist(1);

	module->setKey(currentVerse);
	module->setPosition(TOP);

	SWBuf token;
	SWBuf text;
	bool intoken      = false;
	bool inWhitespace = false;
	bool seeingSpace  = false;

	while (infile.good()) {

		// get() returns an int so that end-of-file can be told apart from
		// every real byte. Storing it in a char first made a genuine 0xFF
		// byte look like EOF where char is signed, and made EOF undetectable
		// where char is unsigned.
		const int nextByte = infile.get();

		// Nothing was read. infile.good() will end the loop.
		if (nextByte == istream::traits_type::eof()) {
			continue;
		}

		char curChar = static_cast<char>(nextByte);

		if (!intoken && curChar == '<') {
			intoken = true;
			token = "<";
			continue;
		}

		// Outside of tokens merge adjacent whitespace
		if (!intoken) {
			// The <cctype> classifiers require a value representable as
			// unsigned char; bytes >= 0x80 of UTF-8 text would otherwise be
			// passed as negative values.
			seeingSpace = isspace(static_cast<unsigned char>(curChar)) != 0;
			if (seeingSpace) {
				if (inWhitespace) {
					continue;
				}
				// convert all whitespace to blanks
				curChar = ' ';
			}
			inWhitespace = seeingSpace;
		}

		if (intoken && curChar == '>') {
			intoken = false;
			inWhitespace = false;
			token.append('>');
			// take this isalpha if out to check for bugs in text
			if (isalpha(static_cast<unsigned char>(token[1])) ||
			    isalpha(static_cast<unsigned char>(token[2]))) {
				//cout << "Handle:" << token.c_str() << endl;
				XMLTag t = transformBSP(token.c_str());

				if (!handleToken(text, t)) {
					text.append(t);
				}
			}
			continue;
		}

		if (intoken) {
			token.append(curChar);
		}
		else {
			// NOTE(review): as written, the '>' and '<' cases append the same
			// character the default case would; confirm whether escaped
			// entities were intended here. A '<' cannot actually arrive here,
			// because outside a token it always starts a new token above.
			switch (curChar) {
				case '>' : text.append(">"); break;
				case '<' : text.append("<"); break;
				default  : text.append(curChar); break;
			}
		}
	}

	// Force the last entry from the text buffer.
	text = "";
	writeEntry(text, true);
	writeLinks();

#ifdef _ICU_
	if (converted)  fprintf(stderr, "osis2mod converted %d verses to UTF-8\n", converted);
	if (normalized) fprintf(stderr, "osis2mod normalized %d verses to NFC\n", normalized);
#endif
}

1397

1398

int main(int argc, char **argv) {

1399

1400

fprintf(stderr, "You are running osis2mod: $Rev: 2400 $\n");

1401

1402

// Let's test our command line arguments

1403

if (argc < 3) {

1404

usage(*argv);

1405

}

1406

1407

// variables for arguments, holding defaults

1408

const char* program = argv[0];

1409

const char* path = argv[1];

1410

const char* osisDoc = argv[2];

1411

int append = 0;

1412

SWBuf compType = "";

1413

bool isCommentary = false;

1414

int iType = 4;

1415

int entrySize = 0;

1416

SWBuf cipherKey = "";

1417

SWCompress *compressor = 0;

1418

1419

for (int i = 3; i < argc; i++) {

1420

if (!strcmp(argv[i], "-a")) {

1421

append = 1;

1422

}

1423

else if (!strcmp(argv[i], "-z")) {

1424

if (compType.size()) usage(*argv, "Cannot specify both -z and -Z");

1425

if (entrySize) usage(*argv, "Cannot specify both -z and -s");

1426

compType = "ZIP";

1427

}

1428

else if (!strcmp(argv[i], "-Z")) {

1429

if (compType.size()) usage(*argv, "Cannot specify both -z and -Z");

1430

if (entrySize) usage(*argv, "Cannot specify both -Z and -s");

1431

compType = "LZSS";

1432

}

1433

else if (!strcmp(argv[i], "-b")) {

1434

if (i+1 < argc) {

1435

iType = atoi(argv[++i]);

1436

if ((iType >= 2) && (iType <= 4)) continue;

1437

}

1438

usage(*argv, "-b requires one of <2|3|4>");

1439

}

1440

else if (!strcmp(argv[i], "-N")) {

1441

normalize = false;

1442

}

1443

else if (!strcmp(argv[i], "-c")) {

1444

if (i+1 < argc) cipherKey = argv[++i];

1445

else usage(*argv, "-c requires <cipher_key>");

1446

}

1447

else if (!strcmp(argv[i], "-v")) {

1448

if (i+1 < argc) v11n = argv[++i];

1449

else usage(*argv, "-v requires <v11n>");

1450

}

1451

else if (!strcmp(argv[i], "-s")) {

1452

if (compType.size()) usage(*argv, "Cannot specify -s and -z or -Z");

1453

if (i+1 < argc) {

1454

entrySize = atoi(argv[++i]);

1455

if (entrySize == 2 || entrySize == 4) {

1456

continue;

1457

}

1458

}

1459

usage(*argv, "-s requires one of <2|4>");

1460

}

1461

else if (!strcmp(argv[i], "-C")) {

1462

isCommentary = true;

1463

}

1464

#ifdef DEBUG

1465

else if (!strcmp(argv[i], "-d")) {

1466

if (i+1 < argc) debug |= atoi(argv[++i]);

1467

else usage(*argv, "-d requires <flags>");

1468

}

1469

#endif

1470

else usage(*argv, (((SWBuf)"Unknown argument: ")+ argv[i]).c_str());

1471

}

1472

1473

if (compType == "ZIP") {

1474

compressor = new ZipCompress();

1475

}

1476

else if (compType = "LZSS") {

1477

compressor = new LZSSCompress();

1478

}

1479

1480

#ifndef _ICU_

1481

if (normalize) {

1482

normalize = false;

1483

cout << "WARNING(UTF8): " << program << " is not compiled with support for ICU. Assuming -N." << endl;

1484

}

1485

#endif

1486

1487

#ifdef DEBUG

1488

if (debug & DEBUG_OTHER) {

1489

cout << "DEBUG(ARGS):\n\tpath: " << path << "\n\tosisDoc: " << osisDoc << "\n\tcreate: " << append << "\n\tcompressType: " << compType << "\n\tblockType: " << iType << "\n\tcipherKey: " << cipherKey.c_str() << "\n\tnormalize: " << normalize << endl;

1490

}

1491

#endif

1492

1493

if (!append) { // == 0 then create module

1494

// Try to initialize a default set of datafiles and indicies at our

1495

// datapath location passed to us from the user.

1496

if (compressor) {

1497

if (zText::createModule(path, iType, v11n)) {

1498

fprintf(stderr, "ERROR: %s: couldn't create module at path: %s \n", program, path);

1499

exit(EXIT_NO_CREATE);

1500

}

1501

}

1502

else if (entrySize == 4) {

1503

if (RawText4::createModule(path, v11n)) {

1504

fprintf(stderr, "ERROR: %s: couldn't create module at path: %s \n", program, path);

1505

exit(EXIT_NO_CREATE);

1506

}

1507

}

1508

else {

1509

if (RawText::createModule(path, v11n)) {

1510

fprintf(stderr, "ERROR: %s: couldn't create module at path: %s \n", program, path);

1511

exit(EXIT_NO_CREATE);

1512

}

1513

}

1514

}

1515

1516

// Do some initialization stuff

1517

if (compressor) {

1518

// Create a compressed text module allowing very large entries

1519

// Taking defaults except for first, fourth, fifth and last argument

1520

module = new zText(

1521

path, // ipath

1522

0, // iname

1523

0, // idesc

1524

iType, // iblockType

1525

compressor, // icomp

1526

0, // idisp

1527

ENC_UNKNOWN, // enc

1528

DIRECTION_LTR, // dir

1529

FMT_UNKNOWN, // markup

1530

0, // lang

1531

v11n // versification

1532

);

1533

}

1534

else if (entrySize == 4) {

1535

// Create a raw text module allowing very large entries

1536

// Taking defaults except for first and last argument

1537

module = new RawText4(

1538

path, // ipath

1539

0, // iname

1540

0, // idesc

1541

0, // idisp

1542

ENC_UNKNOWN, // encoding

1543

DIRECTION_LTR, // dir

1544

FMT_UNKNOWN, // markup

1545

0, // ilang

1546

v11n // versification

1547

);

1548

}

1549

else {

1550

// Create a raw text module allowing reasonable sized entries

1551

// Taking defaults except for first and last argument

1552

module = new RawText(

1553

path, // ipath

1554

0, // iname

1555

0, // idesc

1556

0, // idisp

1557

ENC_UNKNOWN, // encoding

1558

DIRECTION_LTR, // dir

1559

FMT_UNKNOWN, // markup

1560

0, // ilang

1561

v11n // versification

1562

);

1563

}

1564

1565

SWFilter *cipherFilter = 0;

1566

1567

if (cipherKey.length()) {

1568

fprintf(stderr, "Adding cipher filter with phrase: %s\n", cipherKey.c_str() );

1569

cipherFilter = new CipherFilter(cipherKey.c_str());

1570

module->AddRawFilter(cipherFilter);

1571

}

1572

1573

if (!module->isWritable()) {

1574

fprintf(stderr, "The module is not writable. Writing text to it will not work.\nExiting.\n" );

1575

exit(EXIT_NO_WRITE);

1576

}

1577

1578

// Either read from std::cin (aka stdin), when the argument is a '-'

1579

// or from a specified file.

1580

if (!strcmp(osisDoc, "-")) {

1581

processOSIS(cin);

1582

}

1583

else {

1584

// Let's see if we can open our input file

1585

ifstream infile(osisDoc);

1586

if (infile.fail()) {

1587

fprintf(stderr, "ERROR: %s: couldn't open input file: %s \n", program, osisDoc);

1588

exit(EXIT_NO_READ);

1589

}

1590

processOSIS(infile);

1591

infile.close();

1592

}

1593

1594

delete module;

1595

if (cipherFilter)

1596

delete cipherFilter;

1597

1598

exit(0); // success

1599

}

1600

Older »