~ubuntu-branches/ubuntu/maverick/uim/maverick

Viewing changes to sigscheme/doc/multibyte.html

Committer: Bazaar Package Importer
Author(s): Masahito Omote
Date: 2008-05-18 22:18:10 UTC
mfrom: (1.1.8 upstream)
mto: This revision was merged to the branch mainline in revision 5.
Revision ID: james.westby@ubuntu.com-20080518221810-4d2rd0ca18xnu8kc

Tags: 1:1.5.1-1

* New upstream release
* uim-qt3: Add uim inputcontext plugin for Qt3. And due to uim-*-qt are
  not supported in Qt4 for now officially, uim-*-qt are contained in
  this package.
* uim-qt: Depends uim-qt3 because of described above.
* libuim6: New package for syncing with upstream upgrade soversion.
* 05_qmake_bug_workaround.dpatch: patch for the workaround that qmake does
  not add link option against other libraries(e.g. -lX11) by default.

files added:
debian/libuim6.install

debian/patches/05_qmake_bug_workaround.dpatch

debian/uim-qt3.install

debian/uim-qt3.menu

doc/ENV

doc/PACKAGING

emacs/uim-version.el

emacs/uim-version.el.in

gtk/gtk-rc-get-immodule-file.c

m4/ax_func_sigsetjmp.m4

m4/ax_path_qmake4.m4

m4/eb4.m4

m4/wnn.m4

notify

notify/Makefile.am

notify/Makefile.in

notify/uim-knotify3.cc

notify/uim-libnotify.c

pixmaps/anthy-utf8.png

pixmaps/elatin.png

pixmaps/elatin.svg

pixmaps/look.png

pixmaps/look.svg

pixmaps/sj3.png

pixmaps/sj3.svg

pixmaps/uim-m17nlib-relink-icons.in

pixmaps/wnn.png

pixmaps/wnn.svg

qt4/Makefile.am

qt4/Makefile.in

qt4/edittest

qt4/edittest/Makefile.am

qt4/edittest/Makefile.in

qt4/edittest/README

qt4/edittest/edittest.pro

qt4/edittest/main.cpp

qt4/immodule

qt4/immodule/INDENT

qt4/immodule/Makefile.am

qt4/immodule/Makefile.in

qt4/immodule/README.en

qt4/immodule/README.ja

qt4/immodule/candidatewindow.cpp

qt4/immodule/candidatewindow.h

qt4/immodule/debug.h

qt4/immodule/plugin.cpp

qt4/immodule/plugin.h

qt4/immodule/qhelpermanager.cpp

qt4/immodule/qhelpermanager.h

qt4/immodule/qtextutil.cpp

qt4/immodule/qtextutil.h

qt4/immodule/quiminfomanager.cpp

qt4/immodule/quiminfomanager.h

qt4/immodule/quiminputcontext.cpp

qt4/immodule/quiminputcontext.h

qt4/immodule/quiminputcontext_compose.cpp

qt4/immodule/quiminputcontext_compose.h

qt4/immodule/quiminputcontext_with_slave.cpp

qt4/immodule/quiminputcontext_with_slave.h

qt4/immodule/quiminputcontextplugin.pro.in

qt4/immodule/subwindow.cpp

qt4/immodule/subwindow.h

replace/bsd-asprintf.c

replace/bsd-snprintf.c

replace/fake-rfc2553.c

replace/fake-rfc2553.h

replace/strtoll.c

replace/strtonum.c

scm/anthy-utf8-custom.scm

scm/anthy-utf8.scm

scm/deprecated-util.scm

scm/editline.scm

scm/elatin-custom.scm

scm/elatin-rules.scm

scm/elatin.scm

scm/ichar.scm

scm/iso-639-1.scm

scm/look-custom.scm

scm/look.scm

scm/sj3-custom.scm

scm/sj3-key-custom.scm

scm/sj3.scm

scm/tutcode-bushudic.scm

scm/tutcode-custom.scm

scm/tutcode-rule.scm

scm/wnn-custom.scm

scm/wnn-key-custom.scm

scm/wnn.scm

sigscheme/doc/multibyte.html

sigscheme/doc/multibyte.txt

sigscheme/lib/sigscheme-init.scm

sigscheme/lib/srfi-0.scm

sigscheme/lib/srfi-1.scm

sigscheme/lib/srfi-43.scm

sigscheme/lib/srfi-55.scm

sigscheme/lib/srfi-69.scm

sigscheme/lib/srfi-9.scm

sigscheme/lib/srfi-95.scm

sigscheme/lib/unittest.scm

sigscheme/m4/ax_func_sigsetjmp.m4

sigscheme/sigscheme.mk.in

sigscheme/src/functable-legacy-macro.c

sigscheme/src/functable-srfi43.c

sigscheme/src/functable-srfi55.c

sigscheme/src/functable-srfi9.c

sigscheme/src/legacy-macro.c

sigscheme/src/module-srfi43.c

sigscheme/src/module-srfi55.c

sigscheme/src/module-srfi9.c

sigscheme/test-c/test-array2list-coll.c

sigscheme/test-c/test-array2list.c

sigscheme/test-c/test-gc-protect-coll.c

sigscheme/test-c/test-gc-protect.c

sigscheme/test/gauche-let-optionals.scm

sigscheme/test/oleg-srfi2.scm

sigscheme/test/scm-r4rstest.scm

sigscheme/test/test-char-pred.scm

sigscheme/test/test-fail.scm

sigscheme/test/test-legacy-macro.scm

sigscheme/test/test-srfi0.scm

sigscheme/test/test-srfi1-another.scm

sigscheme/test/test-srfi1-obsolete.scm

sigscheme/test/test-srfi43.scm

sigscheme/test/test-srfi55.scm

sigscheme/test/test-srfi9.scm

sigscheme/test/test-sscm-ext.scm

sigscheme/test/test-string-proc.scm

sigscheme/test/test-unittest.scm

test/test-anthy.scm

uim/anthy-utf8.c

uim/bsdlook.c

uim/bsdlook.h

uim/counted-init.c

uim/counted-init.h

uim/encoding-table.c

uim/iconv.c

uim/look.c

uim/rk.c

uim/sj3.c

uim/uim-error.c

uim/uim-notify.c

uim/uim-notify.h

uim/uim-posix.c

uim/uim-posix.h

uim/uim-scm-abbrev.h

uim/uim-scm-sigscheme.c

uim/uim-x-kana-input-hack.c

uim/uim-x-util.h

uim/wnnlib.c

uim/wnnlib.h

files removed:
debian/libuim5.install

debian/uim-qt.menu

scm/spellcheck-custom.scm

scm/spellcheck.scm

scm/uim-db.scm

sigscheme/doc/gc-protection.html

sigscheme/doc/gc-protection.txt

sigscheme/doc/test-c.html

sigscheme/doc/test-c.txt

sigscheme/lib/slib.scm

sigscheme/test/test-r4rs.scm

sigscheme/test/test-srfi1.scm

sigscheme/test/unittest.scm

test/test-db.scm

test/test-slib.scm

uim/editline.h

uim/iso-639-1.def

uim/uim-compat-scm.c

uim/uim-compat-scm.h

uim/uim-encoding.h

uim/uim-scm.c

files modified:
AUTHORS

COPYING

ChangeLog

Makefile.am

Makefile.in

NEWS

RELNOTE

aclocal.m4

config.guess

config.sub

configure

configure.ac

debian/changelog

debian/control

debian/patches/00list

debian/patches/01_support_skk_alternatives.dpatch

debian/rules

debian/uim-anthy.install

debian/uim-anthy.postinst

debian/uim-common.install

debian/uim-el.install

debian/uim-latin.install

debian/uim-qt.install

depcomp

doc/00INDEX

doc/COMPATIBILITY

doc/Makefile.am

doc/Makefile.in

doc/RELEASING

doc/UIM-SCM

doc/UIM-SH

emacs/Makefile.am

emacs/Makefile.in

emacs/README

emacs/README.ja

emacs/callback.h

emacs/candidate.h

emacs/commit.h

emacs/context.c

emacs/context.h

emacs/debug.h

emacs/encoding.h

emacs/helper-message.h

emacs/helper-server.h

emacs/helper.h

emacs/im.h

emacs/key.c

emacs/key.h

emacs/output.h

emacs/preedit.h

emacs/prop.h

emacs/uim-candidate.el

emacs/uim-el-agent.c

emacs/uim-el-agent.h

emacs/uim-el-helper-agent.c

emacs/uim-el-helper-agent.h

emacs/uim-el-types.h

emacs/uim-helper.el

emacs/uim-key.el

emacs/uim-keymap.el

emacs/uim-leim.el

emacs/uim-util.el

emacs/uim-var.el

emacs/uim.el

examples/Makefile.in

examples/uim-custom/Makefile.am

examples/uim-custom/Makefile.in

examples/uim-custom/uim-custom-update.c

fep/Makefile.am

fep/Makefile.in

fep/README

fep/README.ja

fep/callbacks.c

fep/callbacks.h

fep/draw.c

fep/draw.h

fep/escseq.h

fep/helper.h

fep/key.h

fep/read.h

fep/str.h

fep/udsock.c

fep/udsock.h

fep/uim-fep.c

gtk/Makefile.am

gtk/Makefile.in

gtk/compose.h

gtk/gtk-im-uim.c

gtk/key-util-gtk.c

gtk/key-util-gtk.h

gtk/test/Makefile.in

gtk/test/entry.c

gtk/text-util.h

gtk/uim-cand-win-gtk.c

gtk/uim-cand-win-gtk.h

gtk/uim-eb.c

gtk/uim-eb.h

helper/GNOME_UimApplet.server.in.in

helper/Makefile.am

helper/Makefile.in

helper/candwin-gtk.c

helper/dict-anthy.h

helper/dict-canna-cclass.h

helper/dict-canna.h

helper/dict-cclass-dialog.h

helper/dict-dict.h

helper/dict-util.h

helper/dict-word-list-view-gtk.h

helper/dict-word-list-win-gtk.c

helper/dict-word-list-win-gtk.h

helper/dict-word-win-gtk.h

helper/dict-word.h

helper/eggtrayicon.h

helper/im-switcher-gtk.c

helper/pref-gtk-custom-widgets.c

helper/pref-gtk.c

helper/toolbar-common-gtk.c

install-sh

intltool-extract.in

intltool-merge.in

intltool-update.in

ltmain.sh

m4/Makefile.am

m4/Makefile.in

make-dist.sh

pixmaps/Makefile.am

pixmaps/Makefile.in

pixmaps/README

pixmaps/byeoru.png

pixmaps/direct.png

pixmaps/direct_input.png

pixmaps/hangul2.png

pixmaps/hangul3.png

pixmaps/im_switcher.png

pixmaps/ipa-x-sampa.png

pixmaps/ja_azik.png

pixmaps/ja_direct.png

pixmaps/ja_fullwidth_alnum.png

pixmaps/ja_halfkana.png

pixmaps/ja_halfwidth_alnum.png

pixmaps/ja_hiragana.png

pixmaps/ja_kana.png

pixmaps/ja_katakana.png

pixmaps/ja_nicola.png

pixmaps/ja_pocketbell.png

pixmaps/ja_romaji.png

pixmaps/ko_direct.png

pixmaps/ko_hangulchar.png

pixmaps/ko_hangulword.png

pixmaps/latin.png

pixmaps/mana.png

pixmaps/off.png

pixmaps/on.png

pixmaps/pinyin-big5.png

pixmaps/prime_mode_application.png

pixmaps/py.png

pixmaps/pyunihan.png

pixmaps/romaja.png

pixmaps/scim.png

pixmaps/skk.png

pixmaps/tcode.png

pixmaps/trycode.png

pixmaps/tutcode.png

pixmaps/uim-dict.png

pixmaps/unknown.png

pixmaps/viqr.png

po/Makefile.in.in

po/POTFILES.in

po/fr.po

po/ja.po

po/ko.po

qt/Makefile.am

qt/Makefile.in

qt/candwin-qt.h

qt/chardict/Makefile.in

qt/chardict/chardict-bushuviewwidget.h

qt/chardict/chardict-chargridview.h

qt/chardict/chardict-qt.h

qt/chardict/chardict-unicodeviewwidget.h

qt/chardict/po/Makefile.in.in

qt/chardict/po/ja.po

qt/chardict/qtgettext.h

qt/immodule-candidatewindow.h

qt/immodule-plugin.cpp

qt/immodule-plugin.h

qt/immodule-qhelpermanager.cpp

qt/immodule-qhelpermanager.h

qt/immodule-qtextutil.h

qt/immodule-quiminfomanager.cpp

qt/immodule-quiminfomanager.h

qt/immodule-quiminputcontext.cpp

qt/immodule-quiminputcontext.h

qt/immodule-quiminputcontext_compose.h

qt/immodule-quiminputcontext_with_slave.h

qt/immodule-subwindow.h

qt/pref-customwidgets.cpp

qt/pref-customwidgets.h

qt/pref-qt.cpp

qt/pref-qt.h

qt/qtgettext.h

qt/switcher-qt.h

qt/test/Makefile.in

qt/test/qedittest.cpp

qt/toolbar-applet-kde.h

qt/toolbar-common-quimhelpertoolbar.cpp

qt/toolbar-common-quimhelpertoolbar.h

qt/toolbar-common-uimstateindicator.h

qt/toolbar-standalone-qt.h

replace/Makefile.am

replace/Makefile.in

replace/os_dep.h

scm/Makefile.am

scm/Makefile.in

scm/anthy-custom.scm

scm/anthy-key-custom.scm

scm/anthy.scm

scm/byeoru-custom.scm

scm/byeoru-dic.scm

scm/byeoru-key-custom.scm

scm/byeoru-symbols.scm

scm/byeoru.scm

scm/canna-custom.scm

scm/canna-key-custom.scm

scm/canna.scm

scm/custom-rt.scm

scm/custom.scm

scm/generic-custom.scm

scm/generic-key-custom.scm

scm/generic.scm

scm/hangul.scm

scm/i18n.scm

scm/im-custom.scm

scm/im-switcher.scm

scm/im.scm

scm/init.scm

scm/japanese.scm

scm/key.scm

scm/latin.scm

scm/lazy-load.scm

scm/load-action.scm

scm/m17nlib.scm

scm/mana-custom.scm

scm/mana-key-custom.scm

scm/mana.scm

scm/plugin.scm

scm/prime-custom.scm

scm/prime-key-custom.scm

scm/prime.scm

scm/rk.scm

scm/romaja.scm

scm/skk-custom.scm

scm/skk-dialog.scm

scm/skk-editor.scm

scm/skk-key-custom.scm

scm/skk.scm

scm/tcode.scm

scm/trycode.scm

scm/tutcode-key-custom.scm

scm/tutcode.scm

scm/uim-module-manager.scm

scm/uim-sh.scm

scm/ustr.scm

scm/util.scm

sigscheme/COPYING

sigscheme/ChangeLog

sigscheme/Makefile.am

sigscheme/Makefile.in

sigscheme/NEWS

sigscheme/QALog

sigscheme/README

sigscheme/RELNOTE

sigscheme/TODO

sigscheme/aclocal.m4

sigscheme/bench/Makefile.in

sigscheme/config.guess

sigscheme/config.sub

sigscheme/configure

sigscheme/configure.in

sigscheme/depcomp

sigscheme/doc/Makefile.am

sigscheme/doc/Makefile.in

sigscheme/doc/design.html

sigscheme/doc/global-obj.html

sigscheme/doc/index.html

sigscheme/doc/index.txt

sigscheme/doc/release.html

sigscheme/doc/release.txt

sigscheme/doc/spec.html

sigscheme/doc/spec.txt

sigscheme/doc/style.html

sigscheme/include/Makefile.in

sigscheme/include/sigscheme/Makefile.in

sigscheme/install-sh

sigscheme/lib/Makefile.am

sigscheme/lib/Makefile.in

sigscheme/libgcroots/Makefile.in

sigscheme/libgcroots/aclocal.m4

sigscheme/libgcroots/config.guess

sigscheme/libgcroots/config.sub

sigscheme/libgcroots/configure

sigscheme/libgcroots/depcomp

sigscheme/libgcroots/install-sh

sigscheme/libgcroots/ltmain.sh

sigscheme/libgcroots/m4/Makefile.in

sigscheme/ltmain.sh

sigscheme/m4/Makefile.am

sigscheme/m4/Makefile.in

sigscheme/make-dist.sh

sigscheme/runbench.sh

sigscheme/runtest-tail-rec.sh

sigscheme/runtest.sh

sigscheme/sigscheme.pc.in

sigscheme/src/Makefile.am

sigscheme/src/Makefile.in

sigscheme/src/char.c

sigscheme/src/config.h.in

sigscheme/src/continuation.c

sigscheme/src/encoding-config.h

sigscheme/src/encoding.c

sigscheme/src/encoding.h

sigscheme/src/env.c

sigscheme/src/eval.c

sigscheme/src/format.c

sigscheme/src/functable-r5rs-load.c

sigscheme/src/functable-r5rs-port.c

sigscheme/src/functable-r5rs-string-procedure.c

sigscheme/src/functable-r5rs-vector.c

sigscheme/src/functable-siod.c

sigscheme/src/functable-srfi1.c

sigscheme/src/functable-sscm-core.c

sigscheme/src/functable-sscm-ext.c

sigscheme/src/gcroots/gcroots.c

sigscheme/src/gcroots/gcroots.h

sigscheme/src/libtool-version.mk

sigscheme/src/list.c

sigscheme/src/load.c

sigscheme/src/main.c

sigscheme/src/module-siod.c

sigscheme/src/module-srfi1.c

sigscheme/src/module-srfi2.c

sigscheme/src/module-srfi34.c

sigscheme/src/module-srfi8.c

sigscheme/src/module-sscm-ext.c

sigscheme/src/module.c

sigscheme/src/number-io.c

sigscheme/src/port.c

sigscheme/src/procedure.c

sigscheme/src/promise.c

sigscheme/src/read.c

sigscheme/src/scmport-mbchar.c

sigscheme/src/sigscheme-combined-trim.h

sigscheme/src/sigscheme.c

sigscheme/src/sigscheme.h

sigscheme/src/sigschemeinternal.h

sigscheme/src/storage-common.h

sigscheme/src/storage-compact.h

sigscheme/src/storage-fatty.h

sigscheme/src/storage-gc.c

sigscheme/src/string-procedure.c

sigscheme/src/string.c

sigscheme/src/symbol.c

sigscheme/src/vector.c

sigscheme/src/write.c

sigscheme/test-c/Makefile.am

sigscheme/test-c/Makefile.in

sigscheme/test-c/sscm-test.h

sigscheme/test-c/test-format-coll.c

sigscheme/test-c/test-format.c

sigscheme/test-c/test-gc-protect-stack-coll.c

sigscheme/test-c/test-gc-protect-stack.c

sigscheme/test-c/test-minishell.c

sigscheme/test-c/test-storage-coll.c

sigscheme/test-c/test-storage.c

sigscheme/test/Makefile.am

sigscheme/test/Makefile.in

sigscheme/test/bigloo-letrec.scm

sigscheme/test/gauche-euc-jp.scm

sigscheme/test/gauche-primsyn.scm

sigscheme/test/run-singletest.sh.in

sigscheme/test/test-apply.scm

sigscheme/test/test-assoc.scm

sigscheme/test/test-begin.scm

sigscheme/test/test-bool.scm

sigscheme/test/test-char-cmp.scm

sigscheme/test/test-char.scm

sigscheme/test/test-continuation.scm

sigscheme/test/test-define-internal.scm

sigscheme/test/test-define.scm

sigscheme/test/test-do.scm

sigscheme/test/test-dyn-extent.scm

sigscheme/test/test-enc-eucgeneric.scm

sigscheme/test/test-enc-eucjp.scm

sigscheme/test/test-enc-sjis.scm

sigscheme/test/test-enc-utf8.scm

sigscheme/test/test-eq.scm

sigscheme/test/test-equal.scm

sigscheme/test/test-eqv.scm

sigscheme/test/test-eval.scm

sigscheme/test/test-formal-syntax.scm

sigscheme/test/test-formatplus.scm

sigscheme/test/test-lambda.scm

sigscheme/test/test-let.scm

sigscheme/test/test-letrec.scm

sigscheme/test/test-letstar.scm

sigscheme/test/test-list.scm

sigscheme/test/test-map.scm

sigscheme/test/test-member.scm

sigscheme/test/test-misc.scm

sigscheme/test/test-named-let.scm

sigscheme/test/test-number-arith.scm

sigscheme/test/test-number-cmp.scm

sigscheme/test/test-number-io.scm

sigscheme/test/test-number-literal.scm

sigscheme/test/test-number-pred.scm

sigscheme/test/test-obsolete.scm

sigscheme/test/test-pair.scm

sigscheme/test/test-quote.scm

sigscheme/test/test-srfi2.scm

sigscheme/test/test-srfi28.scm

sigscheme/test/test-srfi34-2.scm

sigscheme/test/test-srfi34.scm

sigscheme/test/test-srfi38.scm

sigscheme/test/test-srfi48.scm

sigscheme/test/test-srfi6.scm

sigscheme/test/test-srfi60.scm

sigscheme/test/test-srfi8.scm

sigscheme/test/test-string-cmp.scm

sigscheme/test/test-string-core.scm

sigscheme/test/test-string-null.scm

sigscheme/test/test-string.scm

sigscheme/test/test-symbol.scm

sigscheme/test/test-syntax-rules.scm

sigscheme/test/test-syntax.scm

sigscheme/test/test-tail-rec.scm

sigscheme/test/test-values.scm

sigscheme/test/test-vector.scm

sigscheme/test/unittest-bigloo.scm

sigscheme/test/unittest-gauche.scm

sigscheme/tools/Makefile.in

test/Makefile.am

test/Makefile.in

test/test-action.scm

test/test-custom-rt.scm

test/test-custom.scm

test/test-example.scm

test/test-i18n.scm

test/test-im.scm

test/test-intl.scm

test/test-key.scm

test/test-lazy-load.scm

test/test-plugin.scm

test/test-uim-test-utils.scm

test/test-uim-util.scm

test/test-ustr.scm

test/test-util.scm

test/uim-test-utils.scm

uim.desktop

uim.desktop.in.in

uim.pc.in

uim.spec

uim/Makefile.am

uim/Makefile.in

uim/agent.c

uim/anthy.c

uim/canna.c

uim/config.h.in

uim/editline.c

uim/intl.c

uim/libtool-version.mk

uim/m17nlib.c

uim/mana.c

uim/plugin.c

uim/plugin.h

uim/prime.c

uim/scim.cpp

uim/skk.c

uim/uim-custom.c

uim/uim-custom.h

uim/uim-func.c

uim/uim-helper-client.c

uim/uim-helper-server.c

uim/uim-helper.c

uim/uim-helper.h

uim/uim-im-switcher.h

uim/uim-internal.h

uim/uim-ipc.c

uim/uim-key.c

uim/uim-module-manager.c

uim/uim-scm.h

uim/uim-sh.c

uim/uim-util.c

uim/uim-util.h

uim/uim.c

uim/uim.h

xim/Makefile.am

xim/Makefile.in

xim/canddisp.cpp

xim/canddisp.h

xim/compose.cpp

xim/compose.h

xim/connection.cpp

xim/connection.h

xim/convdisp.cpp

xim/convdisp.h

xim/helper.h

xim/locale.cpp

xim/main.cpp

xim/util.cpp

xim/util.h

xim/xdispatch.h

xim/xim.h

xim/ximic.cpp

xim/ximim.cpp

xim/ximpacket.cpp

xim/ximpn.h

xim/ximserver.cpp

xim/ximserver.h

xim/ximtrans.cpp

Show diffs side-by-side

added added

removed removed

sigscheme/doc/multibyte.html

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN"

"http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">

<head>

/* Debug borders */

p, li, dt, dd, div, pre, h1, h2, h3, h4, h5, h6 {

border: 1px solid red;

}

body {

margin: 1em 5% 1em 5%;

}

a {

color: blue;

text-decoration: underline;

}

a:visited {

color: fuchsia;

}

em {

font-style: italic;

}

strong {

font-weight: bold;

}

tt {

color: navy;

}

h1, h2, h3, h4, h5, h6 {

color: #527bbd;

font-family: sans-serif;

margin-top: 1.2em;

margin-bottom: 0.5em;

line-height: 1.3;

}

h1 {

border-bottom: 2px solid silver;

}

h2 {

border-bottom: 2px solid silver;

padding-top: 0.5em;

}

div.sectionbody {

font-family: serif;

margin-left: 0;

}

hr {

border: 1px solid silver;

}

p {

margin-top: 0.5em;

margin-bottom: 0.5em;

}

pre {

padding: 0;

margin: 0;

}

span#author {

color: #527bbd;

font-family: sans-serif;

font-weight: bold;

font-size: 1.1em;

}

span#email {

}

span#revision {

font-family: sans-serif;

}

div#footer {

font-family: sans-serif;

font-size: small;

border-top: 2px solid silver;

padding-top: 0.5em;

margin-top: 4.0em;

}

div#footer-text {

float: left;

padding-bottom: 0.5em;

}

div#footer-badges {

float: right;

padding-bottom: 0.5em;

100

}

101

102

div#preamble,

103

div.tableblock, div.imageblock, div.exampleblock, div.verseblock,

104

div.quoteblock, div.literalblock, div.listingblock, div.sidebarblock,

105

div.admonitionblock {

106

margin-right: 10%;

107

margin-top: 1.5em;

108

margin-bottom: 1.5em;

109

}

110

div.admonitionblock {

111

margin-top: 2.5em;

112

margin-bottom: 2.5em;

113

}

114

115

div.content { /* Block element content. */

116

padding: 0;

117

}

118

119

/* Block element titles. */

120

div.title, caption.title {

121

font-family: sans-serif;

122

font-weight: bold;

123

text-align: left;

124

margin-top: 1.0em;

125

margin-bottom: 0.5em;

126

}

127

div.title + * {

128

margin-top: 0;

129

}

130

131

td div.title:first-child {

132

margin-top: 0.0em;

133

}

134

div.content div.title:first-child {

135

margin-top: 0.0em;

136

}

137

div.content + div.title {

138

margin-top: 0.0em;

139

}

140

141

div.sidebarblock > div.content {

142

background: #ffffee;

143

border: 1px solid silver;

144

padding: 0.5em;

145

}

146

147

div.listingblock {

148

margin-right: 0%;

149

}

150

div.listingblock > div.content {

151

border: 1px solid silver;

152

background: #f4f4f4;

153

padding: 0.5em;

154

}

155

156

div.quoteblock > div.content {

157

padding-left: 2.0em;

158

}

159

160

div.attribution {

161

text-align: right;

162

}

163

div.verseblock + div.attribution {

164

text-align: left;

165

}

166

167

div.admonitionblock .icon {

168

vertical-align: top;

169

font-size: 1.1em;

170

font-weight: bold;

171

text-decoration: underline;

172

color: #527bbd;

173

padding-right: 0.5em;

174

}

175

div.admonitionblock td.content {

176

padding-left: 0.5em;

177

border-left: 2px solid silver;

178

}

179

180

div.exampleblock > div.content {

181

border-left: 2px solid silver;

182

padding: 0.5em;

183

}

184

185

div.verseblock div.content {

186

white-space: pre;

187

}

188

189

div.imageblock div.content { padding-left: 0; }

190

div.imageblock img { border: 1px solid silver; }

191

span.image img { border-style: none; }

192

193

dl {

194

margin-top: 0.8em;

195

margin-bottom: 0.8em;

196

}

197

dt {

198

margin-top: 0.5em;

199

margin-bottom: 0;

200

font-style: italic;

201

}

202

dd > *:first-child {

203

margin-top: 0;

204

}

205

206

ul, ol {

207

list-style-position: outside;

208

}

209

ol.olist2 {

210

list-style-type: lower-alpha;

211

}

212

213

div.tableblock > table {

214

border: 3px solid #527bbd;

215

}

216

thead {

217

font-family: sans-serif;

218

font-weight: bold;

219

}

220

tfoot {

221

font-weight: bold;

222

}

223

224

div.hlist {

225

margin-top: 0.8em;

226

margin-bottom: 0.8em;

227

}

228

div.hlist td {

229

padding-bottom: 5px;

230

}

231

td.hlist1 {

232

vertical-align: top;

233

font-style: italic;

234

padding-right: 0.8em;

235

}

236

td.hlist2 {

237

vertical-align: top;

238

}

239

240

@media print {

241

div#footer-badges { display: none; }

242

}

243

244

div#toctitle {

245

color: #527bbd;

246

font-family: sans-serif;

247

font-size: 1.1em;

248

font-weight: bold;

249

margin-top: 1.0em;

250

margin-bottom: 0.1em;

251

}

252

253

div.toclevel1, div.toclevel2, div.toclevel3, div.toclevel4 {

254

margin-top: 0;

255

margin-bottom: 0;

256

}

257

div.toclevel2 {

258

margin-left: 2em;

259

font-size: 0.9em;

260

}

261

div.toclevel3 {

262

margin-left: 4em;

263

font-size: 0.9em;

264

}

265

div.toclevel4 {

266

margin-left: 6em;

267

font-size: 0.9em;

268

}

269

/* Workarounds for IE6's broken and incomplete CSS2. */

270

271

div.sidebar-content {

272

background: #ffffee;

273

border: 1px solid silver;

274

padding: 0.5em;

275

}

276

div.sidebar-title, div.image-title {

277

font-family: sans-serif;

278

font-weight: bold;

279

margin-top: 0.0em;

280

margin-bottom: 0.5em;

281

}

282

283

div.listingblock div.content {

284

border: 1px solid silver;

285

background: #f4f4f4;

286

padding: 0.5em;

287

}

288

289

div.quoteblock-content {

290

padding-left: 2.0em;

291

}

292

293

div.exampleblock-content {

294

border-left: 2px solid silver;

295

padding-left: 0.5em;

296

}

297

298

/* IE6 sets dynamically generated links as visited. */

299

div#toc a:visited { color: blue; }

300

</style>

301

<title>Multibyte character processing in SigScheme</title>

302

</head>

303

<body>

304

305

<h1>Multibyte character processing in SigScheme</h1>

306

</div>

307

<h2>1. Overview</h2>

308

309

<p>SigScheme's multibyte character handling interface is basically based on R6RS

310

Unicode character handlings. See also "R6RS conformance" section and

311

"Characters" subsection of "R5RS conformance" of <a href="spec.html">Specifications

312

of SigScheme</a>.</p>

313

<p>In addition to R6RS Unicode character handlings, SigScheme supports EUC-JP,

314

EUC-CN, EUC-KR and Shift_JIS character encoding schemes and they can be used

315

simultaneously. But no character encoding conversion method such as iconv is

316

provided at present.</p>

317

</div>

318

<h2>2. Current character codec</h2>

319

320

<p>On SigScheme, characters and strings are processed in accordance with the

321

parameter <strong>current character codec</strong>. Its initial value is specified by

322

<tt>--enable-default-encoding</tt> option of the configure script and defaults to

323

UTF-8. So characters and strings in SigScheme are treated as UTF-8 by default.</p>

324

<p>The value of current character codec can be checked by <tt>%%current-char-codec</tt>

325

procedure of SigScheme extension.</p>

326

327

328

<pre><tt>sscm> (require-extension (sscm-ext))

329

sscm> (%%current-char-codec)

330

"UTF-8"</tt></pre>

331

</div></div>

332

<p>To specify another encoding as default character codec, pass <tt>-C</tt> option to

333

<tt>sscm</tt> command as follows, or specify it in the second argument of

334

<tt>scm_initialize()</tt>.</p>

335

336

337

<pre><tt>$ sscm -C ISO-8859-1

338

$ sscm -C UTF-8

339

$ sscm -C EUC-JP

340

$ sscm -C EUC-CN

341

$ sscm -C EUC-KR

342

$ sscm -C Shift_JIS</tt></pre>

343

</div></div>

344

<p><tt>provided?</tt> predicate can be used to know whether an encoding is enabled by the

345

configuration or not.</p>

346

347

348

<pre><tt>(provided? "utf8")

349

(provided? "eucjp")

350

(provided? "euccn")

351

(provided? "euckr")

352

(provided? "sjis")</tt></pre>

353

</div></div>

354

<p>The <tt>ISO-8859-1</tt> encoding is used as generic singlebyte character encoding and

355

accepts any character represented in integer range 0-255, and always provided

356

regardless of configuration.</p>

357

<p>Use <tt>with-char-codec</tt> procedure to switch to another encoding temporarily.</p>

358

359

360

<pre><tt>(define euc-A (with-char-codec "EUC-JP" (lambda () (integer->char #xa4a2))))</tt></pre>

361

</div></div>

362

<p>See also "Ports" section of this document for current character codec switching

363

on I/O.</p>

364

</div>

365

<h2>3. Characters</h2>

366

367

<p>When the reader is working on a UTF-8 port:</p>

368

369

370

<pre><tt>#\あ ==> #\あ ;; U+3042 HIRAGANA LETTER A

371

#\x3042 ==> #\あ ;; U+3042 HIRAGANA LETTER A</tt></pre>

372

</div></div>

373

<p>Conversion between character and integer is performed based on the value of

374

<tt>%%current-char-codec</tt>. When <tt>%%current-char-codec</tt> is "UTF-8", integer value

375

of a Unicode character corresponds to the Unicode code point.</p>

376

<p>When <tt>%%current-char-codec</tt> is "UTF-8":</p>

377

378

379

<pre><tt>(integer->char #x3042) ==> #\あ ;; U+3042 HIRAGANA LETTER A

380

(char->integer #\あ) ==> 12354 ;; #x3042</tt></pre>

381

</div></div>

382

<p>If an integer value is invalid for the current codec, an error is caused.</p>

383

384

385

<pre><tt>(with-char-codec "UTF-8" (lambda () (integer->char #x3042))) ==> #\あ

386

(with-char-codec "ISO-8859-1" (lambda () (integer->char #x3042))) ==> error</tt></pre>

387

</div></div>

388

<p>Since a character in SigScheme is internally represented as an integer value

389

marked with character-object tag without any character encoding information,

390

user is responsible to manage the character encoding scheme of each character

391

object.</p>

392

<p>And no character encoding conversion is performed on integer<->char conversion

393

regardless of <tt>%%current-char-codec</tt>.</p>

394

395

396

<pre><tt>;; U+3042 HIRAGANA LETTER A in Unicode

397

(define ucs-A (with-char-codec "UTF-8" (lambda () (integer->char #x3042))))

398

399

;; HIRAGANA LETTER A in EUC-JP

400

(define eucjp-A (with-char-codec "EUC-JP" (lambda () (integer->char #xa4a2))))

401

402

(eqv? ucs-A eucjp-A) ==> #f

403

404

;; no conversion is performed

405

(with-char-codec "UTF-8"

406

(lambda () (char->integer eucjp-A))) ==> 42146 ;; U+A4A2 YI RADICAL ZUP</tt></pre>

407

</div></div>

408

</div>

409

<h2>4. Strings</h2>

410

411

<p>When both reader's port and <tt>%%current-char-codec</tt> are UTF-8:</p>

412

413

414

<pre><tt>"\x3042;a\x3044;" ==> "あaい"

415

(string->list "あaい") ==> (#\あ #\a #\い)

416

(string-length "あaい") ==> 3</tt></pre>

417

</div></div>

418

<p>A string in SigScheme is internally represented as a C string with its logical

419

character length without character encoding information. User is responsible to

420

manage the character encoding scheme of each string object. Though strings have

421

no encoding information, they have logical character length counted in

422

<tt>%%current-char-codec</tt> on its object creation. So processing a string in

423

another encoding such as UTF-8 string as byte string cannot fully be performed.</p>

424

425

426

<pre><tt>;; U+3042 HIRAGANA LETTER A, with string length 1 counted in UTF-8

427

(define utf8-A "あ")

428

429

;; string length is not re-counted even if %%current-char-codec is changed

430

(with-char-codec "UTF-8" (lambda () (string-length utf8-A))) ==> 1

431

(with-char-codec "ISO-8859-1" (lambda () (string-length utf8-A))) ==> 1

432

433

;; character reference of string is based on %%current-char-codec

434

(with-char-codec "UTF-8" (lambda () (string-ref utf8-A 0))) ==> #\あ

435

(with-char-codec "ISO-8859-1" (lambda () (string-ref utf8-A 0))) ==> #\ã

436

437

;; character reference that exceeds logical length is an error even if its

438

;; physical length is enough

439

(with-char-codec "UTF-8" (lambda () (string-ref utf8-A 1))) ==> error

440

(with-char-codec "ISO-8859-1" (lambda () (string-ref utf8-A 1))) ==> error</tt></pre>

441

</div></div>

442

</div>

443

<h2>5. Identifiers</h2>

444

445

<p>Any Unicode characters can be used as identifiers in Scheme as R6RS allows.</p>

446

447

448

<pre><tt>'Français-symbole

449

'日本語シンボル

450

(define ひらがな->カタカナ (lambda (イ . ロ) ...))</tt></pre>

451

</div></div>

452

<p>But since SigScheme's Unicode handling is incomplete, all non-ASCII Unicode

453

characters are treated as ordinary letters. Though it allows using any

454

whitespace characters and punctuations as identifier, it should not be done.</p>

455

<p>Non-ASCII identifier in SigScheme is only allowed for Unicode. In other words,

456

allowed only if the reading port is UTF-8. This limitation is intended to avoid

457

character identity problem between different character encodings. For example,

458

WAVE DASH and FULLWIDTH TILDE may be altered to another unexpectedly if the

459

source code is converted to/from non-Unicode Japanese encoding. Inhibiting

460

non-Unicode identifiers is the simplest way to avoid such problems.</p>

461

<p>To use Unicode identifiers, prepend the following line to the source code. See also

462

"Ports" section to understand its mechanism.</p>

463

464

465

466

</div></div>

467

</div>

468

<h2>6. Ports</h2>

469

470

<ul>

471

<li>

472

<p>

473

Each port is associated with a single character encoding when it is open

474

</p>

475

</li>

476

</ul>

477

478

479

<pre><tt>sscm> (current-input-port)

480

#<iport mb UTF-8 file stdin></tt></pre>

481

</div></div>

482

<ul>

483

<li>

484

<p>

485

The encoding of a port is not switched to another once it is open (NOTE: a C extension that operates on low level port can alter it)

486

</p>

487

</li>

488

<li>

489

<p>

490

The encoding of a port is determined by <tt>%%current-char-codec</tt> on its opening

491

</p>

492

</li>

493

</ul>

494

495

496

<pre><tt>$ sscm -C UTF-8

497

sscm> (%%current-char-codec)

498

"UTF-8"

499

500

sscm> (open-output-file "/tmp/sigscheme.tmp")

501

#<oport mb UTF-8 file /tmp/sigscheme.tmp>

502

503

sscm> (with-char-codec "ISO-8859-1"

504

(lambda () (open-output-file "/tmp/sigscheme.tmp")))

505

#<oport mb ISO-8859-1 file /tmp/sigscheme.tmp></tt></pre>

506

</div></div>

507

<ul>

508

<li>

509

<p>

510

<tt>%%current-char-codec</tt> does not affect already open ports

511

</p>

512

</li>

513

</ul>

514

515

516

<pre><tt>sscm> (current-input-port)

517

#<iport mb UTF-8 file stdin>

518

519

sscm> (with-char-codec "ISO-8859-1"

520

(lambda ()

521

(list (%%current-char-codec) (current-input-port))))

522

("ISO-8859-1" #<iport mb UTF-8 file stdin>)</tt></pre>

523

</div></div>

524

<ul>

525

<li>

526

<p>

527

Characters output to a port are encoded to a byte stream according to the port's own character encoding regardless of <tt>%%current-char-codec</tt> value

528

</p>

529

</li>

530

</ul>

531

532

533

<pre><tt>$ sscm -C ISO-8859-1

534

sscm> (current-output-port)

535

#<oport mb ISO-8859-1 file stdout>

536

537

sscm> (with-char-codec "UTF-8" (lambda () (write #\x3042)))

538

Error: ScmMultibyteCharPort: invalid character</tt></pre>

539

</div></div>

540

<p>To specify per-file character encoding, prepend the following line to the

541

file. The <tt>load</tt> procedure detects this line and temporarily switches

542

<tt>%%current-char-codec</tt> and the encoding of the reading port until it has read all

543

expressions from the file.</p>

544

545

546

547

</div></div>

548

</div>

549

550

551

Last updated 17-May-2008 12:45:34 JST

552

</div>

553

</div>

554

</body>

555

</html>

Older »