~ubuntu-branches/ubuntu/natty/diffutils/natty

« back to all changes in this revision

Viewing changes to lib/propername.c

Committer: Bazaar Package Importer
Author(s): Santiago Vila
Date: 2010-05-04 20:38:00 UTC
mfrom: (2.1.7 sid)
Revision ID: james.westby@ubuntu.com-20100504203800-f67xd9rsa9xl9qqj

Tags: 1:3.0-1

New upstream release.

files added:
.tarball-version

ChangeLog-2008

GNUmakefile

TODO

bootstrap

build-aux

build-aux/announce-gen

build-aux/arg-nonnull.h

build-aux/c++defs.h

build-aux/compile

build-aux/config.guess

build-aux/config.rpath

build-aux/config.sub

build-aux/depcomp

build-aux/do-release-commit-and-tag

build-aux/gendocs.sh

build-aux/git-version-gen

build-aux/gitlog-to-changelog

build-aux/gnu-web-doc-update

build-aux/gnupload

build-aux/install-sh

build-aux/mdate-sh

build-aux/missing

build-aux/mkinstalldirs

build-aux/texinfo.tex

build-aux/update-copyright

build-aux/useless-if-before-free

build-aux/vc-list-files

build-aux/warn-on-use.h

cfg.mk

debian/source

debian/source/format

dist-check.mk

gnulib-tests

gnulib-tests/Makefile.am

gnulib-tests/Makefile.in

gnulib-tests/argmatch.c

gnulib-tests/argmatch.h

gnulib-tests/binary-io.h

gnulib-tests/gnulib.mk

gnulib-tests/hash-pjw.c

gnulib-tests/hash-pjw.h

gnulib-tests/init.sh

gnulib-tests/locale

gnulib-tests/locale/fr

gnulib-tests/locale/fr/LC_MESSAGES

gnulib-tests/locale/fr/LC_MESSAGES/test-quotearg.mo

gnulib-tests/locale/fr/LC_MESSAGES/test-quotearg.po

gnulib-tests/macros.h

gnulib-tests/pathmax.h

gnulib-tests/putenv.c

gnulib-tests/same-inode.h

gnulib-tests/setenv.c

gnulib-tests/signature.h

gnulib-tests/sleep.c

gnulib-tests/symlink.c

gnulib-tests/test-alloca-opt.c

gnulib-tests/test-argmatch.c

gnulib-tests/test-binary-io.c

gnulib-tests/test-binary-io.sh

gnulib-tests/test-bitrotate.c

gnulib-tests/test-btowc.c

gnulib-tests/test-btowc1.sh

gnulib-tests/test-btowc2.sh

gnulib-tests/test-c-ctype.c

gnulib-tests/test-c-stack.c

gnulib-tests/test-c-stack.sh

gnulib-tests/test-c-stack2.sh

gnulib-tests/test-c-strcase.sh

gnulib-tests/test-c-strcasecmp.c

gnulib-tests/test-c-strncasecmp.c

gnulib-tests/test-dirname.c

gnulib-tests/test-dup2.c

gnulib-tests/test-environ.c

gnulib-tests/test-errno.c

gnulib-tests/test-exclude.c

gnulib-tests/test-exclude1.sh

gnulib-tests/test-exclude2.sh

gnulib-tests/test-exclude3.sh

gnulib-tests/test-exclude4.sh

gnulib-tests/test-exclude5.sh

gnulib-tests/test-exclude6.sh

gnulib-tests/test-exclude7.sh

gnulib-tests/test-fcntl-h.c

gnulib-tests/test-fcntl.c

gnulib-tests/test-fnmatch.c

gnulib-tests/test-freopen-safer.c

gnulib-tests/test-freopen.c

gnulib-tests/test-getdtablesize.c

gnulib-tests/test-getopt.c

gnulib-tests/test-getopt.h

gnulib-tests/test-getopt_long.h

gnulib-tests/test-gettimeofday.c

gnulib-tests/test-hash.c

gnulib-tests/test-iconv-h.c

gnulib-tests/test-iconv.c

gnulib-tests/test-inttypes.c

gnulib-tests/test-langinfo.c

gnulib-tests/test-lstat.c

gnulib-tests/test-lstat.h

gnulib-tests/test-malloca.c

gnulib-tests/test-mbrtowc.c

gnulib-tests/test-mbrtowc1.sh

gnulib-tests/test-mbrtowc2.sh

gnulib-tests/test-mbrtowc3.sh

gnulib-tests/test-mbrtowc4.sh

gnulib-tests/test-mbscasecmp.c

gnulib-tests/test-mbscasecmp.sh

gnulib-tests/test-mbsinit.c

gnulib-tests/test-mbsinit.sh

gnulib-tests/test-mbsrtowcs.c

gnulib-tests/test-mbsrtowcs1.sh

gnulib-tests/test-mbsrtowcs2.sh

gnulib-tests/test-mbsrtowcs3.sh

gnulib-tests/test-mbsrtowcs4.sh

gnulib-tests/test-mbsstr1.c

gnulib-tests/test-mbsstr2.c

gnulib-tests/test-mbsstr2.sh

gnulib-tests/test-mbsstr3.c

gnulib-tests/test-mbsstr3.sh

gnulib-tests/test-memchr.c

gnulib-tests/test-nl_langinfo.c

gnulib-tests/test-nl_langinfo.sh

gnulib-tests/test-open.c

gnulib-tests/test-open.h

gnulib-tests/test-quotearg.c

gnulib-tests/test-quotearg.sh

gnulib-tests/test-setenv.c

gnulib-tests/test-sigaction.c

gnulib-tests/test-signal.c

gnulib-tests/test-sleep.c

gnulib-tests/test-stat-time.c

gnulib-tests/test-stat.c

gnulib-tests/test-stat.h

gnulib-tests/test-stdbool.c

gnulib-tests/test-stddef.c

gnulib-tests/test-stdint.c

gnulib-tests/test-stdio.c

gnulib-tests/test-stdlib.c

gnulib-tests/test-strerror.c

gnulib-tests/test-striconv.c

gnulib-tests/test-string.c

gnulib-tests/test-strings.c

gnulib-tests/test-symlink.c

gnulib-tests/test-symlink.h

gnulib-tests/test-sys_stat.c

gnulib-tests/test-sys_time.c

gnulib-tests/test-sys_wait.c

gnulib-tests/test-time.c

gnulib-tests/test-unistd.c

gnulib-tests/test-unsetenv.c

gnulib-tests/test-update-copyright.sh

gnulib-tests/test-usleep.c

gnulib-tests/test-vc-list-files-cvs.sh

gnulib-tests/test-vc-list-files-git.sh

gnulib-tests/test-version-etc.c

gnulib-tests/test-version-etc.sh

gnulib-tests/test-wchar.c

gnulib-tests/test-wcrtomb.c

gnulib-tests/test-wcrtomb.sh

gnulib-tests/test-wctype.c

gnulib-tests/test-wcwidth.c

gnulib-tests/test-xalloc-die.c

gnulib-tests/test-xalloc-die.sh

gnulib-tests/test-xstrtol.c

gnulib-tests/test-xstrtol.sh

gnulib-tests/test-xstrtoul.c

gnulib-tests/test-xstrtoumax.c

gnulib-tests/test-xstrtoumax.sh

gnulib-tests/uniwidth

gnulib-tests/uniwidth/test-uc_width.c

gnulib-tests/uniwidth/test-uc_width2.c

gnulib-tests/uniwidth/test-uc_width2.sh

gnulib-tests/unsetenv.c

gnulib-tests/usleep.c

gnulib-tests/wctob.c

gnulib-tests/zerosize-ptr.h

lib/alloca.in.h

lib/basename-lgpl.c

lib/bitrotate.h

lib/btowc.c

lib/c-ctype.c

lib/c-ctype.h

lib/c-strcase.h

lib/c-strcasecmp.c

lib/c-strncasecmp.c

lib/config.charset

lib/config.hin

lib/diffseq.h

lib/dirname-lgpl.c

lib/dirname.c

lib/dup2.c

lib/errno.in.h

lib/fcntl.c

lib/fcntl.in.h

lib/file-type.c

lib/file-type.h

lib/fnmatch.in.h

lib/fnmatch_loop.c

lib/freopen-safer.c

lib/freopen.c

lib/getdtablesize.c

lib/getopt.in.h

lib/getopt_int.h

lib/gettime.c

lib/gettimeofday.c

lib/gnulib.mk

lib/hash.c

lib/hash.h

lib/iconv.in.h

lib/iconv_open-aix.gperf

lib/iconv_open-aix.h

lib/iconv_open-hpux.gperf

lib/iconv_open-hpux.h

lib/iconv_open-irix.gperf

lib/iconv_open-irix.h

lib/iconv_open-osf.gperf

lib/iconv_open-osf.h

lib/iconv_open-solaris.gperf

lib/iconv_open-solaris.h

lib/iconv_open.c

lib/ignore-value.h

lib/intprops.h

lib/inttypes.in.h

lib/langinfo.in.h

lib/localcharset.c

lib/localcharset.h

lib/lstat.c

lib/malloca.c

lib/malloca.h

lib/malloca.valgrind

lib/mbchar.c

lib/mbchar.h

lib/mbiter.h

lib/mbrlen.c

lib/mbrtowc.c

lib/mbscasecmp.c

lib/mbsinit.c

lib/mbslen.c

lib/mbsrtowcs-state.c

lib/mbsrtowcs.c

lib/mbsstr.c

lib/mbuiter.h

lib/memchr.valgrind

lib/mktime-internal.h

lib/mktime.c

lib/nl_langinfo.c

lib/open.c

lib/progname.c

lib/progname.h

lib/propername.c

lib/propername.h

lib/quote.c

lib/quote.h

lib/quotearg.c

lib/quotearg.h

lib/ref-add.sin

lib/ref-del.sin

lib/regcomp.c

lib/regex.h

lib/regex_internal.c

lib/regex_internal.h

lib/regexec.c

lib/sh-quote.c

lib/sh-quote.h

lib/sig-handler.h

lib/sigaction.c

lib/signal.in.h

lib/sigprocmask.c

lib/stat-macros.h

lib/stat-time.h

lib/stat.c

lib/stdarg.in.h

lib/stdbool.in.h

lib/stddef.in.h

lib/stdint.in.h

lib/stdio--.h

lib/stdio-safer.h

lib/stdio-write.c

lib/stdio.in.h

lib/stdlib.in.h

lib/str-kmp.h

lib/streq.h

lib/strerror.c

lib/strftime.h

lib/striconv.c

lib/striconv.h

lib/string.in.h

lib/strings.in.h

lib/stripslash.c

lib/strncasecmp.c

lib/strndup.c

lib/strnlen.c

lib/strnlen1.c

lib/strnlen1.h

lib/strptime.c

lib/strtoll.c

lib/sys_stat.in.h

lib/sys_time.in.h

lib/sys_wait.in.h

lib/tempname.h

lib/time.in.h

lib/time_r.c

lib/timegm.c

lib/timespec.h

lib/trim.c

lib/trim.h

lib/uinttostr.c

lib/unistd.in.h

lib/unitypes.h

lib/uniwidth

lib/uniwidth.h

lib/uniwidth/cjk.h

lib/uniwidth/width.c

lib/verify.h

lib/version-etc-fsf.c

lib/version-etc.c

lib/version-etc.h

lib/wchar.in.h

lib/wcrtomb.c

lib/wctype.in.h

lib/wcwidth.c

lib/xalloc-die.c

lib/xfreopen.c

lib/xfreopen.h

lib/xstriconv.c

lib/xstriconv.h

lib/xstrndup.c

lib/xstrndup.h

lib/xstrtol-error.c

lib/xstrtoul.c

m4/00gnulib.m4

m4/alloca.m4

m4/argmatch.m4

m4/btowc.m4

m4/clock_time.m4

m4/config-h.m4

m4/dirname.m4

m4/double-slash-root.m4

m4/dup2.m4

m4/eealloc.m4

m4/environ.m4

m4/errno_h.m4

m4/exclude.m4

m4/extensions.m4

m4/fcntl-o.m4

m4/fcntl.m4

m4/fcntl_h.m4

m4/file-type.m4

m4/freopen.m4

m4/getdtablesize.m4

m4/getopt.m4

m4/gettext_gl.m4

m4/gettime.m4

m4/gettimeofday.m4

m4/glibc21_gl.m4

m4/gnu-make.m4

m4/gnulib-common.m4

m4/gnulib-comp.m4

m4/hard-locale.m4

m4/hash.m4

m4/iconv_h.m4

m4/iconv_open.m4

m4/include_next.m4

m4/inline.m4

m4/intlmacosx.m4

m4/inttostr.m4

m4/inttypes-pri.m4

m4/langinfo_h.m4

m4/lib-ld_gl.m4

m4/lib-prefix_gl.m4

m4/libsigsegv.m4

m4/localcharset.m4

m4/locale-fr.m4

m4/locale-ja.m4

m4/locale-tr.m4

m4/locale-zh.m4

m4/longlong_gl.m4

m4/lstat.m4

m4/malloca.m4

m4/manywarnings.m4

m4/mbchar.m4

m4/mbiter.m4

m4/mbrlen.m4

m4/mbsinit.m4

m4/mbslen.m4

m4/mbsrtowcs.m4

m4/memchr.m4

m4/mkstemp.m4

m4/mktime.m4

m4/mmap-anon.m4

m4/mode_t.m4

m4/multiarch.m4

m4/nl_langinfo.m4

m4/nls.m4

m4/onceonly.m4

m4/open.m4

m4/pathmax.m4

m4/po_gl.m4

m4/putenv.m4

m4/quote.m4

m4/quotearg.m4

m4/setenv.m4

m4/sigaction.m4

m4/signal_h.m4

m4/signalblocking.m4

m4/sleep.m4

m4/ssize_t.m4

m4/stat-time.m4

m4/stat.m4

m4/stdarg.m4

m4/stddef_h.m4

m4/stdint.m4

m4/stdio-safer.m4

m4/stdio_h.m4

m4/stdlib_h.m4

m4/strcase.m4

m4/strerror.m4

m4/string_h.m4

m4/strings_h.m4

m4/strndup.m4

m4/strnlen.m4

m4/strptime.m4

m4/strtoimax.m4

m4/strtol.m4

m4/strtoll.m4

m4/strtoul.m4

m4/strtoull.m4

m4/strtoumax.m4

m4/symlink.m4

m4/sys_stat_h.m4

m4/sys_time_h.m4

m4/sys_wait_h.m4

m4/tempname.m4

m4/time_h.m4

m4/time_r.m4

m4/timegm.m4

m4/timespec.m4

m4/tm_gmtoff.m4

m4/unistd_h.m4

m4/unlocked-io.m4

m4/usleep.m4

m4/version-etc.m4

m4/warn-on-use.m4

m4/warnings.m4

m4/wchar_h.m4

m4/wchar_t.m4

m4/wcrtomb.m4

m4/wctob.m4

m4/wctype_h.m4

m4/wcwidth.m4

m4/wint_t.m4

m4/xalloc.m4

m4/xstrndup.m4

m4/xstrtol.m4

maint.mk

po/ca.gmo

po/ca.po

po/el.gmo

po/el.po

po/fi.gmo

po/fi.po

po/ga.gmo

po/ga.po

po/hu.gmo

po/hu.po

po/it.gmo

po/it.po

po/lv.gmo

po/lv.po

po/ms.gmo

po/ms.po

po/nl.gmo

po/nl.po

po/pt_BR.gmo

po/pt_BR.po

po/ro.gmo

po/ro.po

po/sr.gmo

po/sr.po

po/stamp-po

po/uk.gmo

po/uk.po

po/vi.gmo

po/vi.po

po/zh_CN.gmo

po/zh_CN.po

tests

tests/Makefile.am

tests/Makefile.in

tests/basic

tests/binary

tests/function-line-vs-leading-space

tests/help-version

tests/init.sh

tests/label-vs-func

tests/no-newline-at-eof

tests/stdin

tests/t-local.sh

files removed:
INSTALLME

config

config.hin

config/config.guess

config/config.rpath

config/config.sub

config/depcomp

config/install-sh

config/mdate-sh

config/missing

config/mkinstalldirs

config/texinfo.tex

lib/fnmatch.hin

lib/freesoft.c

lib/freesoft.h

lib/getopt.h

lib/posix

lib/posix/Makefile.am

lib/posix/Makefile.in

lib/posix/regex.h

lib/posixver.c

lib/posixver.h

lib/quotesys.c

lib/quotesys.h

lib/realloc.c

lib/regex.hin

lib/setmode.c

lib/setmode.h

lib/waitpid.c

m4/Makefile.am

m4/Makefile.am.in

m4/Makefile.in

m4/README

m4/c-bs-a.m4

m4/check-decl.m4

m4/gettext.m4

m4/glibc21.m4

m4/gnu-source.m4

m4/jm-glibc-io.m4

m4/lcmessage.m4

m4/lib-ld.m4

m4/lib-prefix.m4

m4/longlong.m4

m4/prereq.m4

m4/realloc.m4

m4/setmode.m4

m4/st_mtim.m4

m4/xstrtoumax.m4

po/en_GB.gmo

po/en_GB.po

src/version.c

files modified:
ABOUT-NLS

AUTHORS

COPYING

ChangeLog

INSTALL

Makefile.am

Makefile.in

NEWS

README

THANKS

aclocal.m4

configure

configure.ac

debian/changelog

debian/control

debian/copyright

debian/rules

debian/watch

exgettext

lib/Makefile.am

lib/Makefile.in

lib/alloca.c

lib/basename.c

lib/c-stack.c

lib/c-stack.h

lib/cmpbuf.c

lib/cmpbuf.h

lib/dirname.h

lib/error.c

lib/error.h

lib/exclude.c

lib/exclude.h

lib/exitfail.c

lib/exitfail.h

lib/fnmatch.c

lib/getopt.c

lib/getopt1.c

lib/gettext.h

lib/hard-locale.c

lib/hard-locale.h

lib/imaxtostr.c

lib/inttostr.c

lib/inttostr.h

lib/malloc.c

lib/memchr.c

lib/mkstemp.c

lib/offtostr.c

lib/prepargs.c

lib/regex.c

lib/strcasecmp.c

lib/strftime.c

lib/strtoimax.c

lib/strtol.c

lib/strtoul.c

lib/strtoull.c

lib/tempname.c

lib/umaxtostr.c

lib/unlocked-io.h

lib/xalloc.h

lib/xmalloc.c

lib/xstrtol.c

lib/xstrtol.h

lib/xstrtoumax.c

m4/c-stack.m4

m4/codeset.m4

m4/dos.m4

m4/error.m4

m4/fnmatch.m4

m4/iconv.m4

m4/inttypes.m4

m4/lib-link.m4

m4/malloc.m4

m4/mbrtowc.m4

m4/mbstate_t.m4

m4/progtest.m4

m4/regex.m4

m4/stdbool.m4

m4/strftime.m4

m4/vararrays.m4

man/Makefile.am

man/Makefile.in

man/cmp.1

man/diff.1

man/diff3.1

man/sdiff.1

ms/Makefile.am

ms/Makefile.in

ms/README

ms/config.bat

ms/config.sed

ms/config.site

po/LINGUAS

po/Makefile.in.in

po/Makevars

po/POTFILES.in

po/Rules-quot

po/cs.gmo

po/cs.po

po/da.gmo

po/da.po

po/de.gmo

po/de.po

po/diffutils.pot

po/eo.gmo

po/eo.po

po/es.gmo

po/es.po

po/fr.gmo

po/fr.po

po/gl.gmo

po/gl.po

po/he.gmo

po/he.po

po/id.gmo

po/id.po

po/ja.gmo

po/ja.po

po/pl.gmo

po/pl.po

po/ru.gmo

po/ru.po

po/sv.gmo

po/sv.po

po/tr.gmo

po/tr.po

po/zh_TW.gmo

po/zh_TW.po

src/Makefile.am

src/Makefile.in

src/analyze.c

src/cmp.c

src/context.c

src/diff.c

src/diff.h

src/diff3.c

src/dir.c

src/ed.c

src/ifdef.c

src/io.c

src/normal.c

src/sdiff.c

src/side.c

src/system.h

src/util.c

Show diffs side-by-side

added added

removed removed

lib/propername.c

/* Localization of proper names.

Written by Bruno Haible <bruno@clisp.org>, 2006.

This program is free software: you can redistribute it and/or modify

it under the terms of the GNU General Public License as published by

the Free Software Foundation; either version 3 of the License, or

(at your option) any later version.

This program is distributed in the hope that it will be useful,

but WITHOUT ANY WARRANTY; without even the implied warranty of

MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

GNU General Public License for more details.

You should have received a copy of the GNU General Public License

along with this program. If not, see <http://www.gnu.org/licenses/>. */

#include <config.h>

/* Specification. */

#include "propername.h"

#include <ctype.h>

#include <stdbool.h>

#include <stdio.h>

#include <stdlib.h>

#include <string.h>

#if HAVE_ICONV

# include <iconv.h>

#endif

#include "trim.h"

#include "mbchar.h"

#include "mbuiter.h"

#include "localcharset.h"

#include "c-strcase.h"

#include "xstriconv.h"

#include "xalloc.h"

#include "gettext.h"

/* Tests whether STRING contains trim (SUB), starting and ending at word
   boundaries.
   Here, instead of implementing Unicode Standard Annex #29 for determining
   word boundaries, we assume that trim (SUB) starts and ends with words and
   only test whether the part before it ends with a non-word and the part
   after it starts with a non-word.

   STRING is the text to search; SUB is the name to look for (it is trimmed
   before searching).  Returns true as soon as one occurrence of the trimmed
   SUB is found whose neighbouring characters, if any, are not alphanumeric;
   returns false if no such occurrence exists.  */
static bool
mbsstr_trimmed_wordbounded (const char *string, const char *sub)
{
  /* The trimmed copy is released with free () before returning.  */
  char *tsub = trim (sub);
  bool found = false;

  while (*string != '\0')
    {
      const char *tsub_in_string = mbsstr (string, tsub);
      if (tsub_in_string == NULL)
        break;

      if (MB_CUR_MAX > 1)
        {
          /* Multibyte locale: walk the string character by character.  */
          mbui_iterator_t string_iter;
          bool word_boundary_before;
          bool word_boundary_after;

          /* Find the character immediately preceding the match by
             iterating from STRING up to the match position.  */
          mbui_init (string_iter, string);
          word_boundary_before = true;
          if (mbui_cur_ptr (string_iter) < tsub_in_string)
            {
              mbchar_t last_char_before_tsub;
              do
                {
                  if (!mbui_avail (string_iter))
                    abort ();
                  last_char_before_tsub = mbui_cur (string_iter);
                  mbui_advance (string_iter);
                }
              while (mbui_cur_ptr (string_iter) < tsub_in_string);
              if (mb_isalnum (last_char_before_tsub))
                word_boundary_before = false;
            }

          /* Step over the match: advance STRING_ITER once for every
             character of TSUB, so that it ends up just after the match.  */
          mbui_init (string_iter, tsub_in_string);
          {
            mbui_iterator_t tsub_iter;

            for (mbui_init (tsub_iter, tsub);
                 mbui_avail (tsub_iter);
                 mbui_advance (tsub_iter))
              {
                if (!mbui_avail (string_iter))
                  abort ();
                mbui_advance (string_iter);
              }
          }
          word_boundary_after = true;
          if (mbui_avail (string_iter))
            {
              mbchar_t first_char_after_tsub = mbui_cur (string_iter);
              if (mb_isalnum (first_char_after_tsub))
                word_boundary_after = false;
            }

          if (word_boundary_before && word_boundary_after)
            {
              found = true;
              break;
            }

          /* Not word-bounded here: resume the search one character past
             the start of this match.  */
          mbui_init (string_iter, tsub_in_string);
          if (!mbui_avail (string_iter))
            break;
          string = tsub_in_string + mb_len (mbui_cur (string_iter));
        }
      else
        {
          /* Single-byte locale: plain byte inspection suffices.  */
          bool word_boundary_before;
          const char *p;
          bool word_boundary_after;

          word_boundary_before = true;
          if (string < tsub_in_string)
            if (isalnum ((unsigned char) tsub_in_string[-1]))
              word_boundary_before = false;

          p = tsub_in_string + strlen (tsub);
          word_boundary_after = true;
          if (*p != '\0')
            if (isalnum ((unsigned char) *p))
              word_boundary_after = false;

          if (word_boundary_before && word_boundary_after)
            {
              found = true;
              break;
            }

          /* Not word-bounded here: resume the search one byte past the
             start of this match.  */
          if (*tsub_in_string == '\0')
            break;
          string = tsub_in_string + 1;
        }
    }

  free (tsub);
  return found;
}

148

149

/* Return the localization of NAME. NAME is written in ASCII. */

150

151

const char *

152

proper_name (const char *name)

153

{

154

/* See whether there is a translation. */

155

const char *translation = gettext (name);

156

157

if (translation != name)

158

{

159

/* See whether the translation contains the original name. */

160

if (mbsstr_trimmed_wordbounded (translation, name))

161

return translation;

162

else

163

{

164

/* Return "TRANSLATION (NAME)". */

165

char *result =

166

XNMALLOC (strlen (translation) + 2 + strlen (name) + 1 + 1, char);

167

168

sprintf (result, "%s (%s)", translation, name);

169

return result;

170

}

171

}

172

else

173

return name;

174

}

175

176

/* Return the localization of a name whose original writing is not ASCII.

177

NAME_UTF8 is the real name, written in UTF-8 with octal or hexadecimal

178

escape sequences. NAME_ASCII is a fallback written only with ASCII

179

characters. */

180

181

const char *

182

proper_name_utf8 (const char *name_ascii, const char *name_utf8)

183

{

184

/* See whether there is a translation. */

185

const char *translation = gettext (name_ascii);

186

187

/* Try to convert NAME_UTF8 to the locale encoding. */

188

const char *locale_code = locale_charset ();

189

char *alloc_name_converted = NULL;

190

char *alloc_name_converted_translit = NULL;

191

const char *name_converted = NULL;

192

const char *name_converted_translit = NULL;

193

const char *name;

194

195

if (c_strcasecmp (locale_code, "UTF-8") != 0)

196

{

197

#if HAVE_ICONV

198

name_converted = alloc_name_converted =

199

xstr_iconv (name_utf8, "UTF-8", locale_code);

200

201

# if (__GLIBC__ == 2 && __GLIBC_MINOR__ >= 2) || __GLIBC__ > 2 \

202

|| _LIBICONV_VERSION >= 0x0105

203

{

204

char *converted_translit;

205

206

size_t len = strlen (locale_code);

207

char *locale_code_translit = XNMALLOC (len + 10 + 1, char);

208

memcpy (locale_code_translit, locale_code, len);

209

memcpy (locale_code_translit + len, "//TRANSLIT", 10 + 1);

210

211

converted_translit =

212

xstr_iconv (name_utf8, "UTF-8", locale_code_translit);

213

214

free (locale_code_translit);

215

216

if (converted_translit != NULL)

217

{

218

# if !_LIBICONV_VERSION

219

/* Don't use the transliteration if it added question marks.

220

glibc's transliteration falls back to question marks; libiconv's

221

transliteration does not.

222

mbschr is equivalent to strchr in this case. */

223

if (strchr (converted_translit, '?') != NULL)

224

free (converted_translit);

225

else

226

# endif

227

name_converted_translit = alloc_name_converted_translit =

228

converted_translit;

229

}

230

}

231

# endif

232

#endif

233

}

234

else

235

{

236

name_converted = name_utf8;

237

name_converted_translit = name_utf8;

238

}

239

240

/* The name in locale encoding. */

241

name = (name_converted != NULL ? name_converted :

242

name_converted_translit != NULL ? name_converted_translit :

243

name_ascii);

244

245

/* See whether we have a translation. Some translators have not understood

246

that they should use the UTF-8 form of the name, if possible. So if the

247

translator provided a no-op translation, we ignore it. */

248

if (strcmp (translation, name_ascii) != 0)

249

{

250

/* See whether the translation contains the original name. */

251

if (mbsstr_trimmed_wordbounded (translation, name_ascii)

252

|| (name_converted != NULL

253

&& mbsstr_trimmed_wordbounded (translation, name_converted))

254

|| (name_converted_translit != NULL

255

&& mbsstr_trimmed_wordbounded (translation, name_converted_translit)))

256

{

257

if (alloc_name_converted != NULL)

258

free (alloc_name_converted);

259

if (alloc_name_converted_translit != NULL)

260

free (alloc_name_converted_translit);

261

return translation;

262

}

263

else

264

{

265

/* Return "TRANSLATION (NAME)". */

266

char *result =

267

XNMALLOC (strlen (translation) + 2 + strlen (name) + 1 + 1, char);

268

269

sprintf (result, "%s (%s)", translation, name);

270

271

if (alloc_name_converted != NULL)

272

free (alloc_name_converted);

273

if (alloc_name_converted_translit != NULL)

274

free (alloc_name_converted_translit);

275

return result;

276

}

277

}

278

else

279

{

280

if (alloc_name_converted != NULL && alloc_name_converted != name)

281

free (alloc_name_converted);

282

if (alloc_name_converted_translit != NULL

283

&& alloc_name_converted_translit != name)

284

free (alloc_name_converted_translit);

285

return name;

286

}

287

}


#ifdef TEST1
# include <locale.h>
/* Manual test driver for mbsstr_trimmed_wordbounded: prints "found" when
   argv[2] (after trimming) occurs in argv[1] at word boundaries.
   Exits with status 1 if fewer than two arguments are given.  */
int
main (int argc, char *argv[])
{
  /* Guard against reading argv[1]/argv[2] when they were not supplied.  */
  if (argc < 3)
    {
      fprintf (stderr, "usage: %s STRING SUB\n",
               argc > 0 ? argv[0] : "propername");
      return 1;
    }
  setlocale (LC_ALL, "");
  if (mbsstr_trimmed_wordbounded (argv[1], argv[2]))
    printf("found\n");
  return 0;
}
#endif


#ifdef TEST2
# include <locale.h>
# include <stdio.h>
/* Manual test driver for proper_name_utf8: prints the localized form of a
   fixed sample name, followed by a newline.  */
int
main (int argc, char *argv[])
{
  setlocale (LC_ALL, "");
  printf ("%s\n", proper_name_utf8 ("Franc,ois Pinard", "Fran\303\247ois Pinard"));
  return 0;
}
#endif

Older »