summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorJim Meyering <jim@meyering.net>2000-03-01 13:22:35 +0000
committerJim Meyering <jim@meyering.net>2000-03-01 13:22:35 +0000
commitce4a63537c342d516c9402ff71ac2922193e136f (patch)
tree4e425d2b8516f5ab14445f6a69b983824f3cbe42
parent578156186de2da21b4a48a652c2d17a3d23dfc32 (diff)
downloadcoreutils-ce4a63537c342d516c9402ff71ac2922193e136f.tar.xz
New file from Bruno.
One portability tweak: guard inclusion of stddef.h.
-rw-r--r--lib/unicodeio.c121
1 files changed, 121 insertions, 0 deletions
diff --git a/lib/unicodeio.c b/lib/unicodeio.c
new file mode 100644
index 000000000..8e0b2d8f1
--- /dev/null
+++ b/lib/unicodeio.c
@@ -0,0 +1,121 @@
+/* Unicode character output to streams with locale dependent encoding.
+
+ Copyright (C) 2000 Free Software Foundation, Inc.
+
+ This program is free software; you can redistribute it and/or modify it
+ under the terms of the GNU Library General Public License as published
+ by the Free Software Foundation; either version 2, or (at your option)
+ any later version.
+
+ This program is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Library General Public License for more details.
+
+ You should have received a copy of the GNU Library General Public
+ License along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307,
+ USA. */
+
+/* Written by Bruno Haible <haible@clisp.cons.org>. */
+
+#ifdef HAVE_CONFIG_H
+# include <config.h>
+#endif
+
+#if HAVE_STDDEF_H
+# include <stddef.h>
+#endif
+
+#include <stdio.h>
+
+#if HAVE_ICONV
+# include <iconv.h>
+/* Name of UCS-4 encoding with machine dependent endianness and alignment. */
+# ifdef _LIBICONV_VERSION
+# define UCS4_NAME "UCS-4-INTERNAL"
+# else
+# define UCS4_NAME "INTERNAL"
+# endif
+#endif
+
+#include <error.h>
+
+#if ENABLE_NLS
+# include <libintl.h>
+# define _(Text) gettext (Text)
+#else
+# define _(Text) Text
+#endif
+
+#include "unicodeio.h"
+
+/* Use md5.h for its nice detection of unsigned 32-bit type. */
+#include "md5.h"
+#undef uint32_t
+#define uint32_t md5_uint32
+
+/* Outputs the Unicode character CODE to the output stream STREAM.
+ Assumes that the locale doesn't change between two calls. */
+void
+print_unicode_char (FILE *stream, unsigned int code)
+{
+#if HAVE_ICONV
+ static int initialized;
+ static iconv_t ucs4_to_local;
+
+ uint32_t in;
+ char outbuf[25];
+ const char *inptr;
+ size_t inbytesleft;
+ char *outptr;
+ size_t outbytesleft;
+ size_t res;
+
+ if (!initialized)
+ {
+ extern const char *locale_charset (void);
+ const char *charset = locale_charset ();
+
+ ucs4_to_local = (charset != NULL
+ ? iconv_open (charset, UCS4_NAME)
+ : (iconv_t)(-1));
+ if (ucs4_to_local == (iconv_t)(-1))
+ {
+ /* For an unknown encoding, assume ASCII. */
+ ucs4_to_local = iconv_open ("ASCII", UCS4_NAME);
+ if (ucs4_to_local == (iconv_t)(-1))
+ error (1, 0, _("cannot output U+%04X: iconv function not usable"),
+ code);
+ }
+ initialized = 1;
+ }
+
+ in = code;
+ inptr = (char *) &in;
+ inbytesleft = sizeof (in);
+ outptr = outbuf;
+ outbytesleft = sizeof (outbuf);
+
+ /* Convert the character. */
+ res = iconv (ucs4_to_local, &inptr, &inbytesleft, &outptr, &outbytesleft);
+ if (inbytesleft > 0 || res == (size_t)(-1))
+ error (1, res == (size_t)(-1) ? errno : 0,
+ _("cannot convert U+%04X to local character set"), code);
+
+ /* Avoid glibc-2.1 bug. */
+# if defined _LIBICONV_VERSION || !(__GLIBC__ - 0 == 2 && __GLIBC_MINOR__ - 0 <= 1)
+
+ /* Get back to the initial shift state. */
+ res = iconv (ucs4_to_local, NULL, NULL, &outptr, &outbytesleft);
+ if (res == (size_t)(-1))
+ error (1, errno, _("cannot convert U+%04X to local character set"), code);
+
+# endif
+
+ fwrite (outbuf, 1, outptr - outbuf, stream);
+
+#else
+ error (1, 0, _("cannot output U+%04X: iconv function not available"), code);
+#endif
+}