/* -*- Mode: C; tab-width: 8; indent-tabs-mode: t; c-basic-offset: 8 -*- */
/* GMime
* Copyright (C) 2000-2007 Jeffrey Stedfast
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
*/
#ifdef HAVE_CONFIG_H
#include <config.h>
#endif
#include <stdio.h>
#include <string.h>
#include <errno.h>
#include "gmime-iconv-utils.h"
#include "gmime-charset.h"
#ifdef ENABLE_WARNINGS
#define w(x) x
#else
#define w(x)
#endif /* ENABLE_WARNINGS */
#ifdef G_THREADS_ENABLED
static GStaticMutex lock = G_STATIC_MUTEX_INIT;
#define LOCK() g_static_mutex_lock (&lock)
#define UNLOCK() g_static_mutex_unlock (&lock)
#else
#define LOCK()
#define UNLOCK()
#endif /* G_THREADS_ENABLED */
static iconv_t utf8_to_locale;
static iconv_t locale_to_utf8;
static void
iconv_utils_init (void)
{
static gboolean initialized = FALSE;
const char *utf8, *locale;
if (initialized)
return;
g_mime_charset_map_init ();
utf8 = g_mime_charset_iconv_name ("utf-8");
locale = g_mime_charset_iconv_name (g_mime_locale_charset ());
utf8_to_locale = iconv_open (locale, utf8);
locale_to_utf8 = iconv_open (utf8, locale);
initialized = TRUE;
}
/**
* g_mime_iconv_strndup:
* @cd: conversion descriptor
* @string: string in source charset
* @n: number of bytes to convert
*
* Allocates a new string buffer containing the first @n bytes of
* @string converted to the destination charset as described by the
* conversion descriptor @cd.
*
* Returns a new string buffer containing the first @n bytes of
* @string converted to the destination charset as described by the
* conversion descriptor @cd.
**/
char *
g_mime_iconv_strndup (iconv_t cd, const char *string, size_t n)
{
size_t inleft, outleft, converted = 0;
char *out, *outbuf;
const char *inbuf;
size_t outlen;
if (cd == (iconv_t) -1)
return g_strndup (string, n);
outlen = n * 2 + 16;
out = g_malloc (outlen + 4);
inbuf = string;
inleft = n;
do {
errno = 0;
outbuf = out + converted;
outleft = outlen - converted;
converted = iconv (cd, (char **) &inbuf, &inleft, &outbuf, &outleft);
if (converted == (size_t) -1) {
if (errno != E2BIG && errno != EINVAL)
goto fail;
}
/*
* E2BIG There is not sufficient room at *outbuf.
*
* We just need to grow our outbuffer and try again.
*/
converted = outbuf - out;
if (errno == E2BIG) {
outlen += inleft * 2 + 16;
out = g_realloc (out, outlen + 4);
outbuf = out + converted;
}
} while (errno == E2BIG && inleft > 0);
/*
* EINVAL An incomplete multibyte sequence has been encoun
* tered in the input.
*
* We'll just have to ignore it...
*/
/* flush the iconv conversion */
iconv (cd, NULL, NULL, &outbuf, &outleft);
/* Note: not all charsets can be nul-terminated with a single
nul byte. UCS2, for example, needs 2 nul bytes and UCS4
needs 4. I hope that 4 nul bytes is enough to terminate all
multibyte charsets? */
/* nul-terminate the string */
memset (outbuf, 0, 4);
/* reset the cd */
iconv (cd, NULL, NULL, NULL, NULL);
return out;
fail:
w(g_warning ("g_mime_iconv_strndup: %s", strerror (errno)));
g_free (out);
/* reset the cd */
iconv (cd, NULL, NULL, NULL, NULL);
return NULL;
}
/**
* g_mime_iconv_strdup:
* @cd: conversion descriptor
* @string: string in source charset
*
* Allocates a new string buffer containing @string converted to
* the destination charset described in @cd.
*
* Returns a new string buffer containing the original string
* converted to the new charset.
**/
char *
g_mime_iconv_strdup (iconv_t cd, const char *string)
{
return g_mime_iconv_strndup (cd, string, strlen (string));
}
/**
* g_mime_iconv_locale_to_utf8:
* @string: string in locale charset
*
* Allocates a new string buffer containing @string in UTF-8.
*
* Returns a new string buffer containing @string converted to UTF-8.
**/
char *
g_mime_iconv_locale_to_utf8 (const char *string)
{
char *buf;
LOCK ();
iconv_utils_init ();
buf = g_mime_iconv_strdup (locale_to_utf8, string);
UNLOCK ();
return buf;
}
/**
* g_mime_iconv_locale_to_utf8_length:
* @string: string in locale charset
* @n: number of bytes to convert
*
* Allocates a new string buffer containing the first @n bytes of
* @string converted to UTF-8.
*
* Returns a new string buffer containing the first @n bytes of
* @string converted to UTF-8.
**/
char *
g_mime_iconv_locale_to_utf8_length (const char *string, size_t n)
{
char *buf;
LOCK ();
iconv_utils_init ();
buf = g_mime_iconv_strndup (locale_to_utf8, string, n);
UNLOCK ();
return buf;
}
/**
* g_mime_iconv_utf8_to_locale:
* @string: string in UTF-8 charset
*
* Allocates a new string buffer containing @string converted to the
* user's locale charset.
*
* Returns a new string buffer containing @string converted to the
* user's locale charset.
**/
char *
g_mime_iconv_utf8_to_locale (const char *string)
{
char *buf;
LOCK ();
iconv_utils_init ();
buf = g_mime_iconv_strdup (utf8_to_locale, string);
UNLOCK ();
return buf;
}
/**
* g_mime_iconv_utf8_to_locale_length:
* @string: string in UTF-8 charset
* @n: number of bytes to convert
*
* Allocates a new string buffer containing the first @n bytes of
* @string converted to the user's locale charset.
*
* Returns a new string buffer containing the first @n bytes of
* @string converted to the user's locale charset.
**/
char *
g_mime_iconv_utf8_to_locale_length (const char *string, size_t n)
{
char *buf;
LOCK ();
iconv_utils_init ();
buf = g_mime_iconv_strndup (utf8_to_locale, string, n);
UNLOCK ();
return buf;
}
syntax highlighted by Code2HTML, v. 0.9.1