bug-gnulib
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

charset conversion functions for Unicode strings


From: Bruno Haible
Subject: charset conversion functions for Unicode strings
Date: Sat, 27 Jan 2007 01:38:16 +0100 (MET)
User-agent: KMail/1.5.4

Here comes the second part of the Unicode string library: charset conversion.
It is all built on the striconveha module.

2007-01-26  Bruno Haible  <address@hidden>

        * MODULES.html.sh (Unicode string functions): Add the new modules.

        * modules/uniconv/u32-strconv-to-locale: New file.
        * lib/uniconv/u32-strconv-to-locale.c: New file.

        * modules/uniconv/u16-strconv-to-locale: New file.
        * lib/uniconv/u16-strconv-to-locale.c: New file.

        * modules/uniconv/u8-strconv-to-locale: New file.
        * lib/uniconv/u8-strconv-to-locale.c: New file.

        * modules/uniconv/u32-strconv-from-locale: New file.
        * lib/uniconv/u32-strconv-from-locale.c: New file.

        * modules/uniconv/u16-strconv-from-locale: New file.
        * lib/uniconv/u16-strconv-from-locale.c: New file.

        * modules/uniconv/u8-strconv-from-locale: New file.
        * lib/uniconv/u8-strconv-from-locale.c: New file.

        * modules/uniconv/u32-strconv-to-enc: New file.
        * lib/uniconv/u32-strconv-to-enc.c: New file.
        * modules/uniconv/u32-strconv-to-enc-tests: New file.
        * tests/uniconv/test-u32-strconv-to-enc.c: New file.

        * modules/uniconv/u16-strconv-to-enc: New file.
        * lib/uniconv/u16-strconv-to-enc.c: New file.
        * lib/uniconv/u-strconv-to-enc.h: New file.
        * modules/uniconv/u16-strconv-to-enc-tests: New file.
        * tests/uniconv/test-u16-strconv-to-enc.c: New file.

        * modules/uniconv/u8-strconv-to-enc: New file.
        * lib/uniconv/u8-strconv-to-enc.c: New file.
        * modules/uniconv/u8-strconv-to-enc-tests: New file.
        * tests/uniconv/test-u8-strconv-to-enc.c: New file.

        * modules/uniconv/u32-strconv-from-enc: New file.
        * lib/uniconv/u32-strconv-from-enc.c: New file.
        * modules/uniconv/u32-strconv-from-enc-tests: New file.
        * tests/uniconv/test-u32-strconv-from-enc.c: New file.

        * modules/uniconv/u16-strconv-from-enc: New file.
        * lib/uniconv/u16-strconv-from-enc.c: New file.
        * modules/uniconv/u16-strconv-from-enc-tests: New file.
        * tests/uniconv/test-u16-strconv-from-enc.c: New file.

        * modules/uniconv/u8-strconv-from-enc: New file.
        * lib/uniconv/u8-strconv-from-enc.c: New file.
        * lib/uniconv/u-strconv-from-enc.h: New file.
        * modules/uniconv/u8-strconv-from-enc-tests: New file.
        * tests/uniconv/test-u8-strconv-from-enc.c: New file.

        * modules/uniconv/u32-conv-from-enc: New file.
        * lib/uniconv/u32-conv-from-enc.c: New file.
        * modules/uniconv/u32-conv-from-enc-tests: New file.
        * tests/uniconv/test-u32-conv-from-enc.c: New file.

        * modules/uniconv/u16-conv-from-enc: New file.
        * lib/uniconv/u16-conv-from-enc.c: New file.
        * lib/uniconv/u-conv-from-enc.h: New file.
        * modules/uniconv/u16-conv-from-enc-tests: New file.
        * tests/uniconv/test-u16-conv-from-enc.c: New file.

        * modules/uniconv/u8-conv-from-enc: New file.
        * lib/uniconv/u8-conv-from-enc.c: New file.
        * modules/uniconv/u8-conv-from-enc-tests: New file.
        * tests/uniconv/test-u8-conv-from-enc.c: New file.

        * modules/uniconv/base: New file.
        * lib/uniconv.h: New file.

=========================== lib/uniconv.h ===================================
/* Conversions between Unicode and legacy encodings.
   Copyright (C) 2002, 2005, 2007 Free Software Foundation, Inc.

   This program is free software; you can redistribute it and/or modify it
   under the terms of the GNU Library General Public License as published
   by the Free Software Foundation; either version 2, or (at your option)
   any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Library General Public License for more details.

   You should have received a copy of the GNU Library General Public
   License along with this program; if not, write to the Free Software
   Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301,
   USA.  */

#ifndef _UNICONV_H
#define _UNICONV_H

/* Get size_t.  */
#include <stddef.h>

#include "unitypes.h"

/* Get enum iconv_ilseq_handler.  */
#include "striconveh.h"

/* Get iconv_register_autodetect(), mem_iconveha() declaration.  */
#include "striconveha.h"

/* Get locale_charset() declaration.  */
#include "localcharset.h"


#ifdef __cplusplus
extern "C" {
#endif


/* Converts an entire string, possibly including NUL bytes, from one encoding
   to a Unicode encoding.
   Converts a memory region given in encoding FROMCODE.  FROMCODE is as for
   iconv_open(3).
   The input is in the memory region between SRC (inclusive) and SRC + SRCLEN
   (exclusive).
   If OFFSETS is not NULL, it should point to an array of SRCLEN integers; this
   array is filled with offsets into the result, i.e. the character starting
   at SRC[i] corresponds to the character starting at (*RESULTP)[OFFSETS[i]],
   and other offsets are set to (size_t)(-1).
   *RESULTP and *LENGTH should initially be a scratch buffer and its size,
   or *RESULTP can initially be NULL.
   May erase the contents of the memory at *RESULTP.
   Return value: 0 if successful, otherwise -1 and errno set.
   If successful: The resulting string is stored in *RESULTP and its length
   in *LENGTHP.  *RESULTP is set to a freshly allocated memory block, or is
   unchanged if no dynamic memory allocation was necessary.
   Particular errno values: EINVAL, EILSEQ, ENOMEM.  */
extern int
       u8_conv_from_encoding (const char *fromcode,
                              enum iconv_ilseq_handler handler,
                              const char *src, size_t srclen,
                              size_t *offsets,
                              uint8_t **resultp, size_t *lengthp);
extern int
       u16_conv_from_encoding (const char *fromcode,
                               enum iconv_ilseq_handler handler,
                               const char *src, size_t srclen,
                               size_t *offsets,
                               uint16_t **resultp, size_t *lengthp);
extern int
       u32_conv_from_encoding (const char *fromcode,
                               enum iconv_ilseq_handler handler,
                               const char *src, size_t srclen,
                               size_t *offsets,
                               uint32_t **resultp, size_t *lengthp);

/* Converts a NUL terminated string from a given encoding.
   The result is malloc allocated, or NULL (with errno set) in case of error.
   Particular errno values: EILSEQ, ENOMEM.  */
extern uint8_t *
       u8_strconv_from_encoding (const char *string,
                                 const char *fromcode,
                                 enum iconv_ilseq_handler handler);
extern uint16_t *
       u16_strconv_from_encoding (const char *string,
                                  const char *fromcode,
                                  enum iconv_ilseq_handler handler);
extern uint32_t *
       u32_strconv_from_encoding (const char *string,
                                  const char *fromcode,
                                  enum iconv_ilseq_handler handler);

/* Converts a NUL terminated string to a given encoding.
   The result is malloc allocated, or NULL (with errno set) in case of error.
   Particular errno values: EILSEQ, ENOMEM.  */
extern char *
       u8_strconv_to_encoding (const uint8_t *string,
                               const char *tocode,
                               enum iconv_ilseq_handler handler);
extern char *
       u16_strconv_to_encoding (const uint16_t *string,
                                const char *tocode,
                                enum iconv_ilseq_handler handler);
extern char *
       u32_strconv_to_encoding (const uint32_t *string,
                                const char *tocode,
                                enum iconv_ilseq_handler handler);

/* Converts a NUL terminated string from the locale encoding.
   The result is malloc allocated, or NULL (with errno set) in case of error.
   Particular errno values: ENOMEM.  */
extern uint8_t *
       u8_strconv_from_locale (const char *string);
extern uint16_t *
       u16_strconv_from_locale (const char *string);
extern uint32_t *
       u32_strconv_from_locale (const char *string);

/* Converts a NUL terminated string to the locale encoding.
   The result is malloc allocated, or NULL (with errno set) in case of error.
   Particular errno values: ENOMEM.  */
extern char *
       u8_strconv_to_locale (const uint8_t *string);
extern char *
       u16_strconv_to_locale (const uint16_t *string);
extern char *
       u32_strconv_to_locale (const uint32_t *string);


#ifdef __cplusplus
}
#endif

#endif /* _UNICONV_H */





reply via email to

[Prev in Thread] Current Thread [Next in Thread]