1 /* Character set conversion with error handling and autodetection. 2 Copyright (C) 2002, 2005, 2007-2021 Free Software Foundation, Inc. 3 Written by Bruno Haible. 4 5 This file is free software: you can redistribute it and/or modify 6 it under the terms of the GNU Lesser General Public License as 7 published by the Free Software Foundation; either version 2.1 of the 8 License, or (at your option) any later version. 9 10 This file is distributed in the hope that it will be useful, 11 but WITHOUT ANY WARRANTY; without even the implied warranty of 12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 13 GNU Lesser General Public License for more details. 14 15 You should have received a copy of the GNU Lesser General Public License 16 along with this program. If not, see <https://www.gnu.org/licenses/>. */ 17 18 #ifndef _STRICONVEHA_H 19 #define _STRICONVEHA_H 20 21 #include <stdbool.h> 22 #include <stdlib.h> 23 24 #include "iconveh.h" 25 26 27 #ifdef __cplusplus 28 extern "C" { 29 #endif 30 31 32 /* Convert an entire string from one encoding to another, using iconv. 33 The original string is at [SRC,...,SRC+SRCLEN-1]. 34 The "from" encoding can also be a name defined for autodetection. 35 If TRANSLITERATE is true, transliteration will attempted to avoid conversion 36 errors, for iconv implementations that support this. Usually you'll choose 37 TRANSLITERATE = true if HANDLER != iconveh_error. 38 If OFFSETS is not NULL, it should point to an array of SRCLEN integers; this 39 array is filled with offsets into the result, i.e. the character starting 40 at SRC[i] corresponds to the character starting at (*RESULTP)[OFFSETS[i]], 41 and other offsets are set to (size_t)(-1). 42 *RESULTP and *LENGTH should initially be a scratch buffer and its size, 43 or *RESULTP can initially be NULL. 44 May erase the contents of the memory at *RESULTP. 45 Return value: 0 if successful, otherwise -1 and errno set. 46 If successful: The resulting string is stored in *RESULTP and its length 47 in *LENGTHP. *RESULTP is set to a freshly allocated memory block, or is 48 unchanged if no dynamic memory allocation was necessary. */ 49 extern int 50 mem_iconveha (const char *src, size_t srclen, 51 const char *from_codeset, const char *to_codeset, 52 bool transliterate, 53 enum iconv_ilseq_handler handler, 54 size_t *offsets, 55 char **resultp, size_t *lengthp); 56 57 /* Convert an entire string from one encoding to another, using iconv. 58 The original string is the NUL-terminated string starting at SRC. 59 Both the "from" and the "to" encoding must use a single NUL byte at the 60 end of the string (i.e. not UCS-2, UCS-4, UTF-16, UTF-32). 61 The "from" encoding can also be a name defined for autodetection. 62 If TRANSLITERATE is true, transliteration will attempted to avoid conversion 63 errors, for iconv implementations that support this. Usually you'll choose 64 TRANSLITERATE = true if HANDLER != iconveh_error. 65 Allocate a malloced memory block for the result. 66 Return value: the freshly allocated resulting NUL-terminated string if 67 successful, otherwise NULL and errno set. */ 68 extern char * 69 str_iconveha (const char *src, 70 const char *from_codeset, const char *to_codeset, 71 bool transliterate, 72 enum iconv_ilseq_handler handler) 73 _GL_ATTRIBUTE_MALLOC _GL_ATTRIBUTE_DEALLOC_FREE; 74 75 76 /* In the above, FROM_CODESET can also be one of the following values: 77 "autodetect_utf8" supports ISO-8859-1 and UTF-8 78 "autodetect_jp" supports EUC-JP, ISO-2022-JP-2 and SHIFT_JIS 79 "autodetect_kr" supports EUC-KR and ISO-2022-KR 80 More names can be defined for autodetection. */ 81 82 /* Registers an encoding name for autodetection. 83 TRY_IN_ORDER is a NULL terminated list of encodings to be tried. 84 Returns 0 upon success, or -1 (with errno set) in case of error. 85 Particular errno values: ENOMEM. */ 86 extern int 87 uniconv_register_autodetect (const char *name, 88 const char * const *try_in_order); 89 90 91 #ifdef __cplusplus 92 } 93 #endif 94 95 96 #endif /* _STRICONVEHA_H */