/*- * Copyright (C) 2009 Gabor Kovesdan * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF * SUCH DAMAGE. */ #include #include #include #include #include #include #include #include #include #include static bool uc_hook = false; static bool wc_hook = false; static bool mb_uc_fb = false; void unicode_hook(unsigned int mbr, void *data); void wchar_hook(wchar_t wc, void *data); void mb_to_uc_fb(const char *, size_t, void (*write_replacement) (const unsigned int *, size_t, void *), void *, void *); static int ctl_get_translit1(void) { iconv_t cd; int arg, ret; cd = iconv_open("ASCII//TRANSLIT", "UTF-8"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_GET_TRANSLITERATE, &arg) == 0) ret = (arg == 1) ? 0 : -1; else ret = -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_get_translit2(void) { iconv_t cd; int arg, ret; cd = iconv_open("ASCII", "UTF-8"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_GET_TRANSLITERATE, &arg) == 0) ret = (arg == 0) ? 0 : -1; else ret = -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_set_translit1(void) { iconv_t cd; int arg = 1, ret; cd = iconv_open("ASCII", "UTF-8"); if (cd == (iconv_t)-1) return (-1); ret = iconvctl(cd, ICONV_SET_TRANSLITERATE, &arg) == 0 ? 0 : -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_set_translit2(void) { iconv_t cd; int arg = 0, ret; cd = iconv_open("ASCII//TRANSLIT", "UTF-8"); if (cd == (iconv_t)-1) return (-1); ret = iconvctl(cd, ICONV_SET_TRANSLITERATE, &arg) == 0 ? 0 : -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_get_discard_ilseq1(void) { iconv_t cd; int arg, ret; cd = iconv_open("ASCII", "UTF-8"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_GET_DISCARD_ILSEQ, &arg) == 0) ret = arg == 0 ? 0 : -1; else ret = -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_get_discard_ilseq2(void) { iconv_t cd; int arg, ret; cd = iconv_open("ASCII//IGNORE", "UTF-8"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_GET_DISCARD_ILSEQ, &arg) == 0) ret = arg == 1 ? 0 : -1; else ret = -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_set_discard_ilseq1(void) { iconv_t cd; int arg = 1, ret; cd = iconv_open("ASCII", "UTF-8"); if (cd == (iconv_t)-1) return (-1); ret = iconvctl(cd, ICONV_SET_DISCARD_ILSEQ, &arg) == 0 ? 0 : -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_set_discard_ilseq2(void) { iconv_t cd; int arg = 0, ret; cd = iconv_open("ASCII//IGNORE", "UTF-8"); if (cd == (iconv_t)-1) return (-1); ret = iconvctl(cd, ICONV_SET_DISCARD_ILSEQ, &arg) == 0 ? 0 : -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_trivialp1(void) { iconv_t cd; int arg, ret; cd = iconv_open("latin2", "latin2"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_TRIVIALP, &arg) == 0) { ret = (arg == 1) ? 0 : -1; } else ret = -1; if (iconv_close(cd) == -1) return (-1); return (ret); } static int ctl_trivialp2(void) { iconv_t cd; int arg, ret; cd = iconv_open("ASCII", "KOI8-R"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_TRIVIALP, &arg) == 0) { ret = (arg == 0) ? 0 : -1; } else ret = -1; if (iconv_close(cd) == -1) return (-1); return (ret); } void unicode_hook(unsigned int mbr, void *data) { #ifdef VERBOSE printf("Unicode hook: %u\n", mbr); #endif uc_hook = true; } void wchar_hook(wchar_t wc, void *data) { #ifdef VERBOSE printf("Wchar hook: %ull\n", wc); #endif wc_hook = true; } static int ctl_uc_hook(void) { struct iconv_hooks hooks; iconv_t cd; size_t inbytesleft = 15, outbytesleft = 40; char **inptr; char *s = "Hello World!"; char **outptr; char *outbuf; inptr = &s; hooks.uc_hook = unicode_hook; hooks.wc_hook = NULL; outbuf = malloc(40); outptr = &outbuf; cd = iconv_open("UTF-8", "ASCII"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_SET_HOOKS, (void *)&hooks) != 0) return (-1); if (iconv(cd, inptr, &inbytesleft, outptr, &outbytesleft) == (size_t)-1) return (-1); if (iconv_close(cd) == -1) return (-1); return (uc_hook ? 0 : 1); } static int ctl_wc_hook(void) { struct iconv_hooks hooks; iconv_t cd; size_t inbytesleft, outbytesleft = 40; char **inptr; char *s = "Hello World!"; char **outptr; char *outbuf; inptr = &s; hooks.wc_hook = wchar_hook; hooks.uc_hook = NULL; outbuf = malloc(40); outptr = &outbuf; inbytesleft = sizeof(s); cd = iconv_open("SHIFT_JIS", "ASCII"); if (cd == (iconv_t)-1) return (-1); if (iconvctl(cd, ICONV_SET_HOOKS, (void *)&hooks) != 0) return (-1); if (iconv(cd, inptr, &inbytesleft, outptr, &outbytesleft) == (size_t)-1) return (-1); if (iconv_close(cd) == -1) return (-1); return (wc_hook ? 0 : 1); } static int gnu_canonicalize1(void) { return (strcmp(iconv_canonicalize("latin2"), "ISO-8859-2")); } static int gnu_canonicalize2(void) { return (!strcmp(iconv_canonicalize("ASCII"), iconv_canonicalize("latin2"))); } static int iconvlist_cb(unsigned int count, const char * const *names, void *data) { return (*(int *)data = ((names == NULL) && (count > 0)) ? -1 : 0); } static int gnu_iconvlist(void) { int i; iconvlist(iconvlist_cb, (void *)&i); return (i); } void mb_to_uc_fb(const char* inbuf, size_t inbufsize, void (*write_replacement)(const unsigned int *buf, size_t buflen, void* callback_arg), void* callback_arg, void* data) { unsigned int c = 0x3F; mb_uc_fb = true; write_replacement((const unsigned int *)&c, 1, NULL); } static int __unused ctl_mb_to_uc_fb(void) { struct iconv_fallbacks fb; iconv_t cd; size_t inbytesleft, outbytesleft; uint16_t inbuf[1] = { 0xF187 }; uint8_t outbuf[4] = { 0x00, 0x00, 0x00, 0x00 }; char *inptr; char *outptr; int ret; if ((cd = iconv_open("UTF-32", "UTF-8")) == (iconv_t)-1) return (1); fb.uc_to_mb_fallback = NULL; fb.mb_to_wc_fallback = NULL; fb.wc_to_mb_fallback = NULL; fb.mb_to_uc_fallback = mb_to_uc_fb; fb.data = NULL; if (iconvctl(cd, ICONV_SET_FALLBACKS, (void *)&fb) != 0) return (1); inptr = (char *)inbuf; outptr = (char *)outbuf; inbytesleft = 2; outbytesleft = 4; errno = 0; ret = iconv(cd, &inptr, &inbytesleft, &outptr, &outbytesleft); #ifdef VERBOSE printf("mb_uc fallback: %c\n", outbuf[0]); #endif if (mb_uc_fb && (outbuf[0] == 0x3F)) return (0); else return (1); } static int gnu_openinto(void) { iconv_allocation_t *myspace; size_t inbytesleft, outbytesleft; char *inptr; char *inbuf = "works!", *outptr; char outbuf[6]; if ((myspace = (iconv_allocation_t *)malloc(sizeof(iconv_allocation_t))) == NULL) return (1); if (iconv_open_into("ASCII", "ASCII", myspace) == -1) return (1); inptr = (char *)inbuf; outptr = (char *)outbuf; inbytesleft = 6; outbytesleft = 6; iconv((iconv_t)myspace, &inptr, &inbytesleft, &outptr, &outbytesleft); return ((memcmp(inbuf, outbuf, 6) == 0) ? 0 : 1); } static void test(int (tester) (void), const char * label) { int ret; if ((ret = tester())) printf("%s failed (%d)\n", label, ret); else printf("%s succeeded\n", label); } int main(void) { test(ctl_get_translit1, "ctl_get_translit1"); test(ctl_get_translit2, "ctl_get_translit2"); test(ctl_set_translit1, "ctl_set_translit1"); test(ctl_set_translit2, "ctl_set_translit2"); test(ctl_get_discard_ilseq1, "ctl_get_discard_ilseq1"); test(ctl_get_discard_ilseq2, "ctl_get_discard_ilseq2"); test(ctl_set_discard_ilseq1, "ctl_set_discard_ilseq1"); test(ctl_set_discard_ilseq2, "ctl_set_discard_ilseq2"); test(ctl_trivialp1, "ctl_trivialp1"); test(ctl_trivialp2, "ctl_trivialp2"); test(ctl_uc_hook, "ctl_uc_hook"); test(ctl_wc_hook, "ctl_wc_hook"); // test(ctl_mb_to_uc_fb, "ctl_mb_to_uc_fb"); test(gnu_openinto, "gnu_openinto"); test(gnu_canonicalize1, "gnu_canonicalize1"); test(gnu_canonicalize2, "gnu_canonicalize2"); test(gnu_iconvlist, "gnu_iconvlist"); }