diff options
author | Kiyoshi Aman <kiyoshi.aman+adelie@gmail.com> | 2019-02-01 22:55:37 +0000 |
---|---|---|
committer | Kiyoshi Aman <kiyoshi.aman+adelie@gmail.com> | 2019-02-03 18:22:05 -0600 |
commit | 5b57d28ffb6e1ef86b50f7d05d977826eae89bfe (patch) | |
tree | 154a22fe556b49e6927197336f8bf91b12eacd5e /usr.bin/iconv/iconv.c | |
download | userland-5b57d28ffb6e1ef86b50f7d05d977826eae89bfe.tar.gz userland-5b57d28ffb6e1ef86b50f7d05d977826eae89bfe.tar.bz2 userland-5b57d28ffb6e1ef86b50f7d05d977826eae89bfe.tar.xz userland-5b57d28ffb6e1ef86b50f7d05d977826eae89bfe.zip |
initial population
Diffstat (limited to 'usr.bin/iconv/iconv.c')
-rw-r--r-- | usr.bin/iconv/iconv.c | 236 |
1 files changed, 236 insertions, 0 deletions
diff --git a/usr.bin/iconv/iconv.c b/usr.bin/iconv/iconv.c new file mode 100644 index 0000000..dd9a5d4 --- /dev/null +++ b/usr.bin/iconv/iconv.c @@ -0,0 +1,236 @@ +/* $NetBSD: iconv.c,v 1.19 2013/10/07 02:00:46 dholland Exp $ */ + +/*- + * Copyright (c)2003 Citrus Project, + * All rights reserved. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions + * are met: + * 1. Redistributions of source code must retain the above copyright + * notice, this list of conditions and the following disclaimer. + * 2. Redistributions in binary form must reproduce the above copyright + * notice, this list of conditions and the following disclaimer in the + * documentation and/or other materials provided with the distribution. + * + * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS + * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT + * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY + * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF + * SUCH DAMAGE. + */ + +#include <sys/cdefs.h> +#if defined(LIBC_SCCS) && !defined(lint) +__RCSID("$NetBSD: iconv.c,v 1.19 2013/10/07 02:00:46 dholland Exp $"); +#endif /* LIBC_SCCS and not lint */ + +#include <err.h> +#include <errno.h> +#include <iconv.h> +#include <langinfo.h> +#include <locale.h> +#include <stdio.h> +#include <stdlib.h> +#include <string.h> +#include <unistd.h> +#include <util.h> + +static void usage(void) __dead; +static int scmp(const void *, const void *); +static void show_codesets(void); +static void do_conv(const char *, FILE *, const char *, const char *, int, int); + +static void +usage(void) +{ + (void)fprintf(stderr, + "Usage:\t%1$s [-cs] -f <from_code> -t <to_code> [file ...]\n" + "\t%1$s -f <from_code> [-cs] [-t <to_code>] [file ...]\n" + "\t%1$s -t <to_code> [-cs] [-f <from_code>] [file ...]\n" + "\t%1$s -l\n", getprogname()); + exit(1); +} + +/* + * qsort() helper function + */ +static int +scmp(const void *v1, const void *v2) +{ + const char * const *s1 = v1; + const char * const *s2 = v2; + + return strcasecmp(*s1, *s2); +} + +static void +show_codesets(void) +{ + char **list; + size_t sz, i; + + if (__iconv_get_list(&list, &sz)) + err(EXIT_FAILURE, "__iconv_get_list()"); + + qsort(list, sz, sizeof(char *), scmp); + + for (i = 0; i < sz; i++) + (void)printf("%s\n", list[i]); + + __iconv_free_list(list, sz); +} + +#define INBUFSIZE 1024 +#define OUTBUFSIZE (INBUFSIZE * 2) +/*ARGSUSED*/ +static void +do_conv(const char *fn, FILE *fp, const char *from, const char *to, int silent, + int hide_invalid) +{ + char inbuf[INBUFSIZE], outbuf[OUTBUFSIZE], *out; + const char *in; + size_t inbytes, outbytes, ret, invalids; + iconv_t cd; + uint32_t flags = 0; + int serrno; + + if (hide_invalid) + flags |= __ICONV_F_HIDE_INVALID; + cd = iconv_open(to, from); + if (cd == (iconv_t)-1) + err(EXIT_FAILURE, "iconv_open(%s, %s)", to, from); + + invalids = 0; + while ((inbytes = fread(inbuf, 1, INBUFSIZE, fp)) > 0) { + in = inbuf; + while (inbytes > 0) { + size_t inval; + + out = outbuf; + outbytes = OUTBUFSIZE; + ret = __iconv(cd, &in, &inbytes, &out, &outbytes, + flags, &inval); + serrno = errno; + invalids += inval; + if (outbytes < OUTBUFSIZE) + (void)fwrite(outbuf, 1, OUTBUFSIZE - outbytes, + stdout); + errno = serrno; + if (ret == (size_t)-1 && errno != E2BIG) { + /* + * XXX: iconv(3) is bad interface. + * invalid character count is lost here. + * instead, we just provide __iconv function. + */ + if (errno != EINVAL || in == inbuf) + err(EXIT_FAILURE, "iconv()"); + + /* incomplete input character */ + (void)memmove(inbuf, in, inbytes); + ret = fread(inbuf + inbytes, 1, + INBUFSIZE - inbytes, fp); + if (ret == 0) { + fflush(stdout); + if (feof(fp)) + errx(EXIT_FAILURE, + "unexpected end of file; " + "the last character is " + "incomplete."); + else + err(EXIT_FAILURE, "fread()"); + } + in = inbuf; + inbytes += ret; + } + } + } + /* reset the shift state of the output buffer */ + outbytes = OUTBUFSIZE; + out = outbuf; + ret = iconv(cd, NULL, NULL, &out, &outbytes); + if (ret == (size_t)-1) + err(EXIT_FAILURE, "iconv()"); + if (outbytes < OUTBUFSIZE) + (void)fwrite(outbuf, 1, OUTBUFSIZE - outbytes, stdout); + + if (invalids > 0 && !silent) + warnx("warning: invalid characters: %lu", + (unsigned long)invalids); + + iconv_close(cd); +} + +int +main(int argc, char **argv) +{ + int ch, i; + int opt_l = 0, opt_s = 0, opt_c = 0; + char *opt_f = NULL, *opt_t = NULL; + FILE *fp; + + setlocale(LC_ALL, ""); + setprogname(argv[0]); + + while ((ch = getopt(argc, argv, "cslf:t:")) != EOF) { + switch (ch) { + case 'c': + opt_c = 1; + break; + case 's': + opt_s = 1; + break; + case 'l': + /* list */ + opt_l = 1; + break; + case 'f': + /* from */ + opt_f = estrdup(optarg); + break; + case 't': + /* to */ + opt_t = estrdup(optarg); + break; + default: + usage(); + } + } + argc -= optind; + argv += optind; + if (opt_l) { + if (argc > 0 || opt_s || opt_f != NULL || opt_t != NULL) { + warnx("-l is not allowed with other flags."); + usage(); + } + show_codesets(); + } else { + if (opt_f == NULL) { + if (opt_t == NULL) + usage(); + opt_f = nl_langinfo(CODESET); + } else if (opt_t == NULL) + opt_t = nl_langinfo(CODESET); + + if (argc == 0) + do_conv("<stdin>", stdin, opt_f, opt_t, opt_s, opt_c); + else { + for (i = 0; i < argc; i++) { + fp = fopen(argv[i], "r"); + if (fp == NULL) + err(EXIT_FAILURE, "Cannot open `%s'", + argv[i]); + do_conv(argv[i], fp, opt_f, opt_t, opt_s, + opt_c); + (void)fclose(fp); + } + } + } + return EXIT_SUCCESS; +} |