# HG changeset patch # User Mychaela Falconia # Date 1517857287 0 # Node ID ec0d6d58e0437efb4a1924e79d919ccce5882b3a # Parent 3bcc56883b1711e959b312c00d084ffa4853ae72 uptools/libcoding: UTF-8 input conversion to 8859-1 implemented diff -r 3bcc56883b17 -r ec0d6d58e043 uptools/libcoding/Makefile --- a/uptools/libcoding/Makefile Mon Feb 05 17:35:49 2018 +0000 +++ b/uptools/libcoding/Makefile Mon Feb 05 19:01:27 2018 +0000 @@ -2,7 +2,7 @@ CFLAGS= -O2 OBJS= alpha_addr.o decode_helpers.o grokdcs.o gsm7_decode.o \ gsm7_decode_tables.o gsm7_unpack.o gsmtime.o hexdecode.o hexdump.o \ - number_decode.o scaddr.o ucs2_decode.o + number_decode.o scaddr.o ucs2_decode.o utf8_decode.o LIB= libcoding.a all: ${LIB} diff -r 3bcc56883b17 -r ec0d6d58e043 uptools/libcoding/utf8_decode.c --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/uptools/libcoding/utf8_decode.c Mon Feb 05 19:01:27 2018 +0000 @@ -0,0 +1,29 @@ +/* + * This library module implements a function that converts text input + * from UTF-8 to ISO 8859-1, rejecting any input Unicode characters + * that aren't in the 8859-1 range. The conversion in done in place. + */ + +#include + +utf8_to_latin1(buf) + u_char *buf; +{ + u_char *ip = buf, *op = buf; + int c, c2; + + while (c = *ip++) { + if (c < 0x80) { + *op++ = c; + continue; + } + if (c != 0xC2 && c != 0xC3) + return(-1); + c2 = *ip++; + if (c2 < 0x80 || c2 > 0xBF) + return(-1); + *op++ = ((c & 3) << 6) | (c2 & 0x3F); + } + *op = '\0'; + return(0); +}