From 395393a49ecd52595cbb10ecd7496156aefd55c4 Mon Sep 17 00:00:00 2001 From: Bruno Haible Date: Sun, 8 Mar 2009 15:14:42 +0100 Subject: [PATCH] New module 'unicase/u8-tolower'. --- ChangeLog | 4 ++ lib/unicase/u8-tolower.c | 118 +++++++++++++++++++++++++++++++++++++ modules/unicase/u8-tolower | 26 ++++++++ 3 files changed, 148 insertions(+) create mode 100644 lib/unicase/u8-tolower.c create mode 100644 modules/unicase/u8-tolower diff --git a/ChangeLog b/ChangeLog index 37ad231144..5ba9c1f7d1 100644 --- a/ChangeLog +++ b/ChangeLog @@ -1,5 +1,9 @@ 2009-03-08 Bruno Haible + New module 'unicase/u8-tolower'. + * lib/unicase/u8-tolower.c: New file. + * modules/unicase/u8-tolower: New file. + Tests for module 'unicase/u32-toupper'. * modules/unicase/u32-toupper-tests: New file. * tests/unicase/test-u32-toupper.c: New file. diff --git a/lib/unicase/u8-tolower.c b/lib/unicase/u8-tolower.c new file mode 100644 index 0000000000..8f8790b27c --- /dev/null +++ b/lib/unicase/u8-tolower.c @@ -0,0 +1,118 @@ +/* Lowercase mapping for UTF-8 strings (locale dependent). + Copyright (C) 2009 Free Software Foundation, Inc. + Written by Bruno Haible , 2009. + + This program is free software: you can redistribute it and/or modify it + under the terms of the GNU Lesser General Public License as published + by the Free Software Foundation; either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Lesser General Public License for more details. + + You should have received a copy of the GNU Lesser General Public License + along with this program. If not, see . */ + +#include + +/* Specification. */ +#include "unicase.h" + +#include + +#include "unicasemap.h" +#include "special-casing.h" + +uint8_t * +u8_tolower (const uint8_t *s, size_t n, const char *iso639_language, + uninorm_t nf, + uint8_t *resultbuf, size_t *lengthp) +{ + return u8_casemap (s, n, iso639_language, + uc_tolower, offsetof (struct special_casing_rule, lower[0]), + nf, + resultbuf, lengthp); +} + + +#ifdef TEST + +#include +#include +#include +#include + +/* Read the contents of an input stream, and return it, terminated with a NUL + byte. */ +char * +read_file (FILE *stream) +{ +#define BUFSIZE 4096 + char *buf = NULL; + int alloc = 0; + int size = 0; + int count; + + while (! feof (stream)) + { + if (size + BUFSIZE > alloc) + { + alloc = alloc + alloc / 2; + if (alloc < size + BUFSIZE) + alloc = size + BUFSIZE; + buf = realloc (buf, alloc); + if (buf == NULL) + { + fprintf (stderr, "out of memory\n"); + exit (1); + } + } + count = fread (buf + size, 1, BUFSIZE, stream); + if (count == 0) + { + if (ferror (stream)) + { + perror ("fread"); + exit (1); + } + } + else + size += count; + } + buf = realloc (buf, size + 1); + if (buf == NULL) + { + fprintf (stderr, "out of memory\n"); + exit (1); + } + buf[size] = '\0'; + return buf; +#undef BUFSIZE +} + +int +main (int argc, char * argv[]) +{ + setlocale (LC_ALL, ""); + if (argc == 1) + { + /* Display the lower case of the input string. */ + char *input = read_file (stdin); + int length = strlen (input); + size_t output_length; + uint8_t *output = + u8_tolower ((uint8_t *) input, length, uc_locale_language (), + NULL, + NULL, &output_length); + + fwrite (output, 1, output_length, stdout); + + return 0; + } + else + return 1; +} + +#endif /* TEST */ diff --git a/modules/unicase/u8-tolower b/modules/unicase/u8-tolower new file mode 100644 index 0000000000..2a5796197a --- /dev/null +++ b/modules/unicase/u8-tolower @@ -0,0 +1,26 @@ +Description: +Lowercase mapping for UTF-8 strings (locale dependent). + +Files: +lib/unicase/u8-tolower.c + +Depends-on: +unicase/base +unicase/u8-casemap +unicase/special-casing +unicase/tolower + +configure.ac: + +Makefile.am: +lib_SOURCES += unicase/u8-tolower.c + +Include: +"unicase.h" + +License: +LGPL + +Maintainer: +Bruno Haible + -- 2.30.2