utf8proc

A clean C library for processing UTF-8 Unicode data
git clone https://git.sinitax.com/juliastrings/utf8proc
Log | Files | Refs | README | LICENSE | sfeed.txt

commit dad0cbdcabb682c1f26bc38da04608ce91aa19c7
parent 3822984606dd72ab129c0c9b26f496e75e7868e9
Author: Steven G. Johnson <stevenj@mit.edu>
Date:   Thu, 12 Mar 2015 14:29:33 -0400

update NEWS for 1.2-dev

Diffstat:
M NEWS.md    | 26 +++++++++++++++++++++++---
M utf8proc.h |  3 ++-
2 files changed, 25 insertions(+), 4 deletions(-)

diff --git a/NEWS.md b/NEWS.md
@@ -1,8 +1,28 @@
-# libutf8proc release history #
+# utf8proc release history #
 
-No releases so far.
+## Version 1.2-dev ##
 
-# utf8proc release history #
+- Updated for Unicode 7.0.
+
+- New function `utf8proc_grapheme_break(c1,c2)` that returns whether
+  there is a grapheme break between `c1` and `c2`.
+
+- New function `utf8proc_charwidth(c)` that returns the number of
+  column-positions that should be required for `c`; essentially a
+  portable replacment for `wcwidth(c)`.
+
+- New function `utf8proc_category(c)` that returns the Unicode
+  category of `c` (as one of the constants `UTF8PROC_CATEGORY_xx`).
+
+- New function `utf8proc_category_string(c)` that returns the Unicode
+  category of `c` as a two-character string.
+
+- `cmake` script `CMakeLists.txt`, in addition to `Makefile`, for
+  easier compilation on Windows.
+
+- The shared library is now versioned (e.g. has a soname on GNU/Linux).
+
+- C++/MSVC compatibility.
 
 ## Version 1.1.6 ##
 
diff --git a/utf8proc.h b/utf8proc.h
@@ -398,7 +398,8 @@ DLLEXPORT int utf8proc_category(int32_t c);
    UTF8PROC_CATEGORY_* constants.) */
 
 DLLEXPORT const char *utf8proc_category_string(int32_t c);
-/* Return the two-letter Unicode category string for c (e.g. "Lu" or "Co"). */
+/* Return the two-letter (nul-terminated) Unicode category string for
+   c (e.g. "Lu" or "Co"). */
 
 DLLEXPORT ssize_t utf8proc_map(
   const uint8_t *str, ssize_t strlen, uint8_t **dstptr, int options