From 2c595e8ddec759fb94bf1b06d21dada3a1b70978 Mon Sep 17 00:00:00 2001 From: Matthias Melcher Date: Fri, 20 Jan 2023 16:13:00 +0100 Subject: STR 2822: function to count bytes in a UTF-8 string --- src/fl_utf8.cxx | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) (limited to 'src') diff --git a/src/fl_utf8.cxx b/src/fl_utf8.cxx index 72589c8e7..2ca9d6b2f 100644 --- a/src/fl_utf8.cxx +++ b/src/fl_utf8.cxx @@ -118,8 +118,30 @@ int fl_utf8len1(char c) } // fl_utf8len1 +/** + Return the length in bytes of a UTF-8 string. + \param[in] text encoded in UTF-8 + \param[in] len number of Unicode characters, -1 to test until the end of text + \return number of bytes that make up the Unicode string + \see fl_utf_nb_char(const unsigned char *buf, int len) + */ +int fl_utf8strlen(const char *text, int len) +{ + if (len == -1) return (int)strlen(text); + int i, n = 0; + for (i=len; i>0; i--) { + if (*text == 0) return n; // end of string + int nc = fl_utf8len1(*text); + n += nc; + text += nc; + } + return n; +} + + /** Returns the number of Unicode chars in the UTF-8 string. + \see fl_utf8strlen(const char *text, int len) */ int fl_utf_nb_char( -- cgit v1.2.3