summaryrefslogtreecommitdiff
path: root/src/shared/utf8.c
diff options
context:
space:
mode:
authorZbigniew Jędrzejewski-Szmek <zbyszek@in.waw.pl>2014-01-17 21:28:41 -0500
committerZbigniew Jędrzejewski-Szmek <zbyszek@in.waw.pl>2014-02-08 13:07:39 -0500
commit550a40eceb7d1917152fc9317bf2696708d52bc2 (patch)
tree929a5bac5264ad95783b1a68897daa67e3a25428 /src/shared/utf8.c
parentcda7ecb0a3d6cf839ec484a6690c12857a6e8375 (diff)
core: do not print invalid utf-8 in error messages
Diffstat (limited to 'src/shared/utf8.c')
-rw-r--r--src/shared/utf8.c26
1 files changed, 26 insertions, 0 deletions
diff --git a/src/shared/utf8.c b/src/shared/utf8.c
index 6e5ba9abf4..0b524d8a90 100644
--- a/src/shared/utf8.c
+++ b/src/shared/utf8.c
@@ -174,6 +174,32 @@ const char *utf8_is_valid(const char *str) {
return str;
}
+char *utf8_escape_invalid(const char *str) {
+ char *p, *s;
+
+ assert(str);
+
+ p = s = malloc(strlen(str) * 4 + 1);
+ if (!p)
+ return NULL;
+
+ while (*str) {
+ int len;
+
+ len = utf8_encoded_valid_unichar(str);
+ if (len > 0) {
+ s = mempcpy(s, str, len);
+ str += len;
+ } else {
+ s = mempcpy(s, UTF8_REPLACEMENT_CHARACTER, strlen(UTF8_REPLACEMENT_CHARACTER));
+ str += 1;
+ }
+ }
+ *s = '\0';
+
+ return p;
+}
+
char *ascii_is_valid(const char *str) {
const char *p;