diff options
author | Florent Le Coz <louiz@louiz.org> | 2013-12-11 21:07:39 +0100 |
---|---|---|
committer | Florent Le Coz <louiz@louiz.org> | 2013-12-15 00:34:13 +0100 |
commit | 3960e4d5afa09c299f595b411ee8522db30580fd (patch) | |
tree | 74a94c7c16e35e09e20c0bca5f40db10eab9f664 /src/utils/encoding.hpp | |
parent | b29290f73a24f2d5af7bde45c9ff5332c7a1f5a6 (diff) | |
download | biboumi-3960e4d5afa09c299f595b411ee8522db30580fd.tar.gz biboumi-3960e4d5afa09c299f595b411ee8522db30580fd.tar.bz2 biboumi-3960e4d5afa09c299f595b411ee8522db30580fd.tar.xz biboumi-3960e4d5afa09c299f595b411ee8522db30580fd.zip |
Functions to provide xml-valid strings
By removing invalid chars, see http://www.w3.org/TR/xml/#charsets
Diffstat (limited to 'src/utils/encoding.hpp')
-rw-r--r-- | src/utils/encoding.hpp | 8 |
1 files changed, 8 insertions, 0 deletions
diff --git a/src/utils/encoding.hpp b/src/utils/encoding.hpp index 362f1df..a3bccfc 100644 --- a/src/utils/encoding.hpp +++ b/src/utils/encoding.hpp @@ -12,6 +12,14 @@ namespace utils */ bool is_valid_utf8(const char* s); /** + * Remove all invalid codepoints from the given utf-8-encoded string. + * The value returned is a copy of the string, without the removed chars. + * + * See http://www.w3.org/TR/xml/#charsets for the list of valid characters + * in XML. + */ + std::string remove_invalid_xml_chars(const std::string& original); + /** * Convert the given string (encoded is "encoding") into valid utf-8. * If some decoding fails, insert an utf-8 placeholder character instead. */ |