summaryrefslogtreecommitdiff
path: root/src/utils/encoding.hpp
diff options
context:
space:
mode:
authorFlorent Le Coz <louiz@louiz.org>2013-12-11 21:07:39 +0100
committerFlorent Le Coz <louiz@louiz.org>2013-12-15 00:34:13 +0100
commit3960e4d5afa09c299f595b411ee8522db30580fd (patch)
tree74a94c7c16e35e09e20c0bca5f40db10eab9f664 /src/utils/encoding.hpp
parentb29290f73a24f2d5af7bde45c9ff5332c7a1f5a6 (diff)
downloadbiboumi-3960e4d5afa09c299f595b411ee8522db30580fd.tar.gz
biboumi-3960e4d5afa09c299f595b411ee8522db30580fd.tar.bz2
biboumi-3960e4d5afa09c299f595b411ee8522db30580fd.tar.xz
biboumi-3960e4d5afa09c299f595b411ee8522db30580fd.zip
Functions to provide xml-valid strings
By removing invalid chars, see http://www.w3.org/TR/xml/#charsets
Diffstat (limited to 'src/utils/encoding.hpp')
-rw-r--r--src/utils/encoding.hpp8
1 files changed, 8 insertions, 0 deletions
diff --git a/src/utils/encoding.hpp b/src/utils/encoding.hpp
index 362f1df..a3bccfc 100644
--- a/src/utils/encoding.hpp
+++ b/src/utils/encoding.hpp
@@ -12,6 +12,14 @@ namespace utils
*/
bool is_valid_utf8(const char* s);
/**
+ * Remove all invalid codepoints from the given utf-8-encoded string.
+ * The value returned is a copy of the string, without the removed chars.
+ *
+ * See http://www.w3.org/TR/xml/#charsets for the list of valid characters
+ * in XML.
+ */
+ std::string remove_invalid_xml_chars(const std::string& original);
+ /**
* Convert the given string (encoded is "encoding") into valid utf-8.
* If some decoding fails, insert an utf-8 placeholder character instead.
*/