summary | refs | log | tree | commit | diff
path: root/test/text_decoder_test.cc
diff options
context:
space:
mode:
author Carl Hetherington <cth@carlh.net> 2023-02-27 23:20:14 +0100
committer Carl Hetherington <cth@carlh.net> 2023-02-27 23:20:14 +0100
commit 15fe326c723b88f779d69fe0ae737d27d69e6e6f (patch)
tree 3c96a84f975b009d6835ec324518d95049bbb7b8 /test/text_decoder_test.cc
parent ae859e7d02fb889ab966e0d69e2d0c42937620fe (diff)
Strip disallowed characters from subtitles before they get into the XML.
Diffstat (limited to 'test/text_decoder_test.cc')
-rw-r--r-- test/text_decoder_test.cc 32
1 files changed, 32 insertions, 0 deletions
diff --git a/test/text_decoder_test.cc b/test/text_decoder_test.cc
new file mode 100644
index 000000000..d6cbd4ce1
--- /dev/null
+++ b/test/text_decoder_test.cc
@@ -0,0 +1,32 @@
+/*
+ Copyright (C) 2023 Carl Hetherington <cth@carlh.net>
+
+ This file is part of DCP-o-matic.
+
+ DCP-o-matic is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation; either version 2 of the License, or
+ (at your option) any later version.
+
+ DCP-o-matic is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with DCP-o-matic. If not, see <http://www.gnu.org/licenses/>.
+
+*/
+
+
+#include "lib/text_decoder.h"
+#include <boost/test/unit_test.hpp>
+
+
+BOOST_AUTO_TEST_CASE(strip_invalid_characters_for_xml_test) // Exercises TextDecoder::remove_invalid_characters_for_xml() on literal inputs, comparing against the expected cleaned string.
+{
+ BOOST_CHECK_EQUAL(TextDecoder::remove_invalid_characters_for_xml("hello world"), "hello world"); // Plain ASCII text is expected back unchanged.
+ BOOST_CHECK_EQUAL(TextDecoder::remove_invalid_characters_for_xml("hello\x0cworld"), "helloworld"); // Form feed (0x0C) is expected to be dropped, with nothing put in its place.
+ BOOST_CHECK_EQUAL(TextDecoder::remove_invalid_characters_for_xml("𒀖hello\x02worl𒁝d"), "𒀖helloworl𒁝d"); // 0x02 is expected to be dropped while the characters outside the BMP on either side survive intact.
+ BOOST_CHECK_EQUAL(TextDecoder::remove_invalid_characters_for_xml("😀œ´®†¥¨ˆø\x09π¬˚∆\x1a˙©ƒ∂ßåΩ≈ç√∫\x02˜µ≤ユーザーコードa"), "😀œ´®†¥¨ˆø\x09π¬˚∆˙©ƒ∂ßåΩ≈ç√∫˜µ≤ユーザーコードa"); // Mixed input: tab (0x09) is expected to be kept, 0x1A and 0x02 dropped, and the emoji, symbols and katakana left alone.
+}