// Smoke test for the boost::utf8 library (checked and unchecked variants).
#include <cstring>
#include <iterator>
#include <vector>
#include "boost/utf8.hpp"
#include <boost/detail/lightweight_test.hpp>
using namespace boost::utf8;
using namespace std;
int main()
unsigned char u[5] = {0,0,0,0,0};
unsigned char* end = append(0x0448, u);
BOOST_TEST (u[0] == 0xd1 && u[1] == 0x88 && u[2] == 0 && u[3] == 0 && u[4] == 0);
end = append(0x65e5, u);
BOOST_TEST (u[0] == 0xe6 && u[1] == 0x97 && u[2] == 0xa5 && u[3] == 0 && u[4] == 0);
end = append(0x3044, u);
BOOST_TEST (u[0] == 0xe3 && u[1] == 0x81 && u[2] == 0x84 && u[3] == 0 && u[4] == 0);
end = append(0x10346, u);
BOOST_TEST (u[0] == 0xf0 && u[1] == 0x90 && u[2] == 0x8d && u[3] == 0x86 && u[4] == 0);
char* twochars = "\xe6\x97\xa5\xd1\x88";
char* w = twochars;
int cp = next(w, twochars + 6);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == twochars + 3);
char* threechars = "\xf0\x90\x8d\x86\xe6\x97\xa5\xd1\x88";
w = threechars;
cp = next(w, threechars + 9);
BOOST_TEST (cp == 0x10346);
BOOST_TEST (w == threechars + 4);
cp = next(w, threechars + 9);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == threechars + 7);
cp = next(w, threechars + 9);
BOOST_TEST (cp == 0x0448);
BOOST_TEST (w == threechars + 9);
w = twochars + 3;
cp = prior (w, twochars - 1);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == twochars);
w = threechars + 9;
cp = prior(w, threechars - 1);
BOOST_TEST (cp == 0x0448);
BOOST_TEST (w == threechars + 7);
cp = prior(w, threechars -1);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == threechars + 4);
cp = prior(w, threechars - 1);
BOOST_TEST (cp == 0x10346);
BOOST_TEST (w == threechars);
// advance
w = twochars;
advance (w, 2, twochars + 6);
BOOST_TEST (w == twochars + 5);
// distance
size_t dist = boost::utf8::distance(twochars, twochars + 5);
BOOST_TEST (dist == 2);
// utf32to8
int utf32string[] = {0x448, 0x65E5, 0x10346, 0};
vector<char> utf8result;
utf32to8(utf32string, utf32string + 3, back_inserter(utf8result));
BOOST_TEST (utf8result.size() == 9);
// try it with the return value;
char* utf8_end = utf32to8(utf32string, utf32string + 3, &utf8result[0]);
BOOST_TEST (utf8_end == &utf8result[0] + 9);
vector<int> utf32result;
utf8to32(twochars, twochars + 5, back_inserter(utf32result));
BOOST_TEST (utf32result.size() == 2);
// try it with the return value;
int* utf32_end = utf8to32(twochars, twochars + 5, &utf32result[0]);
BOOST_TEST (utf32_end == &utf32result[0] + 2);
unsigned short utf16string[] = {0x41, 0x0448, 0x65e5, 0xd834, 0xdd1e};
utf16to8(utf16string, utf16string + 5, back_inserter(utf8result));
BOOST_TEST (utf8result.size() == 10);
// try it with the return value;
utf8_end = utf16to8 (utf16string, utf16string + 5, &utf8result[0]);
BOOST_TEST (utf8_end == &utf8result[0] + 10);
char utf8_with_surrogates[] = "\xe6\x97\xa5\xd1\x88\xf0\x9d\x84\x9e";
vector <unsigned short> utf16result;
utf8to16(utf8_with_surrogates, utf8_with_surrogates + 9, back_inserter(utf16result));
BOOST_TEST (utf16result.size() == 4);
BOOST_TEST (utf16result[2] == 0xd834);
BOOST_TEST (utf16result[3] == 0xdd1e);
// try it with the return value;
unsigned short* utf16_end = utf8to16 (utf8_with_surrogates, utf8_with_surrogates + 9, &utf16result[0]);
BOOST_TEST (utf16_end == &utf16result[0] + 4);
char utf_invalid[] = "\xe6\x97\xa5\xd1\x88\xfa";
char* invalid = find_invalid(utf_invalid, utf_invalid + 6);
BOOST_TEST (invalid == utf_invalid + 5);
bool bvalid = is_valid(utf_invalid, utf_invalid + 6);
BOOST_TEST (bvalid == false);
bvalid = is_valid(utf8_with_surrogates, utf8_with_surrogates + 9);
BOOST_TEST (bvalid == true);
unsigned char byte_order_mark[] = {0xef, 0xbb, 0xbf};
bool bbom = is_bom(byte_order_mark);
BOOST_TEST (bbom == true);
//// Unchecked variants
memset(u, 0, 5);
end = unchecked::append(0x0448, u);
BOOST_TEST (u[0] == 0xd1 && u[1] == 0x88 && u[2] == 0 && u[3] == 0 && u[4] == 0);
end = unchecked::append(0x65e5, u);
BOOST_TEST (u[0] == 0xe6 && u[1] == 0x97 && u[2] == 0xa5 && u[3] == 0 && u[4] == 0);
end = unchecked::append(0x10346, u);
BOOST_TEST (u[0] == 0xf0 && u[1] == 0x90 && u[2] == 0x8d && u[3] == 0x86 && u[4] == 0);
w = twochars;
cp = unchecked::next(w);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == twochars + 3);
w = threechars;
cp = unchecked::next(w);
BOOST_TEST (cp == 0x10346);
BOOST_TEST (w == threechars + 4);
cp = unchecked::next(w);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == threechars + 7);
cp = unchecked::next(w);
BOOST_TEST (cp == 0x0448);
BOOST_TEST (w == threechars + 9);
w = twochars + 3;
cp = unchecked::prior (w);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == twochars);
w = threechars + 9;
cp = unchecked::prior(w);
BOOST_TEST (cp == 0x0448);
BOOST_TEST (w == threechars + 7);
cp = unchecked::prior(w);
BOOST_TEST (cp == 0x65e5);
BOOST_TEST (w == threechars + 4);
cp = unchecked::prior(w);
BOOST_TEST (cp == 0x10346);
BOOST_TEST (w == threechars);
// advance
w = twochars;
unchecked::advance (w, 2);
BOOST_TEST (w == twochars + 5);
// distance
dist = unchecked::distance(twochars, twochars + 5);
BOOST_TEST (dist == 2);
// utf32to8
unchecked::utf32to8(utf32string, utf32string + 3, back_inserter(utf8result));
BOOST_TEST (utf8result.size() == 9);
// try it with the return value;
utf8_end = utf32to8(utf32string, utf32string + 3, &utf8result[0]);
BOOST_TEST(utf8_end == &utf8result[0] + 9);
unchecked::utf8to32(twochars, twochars + 5, back_inserter(utf32result));
BOOST_TEST (utf32result.size() == 2);
// try it with the return value;
utf32_end = utf8to32(twochars, twochars + 5, &utf32result[0]);
BOOST_TEST (utf32_end == &utf32result[0] + 2);
unchecked::utf16to8(utf16string, utf16string + 5, back_inserter(utf8result));
BOOST_TEST (utf8result.size() == 10);
// try it with the return value;
utf8_end = utf16to8 (utf16string, utf16string + 5, &utf8result[0]);
BOOST_TEST (utf8_end == &utf8result[0] + 10);
unchecked::utf8to16(utf8_with_surrogates, utf8_with_surrogates + 9, back_inserter(utf16result));
BOOST_TEST (utf16result.size() == 4);
BOOST_TEST (utf16result[2] == 0xd834);
BOOST_TEST (utf16result[3] == 0xdd1e);
// try it with the return value;
utf16_end = utf8to16 (utf8_with_surrogates, utf8_with_surrogates + 9, &utf16result[0]);
BOOST_TEST (utf16_end == &utf16result[0] + 4);
return boost::report_errors();