TextUtfEncodingTest.cpp 1.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142
  1. /*
  2. * Copyright 2021 gitlost
  3. */
  4. // SPDX-License-Identifier: Apache-2.0
  5. #include "Utf.h"
  6. #include "gtest/gtest.h"
  7. using namespace ZXing;
  8. #if __cplusplus > 201703L
  9. std::string EscapeNonGraphical(const char8_t* utf8)
  10. {
  11. return EscapeNonGraphical(reinterpret_cast<const char*>(utf8));
  12. }
  13. #endif
  14. TEST(TextUtfEncodingTest, EscapeNonGraphical)
  15. {
  16. EXPECT_EQ(EscapeNonGraphical(u8"\u00B6\u0416"), "¶Ж");
  17. EXPECT_EQ(EscapeNonGraphical(u8"\x01\x1F\x7F"), "<SOH><US><DEL>");
  18. EXPECT_EQ(EscapeNonGraphical(u8"\u0080\u009F"), "<U+80><U+9F>");
  19. EXPECT_EQ(EscapeNonGraphical(u8"\u00A0"), "<U+A0>"); // NO-BREAK space (nbsp)
  20. EXPECT_EQ(EscapeNonGraphical(u8"\u2007"), "<U+2007>"); // NO-BREAK space (numsp)
  21. EXPECT_EQ(EscapeNonGraphical(u8"\u2000"), "<U+2000>"); // Space char (nqsp)
  22. EXPECT_EQ(EscapeNonGraphical(u8"\uFFFD"), "<U+FFFD>");
  23. EXPECT_EQ(EscapeNonGraphical(u8"\uFFFF"), "<U+FFFF>");
  24. }
  25. TEST(TextUtfEncodingTest, FromUtf8)
  26. {
  27. EXPECT_EQ(FromUtf8(u8"\U00010000"), L"\U00010000");
  28. EXPECT_EQ(FromUtf8(u8"\U00010FFF"), L"\U00010FFF");
  29. EXPECT_EQ(FromUtf8("A\xE8\x80\xBFG"), L"A\u803FG"); // U+803F
  30. // EXPECT_EQ(FromUtf8("A\xE8\x80\xBF\x80G"), L"A\u803FG"); // Bad UTF-8 (extra continuation byte)
  31. // EXPECT_EQ(FromUtf8("A\xE8\x80\xC0G"), L"AG"); // Bad UTF-8 (non-continuation byte)
  32. // EXPECT_EQ(FromUtf8("A\xE8\x80G"), L"AG"); // Bad UTF-8 (missing continuation byte)
  33. // EXPECT_EQ(FromUtf8("A\xE8G"), L"AG"); // Bad UTF-8 (missing continuation bytes)
  34. // EXPECT_EQ(FromUtf8("A\xED\xA0\x80G"), L"AG"); // Bad UTF-8 (unpaired high surrogate U+D800)
  35. }