Serenity Operating System
1/*
2 * Copyright (c) 2019-2020, Sergey Bugaev <bugaevc@serenityos.org>
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * 1. Redistributions of source code must retain the above copyright notice, this
9 * list of conditions and the following disclaimer.
10 *
11 * 2. Redistributions in binary form must reproduce the above copyright notice,
12 * this list of conditions and the following disclaimer in the documentation
13 * and/or other materials provided with the distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
22 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
23 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
24 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25 */
26
27#include <AK/TestSuite.h>
28
29#include <AK/Utf8View.h>
30
31TEST_CASE(decode_ascii)
32{
33 Utf8View utf8 { "Hello World!11" };
34 EXPECT(utf8.validate());
35
36 u32 expected[] = { 72, 101, 108, 108, 111, 32, 87, 111, 114, 108, 100, 33, 49, 49 };
37 size_t expected_size = sizeof(expected) / sizeof(expected[0]);
38
39 size_t i = 0;
40 for (u32 codepoint : utf8) {
41 ASSERT(i < expected_size);
42 EXPECT_EQ(codepoint, expected[i]);
43 i++;
44 }
45 EXPECT_EQ(i, expected_size);
46}
47
48TEST_CASE(decode_utf8)
49{
50 Utf8View utf8 { "Привет, мир! 😀 γειά σου κόσμος こんにちは世界" };
51 EXPECT(utf8.validate());
52
53 u32 expected[] = { 1055, 1088, 1080, 1074, 1077, 1090, 44, 32, 1084, 1080, 1088, 33, 32, 128512, 32, 947, 949, 953, 940, 32, 963, 959, 965, 32, 954, 972, 963, 956, 959, 962, 32, 12371, 12435, 12395, 12385, 12399, 19990, 30028 };
54 size_t expected_size = sizeof(expected) / sizeof(expected[0]);
55
56 size_t i = 0;
57 for (u32 codepoint : utf8) {
58 ASSERT(i < expected_size);
59 EXPECT_EQ(codepoint, expected[i]);
60 i++;
61 }
62 EXPECT_EQ(i, expected_size);
63}
64
65TEST_CASE(validate_invalid_ut8)
66{
67 char invalid_utf8_1[] = { 42, 35, (char)182, 9, 0 };
68 Utf8View utf8_1 { invalid_utf8_1 };
69 EXPECT(!utf8_1.validate());
70
71 char invalid_utf8_2[] = { 42, 35, (char)208, (char)208, 0 };
72 Utf8View utf8_2 { invalid_utf8_2 };
73 EXPECT(!utf8_2.validate());
74
75 char invalid_utf8_3[] = { (char)208, 0 };
76 Utf8View utf8_3 { invalid_utf8_3 };
77 EXPECT(!utf8_3.validate());
78
79 char invalid_utf8_4[] = { (char)208, 35, 0 };
80 Utf8View utf8_4 { invalid_utf8_4 };
81 EXPECT(!utf8_4.validate());
82}
83
// Test-suite entry point, named "UTF8".
// NOTE(review): presumably TEST_MAIN (from AK/TestSuite.h) expands to the
// program's main() and runs every TEST_CASE above - confirm against the header.
TEST_MAIN(UTF8)