Serenity Operating System
at hosted 84 lines 3.1 kB view raw
1/* 2 * Copyright (c) 2019-2020, Sergey Bugaev <bugaevc@serenityos.org> 3 * All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions are met: 7 * 8 * 1. Redistributions of source code must retain the above copyright notice, this 9 * list of conditions and the following disclaimer. 10 * 11 * 2. Redistributions in binary form must reproduce the above copyright notice, 12 * this list of conditions and the following disclaimer in the documentation 13 * and/or other materials provided with the distribution. 14 * 15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" 16 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 18 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE 19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 22 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 23 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 24 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 25 */ 26 27#include <AK/TestSuite.h> 28 29#include <AK/Utf8View.h> 30 31TEST_CASE(decode_ascii) 32{ 33 Utf8View utf8 { "Hello World!11" }; 34 EXPECT(utf8.validate()); 35 36 u32 expected[] = { 72, 101, 108, 108, 111, 32, 87, 111, 114, 108, 100, 33, 49, 49 }; 37 size_t expected_size = sizeof(expected) / sizeof(expected[0]); 38 39 size_t i = 0; 40 for (u32 codepoint : utf8) { 41 ASSERT(i < expected_size); 42 EXPECT_EQ(codepoint, expected[i]); 43 i++; 44 } 45 EXPECT_EQ(i, expected_size); 46} 47 48TEST_CASE(decode_utf8) 49{ 50 Utf8View utf8 { "Привет, мир! 😀 γειά σου κόσμος こんにちは世界" }; 51 EXPECT(utf8.validate()); 52 53 u32 expected[] = { 1055, 1088, 1080, 1074, 1077, 1090, 44, 32, 1084, 1080, 1088, 33, 32, 128512, 32, 947, 949, 953, 940, 32, 963, 959, 965, 32, 954, 972, 963, 956, 959, 962, 32, 12371, 12435, 12395, 12385, 12399, 19990, 30028 }; 54 size_t expected_size = sizeof(expected) / sizeof(expected[0]); 55 56 size_t i = 0; 57 for (u32 codepoint : utf8) { 58 ASSERT(i < expected_size); 59 EXPECT_EQ(codepoint, expected[i]); 60 i++; 61 } 62 EXPECT_EQ(i, expected_size); 63} 64 65TEST_CASE(validate_invalid_ut8) 66{ 67 char invalid_utf8_1[] = { 42, 35, (char)182, 9, 0 }; 68 Utf8View utf8_1 { invalid_utf8_1 }; 69 EXPECT(!utf8_1.validate()); 70 71 char invalid_utf8_2[] = { 42, 35, (char)208, (char)208, 0 }; 72 Utf8View utf8_2 { invalid_utf8_2 }; 73 EXPECT(!utf8_2.validate()); 74 75 char invalid_utf8_3[] = { (char)208, 0 }; 76 Utf8View utf8_3 { invalid_utf8_3 }; 77 EXPECT(!utf8_3.validate()); 78 79 char invalid_utf8_4[] = { (char)208, 35, 0 }; 80 Utf8View utf8_4 { invalid_utf8_4 }; 81 EXPECT(!utf8_4.validate()); 82} 83 84TEST_MAIN(UTF8)