1d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien/*
2d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * Copyright (C) 2015 The Android Open Source Project
3d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien *
4d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * Licensed under the Apache License, Version 2.0 (the "License");
5d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * you may not use this file except in compliance with the License.
6d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * You may obtain a copy of the License at
7d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien *
8d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien *      http://www.apache.org/licenses/LICENSE-2.0
9d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien *
10d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * Unless required by applicable law or agreed to in writing, software
11d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * distributed under the License is distributed on an "AS IS" BASIS,
12d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * See the License for the specific language governing permissions and
14d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien * limitations under the License.
15d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien */
16d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
171d461589869ee5b7102f96271b0ef0a776ab513cSeigo Nonaka#include "minikin/GraphemeBreak.h"
181d461589869ee5b7102f96271b0ef0a776ab513cSeigo Nonaka
191d461589869ee5b7102f96271b0ef0a776ab513cSeigo Nonaka#include <vector>
201d461589869ee5b7102f96271b0ef0a776ab513cSeigo Nonaka
21d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien#include <gtest/gtest.h>
221d461589869ee5b7102f96271b0ef0a776ab513cSeigo Nonaka
231d461589869ee5b7102f96271b0ef0a776ab513cSeigo Nonaka#include "UnicodeUtils.h"
24d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
2514e2d136aaef271ba131f917cf5f27baa31ae5adSeigo Nonakanamespace minikin {
26d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
27d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levienbool IsBreak(const char* src) {
28d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    const size_t BUF_SIZE = 256;
29d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    uint16_t buf[BUF_SIZE];
30d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    size_t offset;
31d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    size_t size;
32d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    ParseUnicode(buf, BUF_SIZE, src, &size, &offset);
33b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    return GraphemeBreak::isGraphemeBreak(nullptr, buf, 0, size, offset);
34b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader}
35b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader
36b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournaderbool IsBreakWithAdvances(const float* advances, const char* src) {
37b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    const size_t BUF_SIZE = 256;
38b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    uint16_t buf[BUF_SIZE];
39b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    size_t offset;
40b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    size_t size;
41b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    ParseUnicode(buf, BUF_SIZE, src, &size, &offset);
42b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    return GraphemeBreak::isGraphemeBreak(advances, buf, 0, size, offset);
43d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien}
44d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
45d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph LevienTEST(GraphemeBreak, utf16) {
46d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+D83C | U+DC31"));  // emoji, U+1F431
47d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
48d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // tests for invalid UTF-16
49d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+D800 | U+D800"));  // two leading surrogates
50d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+DC00 | U+DC00"));  // two trailing surrogates
516c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' | U+D800"));     // lonely leading surrogate
526c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+DC00 | 'a'"));     // lonely trailing surrogate
536c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+D800 | 'a'"));     // leading surrogate followed by non-surrogate
546c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' | U+DC00"));     // non-surrogate followed by trailing surrogate
55d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien}
56d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
57d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph LevienTEST(GraphemeBreak, rules) {
58d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB1, sot ÷; Rule GB2, ÷ eot
59d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("| 'a'"));
60d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("'a' |"));
61d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
62d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB3, CR x LF
63d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+000D | U+000A"));  // CR x LF
64d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
65d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB4, (Control | CR | LF) ÷
66d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("'a' | U+2028"));  // Line separator
67d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("'a' | U+000D"));  // LF
68d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("'a' | U+000A"));  // CR
69d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
70d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB5, ÷ (Control | CR | LF)
71d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+2028 | 'a'"));  // Line separator
72d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+000D | 'a'"));  // LF
73d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+000A | 'a'"));  // CR
74d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
75d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB6, L x ( L | V | LV | LVT )
76d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+1100 | U+1100"));  // L x L
77d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+1100 | U+1161"));  // L x V
78d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+1100 | U+AC00"));  // L x LV
79d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+1100 | U+AC01"));  // L x LVT
80d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
81d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB7, ( LV | V ) x ( V | T )
82d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+AC00 | U+1161"));  // LV x V
83d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+1161 | U+1161"));  // V x V
84d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+AC00 | U+11A8"));  // LV x T
85d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+1161 | U+11A8"));  // V x T
86d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
87d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB8, ( LVT | T ) x T
88d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+AC01 | U+11A8"));  // LVT x T
89d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+11A8 | U+11A8"));  // T x T
90d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
91d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Other hangul pairs not counted above _are_ breaks (GB10)
92d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+AC00 | U+1100"));  // LV x L
93d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+AC01 | U+1100"));  // LVT x L
94d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+11A8 | U+1100"));  // T x L
95d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+11A8 | U+AC00"));  // T x LV
96d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+11A8 | U+AC01"));  // T x LVT
97d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
9893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Rule GB12 and Rule GB13, Regional_Indicator x Regional_Indicator
99d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+1F1FA | U+1F1F8"));
1006c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+1F1FA U+1F1F8 | U+1F1FA U+1F1F8"));   // Regional indicator pair (flag)
1016c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F1FA | U+1F1F8 U+1F1FA U+1F1F8"));  // Regional indicator pair (flag)
1026c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F1FA U+1F1F8 U+1F1FA | U+1F1F8"));  // Regional indicator pair (flag)
103450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka
1046c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+1F1FA U+1F1F8 | U+1F1FA"));   // Regional indicator pair (flag)
105450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F1FA | U+1F1F8 U+1F1FA"));  // Regional indicator pair (flag)
10693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Same case as the two above, knowing that the first two characters ligate, which is what
10793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // would typically happen.
1086c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    const float firstPairLigated[] = {1.0, 0.0, 0.0, 0.0, 1.0, 0.0};  // Two entries per codepoint
10993e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(firstPairLigated, "U+1F1FA U+1F1F8 | U+1F1FA"));
11093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(firstPairLigated, "U+1F1FA | U+1F1F8 U+1F1FA"));
11193e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Repeat the tests, But now the font doesn't have a ligature for the first two characters,
11293e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // while it does have a ligature for the last two. This could happen for fonts that do not
11393e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // support some (potentially encoded later than they were developed) flags.
11493e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float secondPairLigated[] = {1.0, 0.0, 1.0, 0.0, 0.0, 0.0};
11593e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(secondPairLigated, "U+1F1FA U+1F1F8 | U+1F1FA"));
11693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(secondPairLigated, "U+1F1FA | U+1F1F8 U+1F1FA"));
117450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka
1186c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' U+1F1FA U+1F1F8 | U+1F1FA"));   // Regional indicator pair (flag)
119450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka    EXPECT_FALSE(IsBreak("'a' U+1F1FA | U+1F1F8 U+1F1FA"));  // Regional indicator pair (flag)
120450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka
121450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka    EXPECT_TRUE(
122450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka            IsBreak("'a' U+1F1FA U+1F1F8 | U+1F1FA U+1F1F8"));  // Regional indicator pair (flag)
123450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka    EXPECT_FALSE(
124450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka            IsBreak("'a' U+1F1FA | U+1F1F8 U+1F1FA U+1F1F8"));  // Regional indicator pair (flag)
125450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka    EXPECT_FALSE(
126450e96c8170c3d59a5896e734c90d3f9def505f8Seigo Nonaka            IsBreak("'a' U+1F1FA U+1F1F8 U+1F1FA | U+1F1F8"));  // Regional indicator pair (flag)
127d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
12893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Rule GB9, x (Extend | ZWJ)
129d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("'a' | U+0301"));  // combining accent
13093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreak("'a' | U+200D"));  // ZWJ
131d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB9a, x SpacingMark
132d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+0915 | U+093E"));  // KA, AA (spacing mark)
133d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // Rule GB9b, Prepend x
134d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // see tailoring test for prepend, as current ICU doesn't have any characters in the class
135d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
13693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Rule GB999, Any ÷ Any
137d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("'a' | 'b'"));
1386c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("'f' | 'i'"));              // probable ligature
1396c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+0644 | U+0627"));        // probable ligature, lam + alef
1406c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+4E00 | U+4E00"));        // CJK ideographs
141d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("'a' | U+1F1FA U+1F1F8"));  // Regional indicator pair (flag)
142d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+1F1FA U+1F1F8 | 'a'"));  // Regional indicator pair (flag)
143e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka
144e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // Extended rule for emoji tag sequence.
145e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' | U+1F3F4 'a'"));
146e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' U+1F3F4 | 'a'"));
147e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka
148e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // Immediate tag_term after tag_base.
149e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' | U+1F3F4 U+E007F 'a'"));
150e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F3F4 | U+E007F"));
151e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' U+1F3F4 U+E007F | 'a'"));
152e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka
153e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // Flag sequence
154e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+1F3F4 U+E0067 U+E0062 U+E0073 U+E0063 U+E0074 U+E007F is emoji tag sequence for the flag
155e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // of Scotland.
156e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+1F3F4 is WAVING BLACK FLAG. This can be a tag_base character.
157e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+E0067 is TAG LATIN SMALL LETTER G. This can be a part of tag_spec.
158e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+E0062 is TAG LATIN SMALL LETTER B. This can be a part of tag_spec.
159e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+E0073 is TAG LATIN SMALL LETTER S. This can be a part of tag_spec.
160e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+E0063 is TAG LATIN SMALL LETTER C. This can be a part of tag_spec.
161e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+E0074 is TAG LATIN SMALL LETTER T. This can be a part of tag_spec.
162e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    // U+E007F is CANCEL TAG. This is a tag_term character.
163e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_TRUE(IsBreak("'a' | U+1F3F4 U+E0067 U+E0062 U+E0073 U+E0063 U+E0074 U+E007F"));
164e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F3F4 | U+E0067 U+E0062 U+E0073 U+E0063 U+E0074 U+E007F"));
165e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F3F4 U+E0067 | U+E0062 U+E0073 U+E0063 U+E0074 U+E007F"));
166e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F3F4 U+E0067 U+E0062 | U+E0073 U+E0063 U+E0074 U+E007F"));
167e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F3F4 U+E0067 U+E0062 U+E0073 | U+E0063 U+E0074 U+E007F"));
168e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F3F4 U+E0067 U+E0062 U+E0073 U+E0063 | U+E0074 U+E007F"));
169e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F3F4 U+E0067 U+E0062 U+E0073 U+E0063 U+E0074 | U+E007F"));
170e05034f356a4a1e6ad0e7b57a1992e87304f24a7Seigo Nonaka    EXPECT_TRUE(IsBreak("U+1F3F4 U+E0067 U+E0062 U+E0073 U+E0063 U+E0074 U+E007F | 'a'"));
171d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien}
172d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
173d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph LevienTEST(GraphemeBreak, tailoring) {
174d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // control characters that we interpret as "extend"
1756c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("'a' | U+00AD"));   // soft hyphen
1766c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("'a' | U+200B"));   // zwsp
1776c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("'a' | U+200E"));   // lrm
1786c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("'a' | U+202A"));   // lre
179d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("'a' | U+E0041"));  // tag character
180d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
181d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // UTC-approved characters for the Prepend class
182d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+06DD | U+0661"));  // arabic subtending mark + digit one
183d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
184d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_TRUE(IsBreak("U+0E01 | U+0E33"));  // Thai sara am
185d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
186d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    // virama is not a grapheme break, but "pure killer" is
187d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+0915 | U+094D U+0915"));  // Devanagari ka+virama+ka
188d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+0915 U+094D | U+0915"));  // Devanagari ka+virama+ka
189d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien    EXPECT_FALSE(IsBreak("U+0E01 | U+0E3A U+0E01"));  // thai phinthu = pure killer
1906c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+0E01 U+0E3A | U+0E01"));   // thai phinthu = pure killer
1916638e05ac2de397455c30cae05aca399a567428dRaph Levien
192b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    // Repetition of above tests, but with a given advances array that implies everything
193b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    // became just one cluster.
194b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    const float conjoined[] = {1.0, 0.0, 0.0};
195b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(conjoined,
1966c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                     "U+0915 | U+094D U+0915"));  // Devanagari ka+virama+ka
197b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(conjoined,
1986c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                     "U+0915 U+094D | U+0915"));  // Devanagari ka+virama+ka
199b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(conjoined,
2006c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                     "U+0E01 | U+0E3A U+0E01"));  // thai phinthu = pure killer
201b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(conjoined,
2026c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                    "U+0E01 U+0E3A | U+0E01"));  // thai phinthu = pure killer
203b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader
204b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    // Repetition of above tests, but with a given advances array that the virama did not
205b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    // form a cluster with the following consonant. The difference is that there is now
206b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    // a grapheme break after the virama in ka+virama+ka.
207b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    const float separate[] = {1.0, 0.0, 1.0};
208b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(separate,
2096c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                     "U+0915 | U+094D U+0915"));  // Devanagari ka+virama+ka
210b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(separate,
2116c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                    "U+0915 U+094D | U+0915"));  // Devanagari ka+virama+ka
212b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(separate,
2136c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                     "U+0E01 | U+0E3A U+0E01"));  // thai phinthu = pure killer
214b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(separate,
2156c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka                                    "U+0E01 U+0E3A | U+0E01"));  // thai phinthu = pure killer
216b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader
21793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // suppress grapheme breaks in zwj emoji sequences
2186638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F469 U+200D | U+2764 U+FE0F U+200D U+1F48B U+200D U+1F468"));
2196638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F469 U+200D U+2764 U+FE0F U+200D | U+1F48B U+200D U+1F468"));
2206638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F469 U+200D U+2764 U+FE0F U+200D U+1F48B U+200D | U+1F468"));
2216638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F468 U+200D | U+1F469 U+200D U+1F466"));
2226638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F468 U+200D U+1F469 U+200D | U+1F466"));
2236638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F469 U+200D | U+1F469 U+200D U+1F467 U+200D U+1F466"));
2246638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F469 U+200D U+1F469 U+200D | U+1F467 U+200D U+1F466"));
2256638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F469 U+200D U+1F469 U+200D U+1F467 U+200D | U+1F466"));
2266638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_FALSE(IsBreak("U+1F441 U+200D | U+1F5E8"));
2276638e05ac2de397455c30cae05aca399a567428dRaph Levien
22877f488345316fba46c271fc04bea470819ae1712Seigo Nonaka    // Do not break before and after zwj with all kind of emoji characters.
22977f488345316fba46c271fc04bea470819ae1712Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F431 | U+200D U+1F464"));
23077f488345316fba46c271fc04bea470819ae1712Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F431 U+200D | U+1F464"));
23177f488345316fba46c271fc04bea470819ae1712Seigo Nonaka
2326638e05ac2de397455c30cae05aca399a567428dRaph Levien    // ARABIC LETTER BEH + ZWJ + heart, not a zwj emoji sequence, so we preserve the break
2336638e05ac2de397455c30cae05aca399a567428dRaph Levien    EXPECT_TRUE(IsBreak("U+0628 U+200D | U+2764"));
234d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien}
235d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien
236adfa580f1f067c846509b4346e5be2cb19177c1bRaph LevienTEST(GraphemeBreak, emojiModifiers) {
2376c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("U+261D | U+1F3FB"));   // white up pointing index + modifier
2386c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_FALSE(IsBreak("U+270C | U+1F3FB"));   // victory hand + modifier
239adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+1F466 | U+1F3FB"));  // boy + modifier
240adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+1F466 | U+1F3FC"));  // boy + modifier
241adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+1F466 | U+1F3FD"));  // boy + modifier
242adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+1F466 | U+1F3FE"));  // boy + modifier
243adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+1F466 | U+1F3FF"));  // boy + modifier
244adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+1F918 | U+1F3FF"));  // sign of the horns + modifier
245adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+1F933 | U+1F3FF"));  // selfie (Unicode 9) + modifier
24693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Reptition of the tests above, with the knowledge that they are ligated.
24793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float ligated1_2[] = {1.0, 0.0, 0.0};
24893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float ligated2_2[] = {1.0, 0.0, 0.0, 0.0};
24993e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated1_2, "U+261D | U+1F3FB"));
25093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated1_2, "U+270C | U+1F3FB"));
25193e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated2_2, "U+1F466 | U+1F3FB"));
25293e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated2_2, "U+1F466 | U+1F3FC"));
25393e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated2_2, "U+1F466 | U+1F3FD"));
25493e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated2_2, "U+1F466 | U+1F3FE"));
25593e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated2_2, "U+1F466 | U+1F3FF"));
25693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated2_2, "U+1F918 | U+1F3FF"));
25793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated2_2, "U+1F933 | U+1F3FF"));
25893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Reptition of the tests above, with the knowledge that they are not ligated.
25993e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float unligated1_2[] = {1.0, 1.0, 0.0};
26093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float unligated2_2[] = {1.0, 0.0, 1.0, 0.0};
26193e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated1_2, "U+261D | U+1F3FB"));
26293e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated1_2, "U+270C | U+1F3FB"));
26393e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_2, "U+1F466 | U+1F3FB"));
26493e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_2, "U+1F466 | U+1F3FC"));
26593e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_2, "U+1F466 | U+1F3FD"));
26693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_2, "U+1F466 | U+1F3FE"));
26793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_2, "U+1F466 | U+1F3FF"));
26893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_2, "U+1F918 | U+1F3FF"));
26993e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_2, "U+1F933 | U+1F3FF"));
27093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader
27193e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // adding extend characters between emoji base and modifier doesn't affect grapheme cluster
27293e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreak("U+270C U+FE0E | U+1F3FB"));  // victory hand + text style + modifier
273adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_FALSE(IsBreak("U+270C U+FE0F | U+1F3FB"));  // heart + emoji style + modifier
27493e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Reptition of the two tests above, with the knowledge that they are ligated.
27593e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float ligated1_1_2[] = {1.0, 0.0, 0.0, 0.0};
27693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated1_1_2, "U+270C U+FE0E | U+1F3FB"));
27793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(ligated1_1_2, "U+270C U+FE0F | U+1F3FB"));
27893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // Reptition of the first two tests, with the knowledge that they are not ligated.
27993e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float unligated1_1_2[] = {1.0, 0.0, 1.0, 0.0};
28093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated1_1_2, "U+270C U+FE0E | U+1F3FB"));
28193e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated1_1_2, "U+270C U+FE0F | U+1F3FB"));
282adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien
283adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    // heart is not an emoji base
2846c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+2764 | U+1F3FB"));         // heart + modifier
285adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_TRUE(IsBreak("U+2764 U+FE0E | U+1F3FB"));  // heart + emoji style + modifier
286adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_TRUE(IsBreak("U+2764 U+FE0F | U+1F3FB"));  // heart + emoji style + modifier
2876c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    EXPECT_TRUE(IsBreak("U+1F3FB | U+1F3FB"));        // modifier + modifier
288adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien
289adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    // rat is not an emoji modifer
290adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien    EXPECT_TRUE(IsBreak("U+1F466 | U+1F400"));  // boy + rat
2911946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka}
2921946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka
2931946f48e84fd67943dd2d09b3fee94028fbfe762Seigo NonakaTEST(GraphemeBreak, genderBalancedEmoji) {
2941946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka    // U+1F469 is WOMAN, U+200D is ZWJ, U+1F4BC is BRIEFCASE.
2951946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F469 | U+200D U+1F4BC"));
2961946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F469 U+200D | U+1F4BC"));
29793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // The above two cases, when the ligature is not supported in the font. We now expect a break
29893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // between them.
29993e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float unligated2_1_2[] = {1.0, 0.0, 0.0, 1.0, 0.0};
30093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(unligated2_1_2, "U+1F469 | U+200D U+1F4BC"));
30193e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_1_2, "U+1F469 U+200D | U+1F4BC"));
3021946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka
3031946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka    // U+2695 has now emoji property, so should be part of ZWJ sequence.
3041946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F469 | U+200D U+2695"));
3051946f48e84fd67943dd2d09b3fee94028fbfe762Seigo Nonaka    EXPECT_FALSE(IsBreak("U+1F469 U+200D | U+2695"));
30693e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // The above two cases, when the ligature is not supported in the font. We now expect a break
30793e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    // between them.
30893e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    const float unligated2_1_1[] = {1.0, 0.0, 0.0, 1.0};
30993e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_FALSE(IsBreakWithAdvances(unligated2_1_1, "U+1F469 | U+200D U+2695"));
31093e9c9f71e7cb418287a0acc8d188e385ba11e43Roozbeh Pournader    EXPECT_TRUE(IsBreakWithAdvances(unligated2_1_1, "U+1F469 U+200D | U+2695"));
311adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien}
312adfa580f1f067c846509b4346e5be2cb19177c1bRaph Levien
313d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph LevienTEST(GraphemeBreak, offsets) {
3146c8722e217ff5238f0b849152d7936959a728103Seigo Nonaka    uint16_t string[] = {0x0041, 0x06DD, 0x0045, 0x0301, 0x0049, 0x0301};
315b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_TRUE(GraphemeBreak::isGraphemeBreak(nullptr, string, 2, 3, 2));
316b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_FALSE(GraphemeBreak::isGraphemeBreak(nullptr, string, 2, 3, 3));
317b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_TRUE(GraphemeBreak::isGraphemeBreak(nullptr, string, 2, 3, 4));
318b01028d1d7bc3906ef71c72ad985919f79304b5eRoozbeh Pournader    EXPECT_TRUE(GraphemeBreak::isGraphemeBreak(nullptr, string, 2, 3, 5));
319d8dd94b81ea7efd776859fbbdf4a76458e270eabRaph Levien}
32014e2d136aaef271ba131f917cf5f27baa31ae5adSeigo Nonaka
32114e2d136aaef271ba131f917cf5f27baa31ae5adSeigo Nonaka}  // namespace minikin
322