FontCollection.cpp revision 6d9dcd2cf3d3ed26a886e02d94c907311e7b1f83
/*
 * Copyright (C) 2013 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
169cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
17ecc2d34ac23a497988f21e5f415b53c007b9d8c5Raph Levien// #define VERBOSE_DEBUG
18ecc2d34ac23a497988f21e5f415b53c007b9d8c5Raph Levien
19ecc2d34ac23a497988f21e5f415b53c007b9d8c5Raph Levien#define LOG_TAG "Minikin"
20ecc2d34ac23a497988f21e5f415b53c007b9d8c5Raph Levien#include <cutils/log.h>
219cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
22997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien#include "unicode/unistr.h"
23997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien#include "unicode/unorm2.h"
24997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien
256d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka#include "FontLanguageListCache.h"
26c31e3883456e018d742e9f29815ba5ff8b315ea1Raph Levien#include "MinikinInternal.h"
279cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#include <minikin/FontCollection.h>
289cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
299cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levienusing std::vector;
309cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
319cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Leviennamespace android {
329cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
// Returns the greater of the two arguments as decided by operator>; when
// neither compares greater than the other, the second argument is returned.
template <typename T>
static inline T max(T a, T b) {
    if (a > b) {
        return a;
    }
    return b;
}
379cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
384d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levienuint32_t FontCollection::sNextId = 0;
394d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien
409cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph LevienFontCollection::FontCollection(const vector<FontFamily*>& typefaces) :
419cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    mMaxChar(0) {
42c31e3883456e018d742e9f29815ba5ff8b315ea1Raph Levien    AutoMutex _l(gMinikinLock);
434d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien    mId = sNextId++;
449cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    vector<uint32_t> lastChar;
459cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    size_t nTypefaces = typefaces.size();
469cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#ifdef VERBOSE_DEBUG
47bae347682989d2627081310129a5b60541ed6ad0Seigo Nonaka    ALOGD("nTypefaces = %zd\n", nTypefaces);
489cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#endif
499cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    const FontStyle defaultStyle;
509cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    for (size_t i = 0; i < nTypefaces; i++) {
519cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        FontFamily* family = typefaces[i];
529a5f713add8cfb91ac2c9ed5c917309053201ab6Raph Levien        MinikinFont* typeface = family->getClosestMatch(defaultStyle).font;
534d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien        if (typeface == NULL) {
544d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien            continue;
554d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien        }
56bd36ec766a451c62ffdd407d5ce1a355e8f7dfd8Raph Levien        family->RefLocked();
5713f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien        const SparseBitSet* coverage = family->getCoverage();
58cb20a2f0b366bfc16db3a489a60156dec7a9fe21Andreas Gampe        if (coverage == nullptr) {
59cb20a2f0b366bfc16db3a489a60156dec7a9fe21Andreas Gampe            family->UnrefLocked();
60cb20a2f0b366bfc16db3a489a60156dec7a9fe21Andreas Gampe            continue;
61cb20a2f0b366bfc16db3a489a60156dec7a9fe21Andreas Gampe        }
62cb20a2f0b366bfc16db3a489a60156dec7a9fe21Andreas Gampe        mFamilies.push_back(family);  // emplace_back would be better
6313f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien        mMaxChar = max(mMaxChar, coverage->length());
6413f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien        lastChar.push_back(coverage->nextSetBit(0));
659cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    }
6613f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien    nTypefaces = mFamilies.size();
67156acb18f53b32655abb34166ea737e4320ca366Raph Levien    LOG_ALWAYS_FATAL_IF(nTypefaces == 0,
68156acb18f53b32655abb34166ea737e4320ca366Raph Levien        "Font collection must have at least one valid typeface");
6972fe9422c869b7878240a23e4650d9d90edb1c2aRaph Levien    size_t nPages = (mMaxChar + kPageMask) >> kLogCharsPerPage;
709cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    size_t offset = 0;
7180d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    // TODO: Use variation selector map for mRanges construction.
7280d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    // A font can have a glyph for a base code point and variation selector pair but no glyph for
7380d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    // the base code point without variation selector. The family won't be listed in the range in
7480d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    // this case.
759cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    for (size_t i = 0; i < nPages; i++) {
769cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        Range dummy;
779cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        mRanges.push_back(dummy);
789cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        Range* range = &mRanges.back();
799cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#ifdef VERBOSE_DEBUG
80bae347682989d2627081310129a5b60541ed6ad0Seigo Nonaka        ALOGD("i=%zd: range start = %zd\n", i, offset);
819cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#endif
829cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        range->start = offset;
839cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        for (size_t j = 0; j < nTypefaces; j++) {
849cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien            if (lastChar[j] < (i + 1) << kLogCharsPerPage) {
8513f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                FontFamily* family = mFamilies[j];
8613f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                mFamilyVec.push_back(family);
879cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien                offset++;
8813f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                uint32_t nextChar = family->getCoverage()->nextSetBit((i + 1) << kLogCharsPerPage);
899cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#ifdef VERBOSE_DEBUG
90bae347682989d2627081310129a5b60541ed6ad0Seigo Nonaka                ALOGD("nextChar = %d (j = %zd)\n", nextChar, j);
919cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#endif
929cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien                lastChar[j] = nextChar;
939cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien            }
949cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        }
959cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        range->end = offset;
969cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    }
979cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien}
989cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
999cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph LevienFontCollection::~FontCollection() {
10013f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien    for (size_t i = 0; i < mFamilies.size(); i++) {
10113f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien        mFamilies[i]->UnrefLocked();
1029cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    }
1039cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien}
1049cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
1057b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien// Implement heuristic for choosing best-match font. Here are the rules:
1067b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien// 1. If first font in the collection has the character, it wins.
1077b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien// 2. If a font matches both language and script, it gets a score of 4.
1087b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien// 3. If a font matches just language, it gets a score of 2.
1097b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien// 4. Matching the "compact" or "elegant" variant adds one to the score.
110369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka// 5. If there is a variation selector and a font supports the complete variation sequence, we add
111369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka//    12 to the score.
112369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka// 6. If there is a color variation selector (U+FE0F), we add 6 to the score if the font is an emoji
113369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka//    font. This additional score of 6 is only given if the base character is supported in the font,
114369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka//    but not the whole variation sequence.
115369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka// 7. If there is a text variation selector (U+FE0E), we add 6 to the score if the font is not an
116369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka//    emoji font. This additional score of 6 is only given if the base character is supported in the
117369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka//    font, but not the whole variation sequence.
118369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka// 8. Highest score wins, with ties resolved to the first font.
119bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo NonakaFontFamily* FontCollection::getFamilyForChar(uint32_t ch, uint32_t vs,
1206d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka            uint32_t langListId, int variant) const {
1219cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    if (ch >= mMaxChar) {
1229cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        return NULL;
1239cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    }
124fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka
1256d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka    const FontLanguages& langList = FontLanguageListCache::getById(langListId);
1266d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka    // TODO: use all languages in langList.
1276d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka    const FontLanguage lang = (langList.size() == 0) ? FontLanguage() : langList[0];
1286d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka
129fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    // Even if the font supports variation sequence, mRanges isn't aware of the base character of
130fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    // the sequence. Search all FontFamilies if variation sequence is specified.
131fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    // TODO: Always use mRanges for font search.
132fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    const std::vector<FontFamily*>& familyVec = (vs == 0) ? mFamilyVec : mFamilies;
133fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    Range range;
134fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    if (vs == 0) {
135fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka        range = mRanges[ch >> kLogCharsPerPage];
136fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    } else {
137fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka        range = { 0, mFamilies.size() };
138fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka    }
139fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka
1409cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#ifdef VERBOSE_DEBUG
141bae347682989d2627081310129a5b60541ed6ad0Seigo Nonaka    ALOGD("querying range %zd:%zd\n", range.start, range.end);
1429cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien#endif
143bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    FontFamily* bestFamily = nullptr;
1447b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien    int bestScore = -1;
1459cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    for (size_t i = range.start; i < range.end; i++) {
146fc119c68f5def1e44e65ae4cdd147c01d62c9ad2Seigo Nonaka        FontFamily* family = familyVec[i];
147369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka        const bool hasVSGlyph = (vs != 0) && family->hasVariationSelector(ch, vs);
148369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka        if (hasVSGlyph || family->getCoverage()->get(ch)) {
149369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka            if ((vs == 0 || hasVSGlyph) && mFamilies[0] == family) {
150369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka                // If the first font family in collection supports the given character or sequence,
151369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka                // always use it.
15213f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                return family;
1537b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien            }
1547b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien            int score = lang.match(family->lang()) * 2;
15590a09c3f36d98530822392446884b8af68035908Raph Levien            if (family->variant() == 0 || family->variant() == variant) {
1567b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien                score++;
1577b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien            }
158369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka            if (hasVSGlyph) {
159369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka                score += 12;
160369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka            } else if (((vs == 0xFE0F) && family->lang().hasEmojiFlag()) ||
161369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka                    ((vs == 0xFE0E) && !family->lang().hasEmojiFlag())) {
162369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka                score += 6;
163369d2d44cb09ac4346cdd9e3b131bb173d764f88Seigo Nonaka            }
1647b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien            if (score > bestScore) {
1657b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien                bestScore = score;
16613f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                bestFamily = family;
1677b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien            }
1689cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        }
1699cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    }
1706d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka    if (bestFamily == nullptr && vs != 0) {
1716d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka        // If no fonts support the codepoint and variation selector pair,
1726d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka        // fallback to select a font family that supports just the base
1736d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka        // character, ignoring the variation selector.
1746d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka        return getFamilyForChar(ch, 0, langListId, variant);
1756d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka    }
176bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    if (bestFamily == nullptr && !mFamilyVec.empty()) {
177997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien        UErrorCode errorCode = U_ZERO_ERROR;
178997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien        const UNormalizer2* normalizer = unorm2_getNFDInstance(&errorCode);
179997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien        if (U_SUCCESS(errorCode)) {
180997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien            UChar decomposed[4];
181997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien            int len = unorm2_getRawDecomposition(normalizer, ch, decomposed, 4, &errorCode);
182997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien            if (U_SUCCESS(errorCode) && len > 0) {
183997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien                int off = 0;
184997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien                U16_NEXT_UNSAFE(decomposed, off, ch);
1856d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka                return getFamilyForChar(ch, vs, langListId, variant);
186997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien            }
187997c799e3ec6bf8adf687e29670d23d91e0f5feeRaph Levien        }
18813f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien        bestFamily = mFamilies[0];
189156acb18f53b32655abb34166ea737e4320ca366Raph Levien    }
19013f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien    return bestFamily;
1919cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien}
1929cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
const uint32_t NBSP = 0xa0;
const uint32_t ZWNJ = 0x200c;  // U+200C ZERO WIDTH NON-JOINER
const uint32_t ZWJ = 0x200d;   // U+200D ZERO WIDTH JOINER
const uint32_t KEYCAP = 0x20e3;
const uint32_t HYPHEN = 0x2010;
const uint32_t NB_HYPHEN = 0x2011;

// Characters where we want to continue using existing font run instead of
// recomputing the best match in the fallback list.
static const uint32_t stickyWhitelist[] = { '!', ',', '-', '.', ':', ';', '?', NBSP, ZWJ, ZWNJ,
        KEYCAP, HYPHEN, NB_HYPHEN };

// Returns true when c is one of the code points listed in stickyWhitelist.
static bool isStickyWhitelisted(uint32_t c) {
    for (const uint32_t sticky : stickyWhitelist) {
        if (sticky == c) {
            return true;
        }
    }
    return false;
}
211bb601b67dd05947f92cc23092bfb8a059c2e3377Raph Levien
// Returns true when c lies in one of the two inclusive ranges U+FE00..U+FE0F or
// U+E0100..U+E01EF.
static bool isVariationSelector(uint32_t c) {
    const bool inBasicRange = (0xFE00 <= c) && (c <= 0xFE0F);
    const bool inSupplementRange = (0xE0100 <= c) && (c <= 0xE01EF);
    return inBasicRange || inSupplementRange;
}
215bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka
21680d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonakabool FontCollection::hasVariationSelector(uint32_t baseCodepoint,
21780d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka        uint32_t variationSelector) const {
21880d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    if (!isVariationSelector(variationSelector)) {
21980d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka        return false;
22080d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    }
22180d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    if (baseCodepoint >= mMaxChar) {
22280d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka        return false;
22380d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    }
22480d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    // Currently mRanges can not be used here since it isn't aware of the variation sequence.
22580d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    // TODO: Use mRanges for narrowing down the search range.
22680d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    for (size_t i = 0; i < mFamilies.size(); i++) {
22780d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka        if (mFamilies[i]->hasVariationSelector(baseCodepoint, variationSelector)) {
22880d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka          return true;
22980d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka        }
23080d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    }
23180d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka    return false;
23280d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka}
23380d113bcd4bbc395218503354af1a5a6dba59b4bSeigo Nonaka
2349cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levienvoid FontCollection::itemize(const uint16_t *string, size_t string_size, FontStyle style,
2359cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        vector<Run>* result) const {
2366d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka    const uint32_t langListId = style.getLanguageListId();
2377b221d97b7b64dc5ce457e19666d55d042e22e62Raph Levien    int variant = style.getVariant();
23813f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien    FontFamily* lastFamily = NULL;
2399cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien    Run* run = NULL;
240bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka
241bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    if (string_size == 0) {
242bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        return;
243bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    }
244bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka
245bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    const uint32_t kEndOfString = 0xFFFFFFFF;
246bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka
247bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    uint32_t nextCh = 0;
248bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    uint32_t prevCh = 0;
249bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    size_t nextUtf16Pos = 0;
250bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    size_t readLength = 0;
251bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    U16_NEXT(string, readLength, string_size, nextCh);
252bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka
253bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    do {
254bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        const uint32_t ch = nextCh;
255bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        const size_t utf16Pos = nextUtf16Pos;
256bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        nextUtf16Pos = readLength;
257bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        if (readLength < string_size) {
258bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka            U16_NEXT(string, readLength, string_size, nextCh);
259bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        } else {
260bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka            nextCh = kEndOfString;
261bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        }
262bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka
263bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        bool shouldContinueRun = false;
264bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        if (lastFamily != nullptr) {
265bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka            if (isStickyWhitelisted(ch)) {
266bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka                // Continue using existing font as long as it has coverage and is whitelisted
267bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka                shouldContinueRun = lastFamily->getCoverage()->get(ch);
268bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka            } else if (isVariationSelector(ch)) {
269bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka                // Always continue if the character is a variation selector.
270bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka                shouldContinueRun = true;
2719cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien            }
2729cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        }
273bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka
274bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        if (!shouldContinueRun) {
2756d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka            FontFamily* family = getFamilyForChar(ch, isVariationSelector(nextCh) ? nextCh : 0,
2766d9dcd2cf3d3ed26a886e02d94c907311e7b1f83Seigo Nonaka                    langListId, variant);
277bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka            if (utf16Pos == 0 || family != lastFamily) {
278bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka                size_t start = utf16Pos;
279f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                // Workaround for Emoji keycap until we implement per-cluster font
280f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                // selection: if keycap is found in a different font that also
281f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                // supports previous char, attach previous char to the new run.
282f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                // Bug 7557244.
283bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka                if (ch == KEYCAP && utf16Pos != 0 && family && family->getCoverage()->get(prevCh)) {
2843dd8757fcf48976295bac566277b6da1046e8362Seigo Nonaka                    const size_t prevChLength = U16_LENGTH(prevCh);
2853dd8757fcf48976295bac566277b6da1046e8362Seigo Nonaka                    run->end -= prevChLength;
286f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                    if (run->start == run->end) {
287f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                        result->pop_back();
288f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                    }
2893dd8757fcf48976295bac566277b6da1046e8362Seigo Nonaka                    start -= prevChLength;
290f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                }
291066e8575af64fb452617ac6005de6ccf6509553bRaph Levien                Run dummy;
292066e8575af64fb452617ac6005de6ccf6509553bRaph Levien                result->push_back(dummy);
293066e8575af64fb452617ac6005de6ccf6509553bRaph Levien                run = &result->back();
29413f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                if (family == NULL) {
2959a5f713add8cfb91ac2c9ed5c917309053201ab6Raph Levien                    run->fakedFont.font = NULL;
296066e8575af64fb452617ac6005de6ccf6509553bRaph Levien                } else {
29713f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                    run->fakedFont = family->getClosestMatch(style);
298066e8575af64fb452617ac6005de6ccf6509553bRaph Levien                }
29913f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien                lastFamily = family;
300f952161b874fd2e9af474b9fd2ebcca1f3bb4555Behdad Esfahbod                run->start = start;
3019cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien            }
3029cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien        }
303bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        prevCh = ch;
304bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka        run->end = nextUtf16Pos;  // exclusive
305bbdd73ec077a1bb6801b25a639834be16dfd78cbSeigo Nonaka    } while (nextCh != kEndOfString);
3069cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien}
3079cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien
30889566f0ada1cafe673efa064cde38467990235d4Raph LevienMinikinFont* FontCollection::baseFont(FontStyle style) {
3099a5f713add8cfb91ac2c9ed5c917309053201ab6Raph Levien    return baseFontFaked(style).font;
3109a5f713add8cfb91ac2c9ed5c917309053201ab6Raph Levien}
3119a5f713add8cfb91ac2c9ed5c917309053201ab6Raph Levien
3129a5f713add8cfb91ac2c9ed5c917309053201ab6Raph LevienFakedFont FontCollection::baseFontFaked(FontStyle style) {
31313f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien    if (mFamilies.empty()) {
3149a5f713add8cfb91ac2c9ed5c917309053201ab6Raph Levien        return FakedFont();
31589566f0ada1cafe673efa064cde38467990235d4Raph Levien    }
31613f1aae02bacd475722bc8ea3fc2cf6abc1a82e3Raph Levien    return mFamilies[0]->getClosestMatch(style);
31789566f0ada1cafe673efa064cde38467990235d4Raph Levien}
31889566f0ada1cafe673efa064cde38467990235d4Raph Levien
3194d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levienuint32_t FontCollection::getId() const {
3204d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien    return mId;
3214d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien}
3224d4e6bc8118d15542f1f2a9218f0f7a91a29474fRaph Levien
3230f2a025d135f9ca52cc3cf917fffc29d6c126094Seigo Nonakavoid FontCollection::purgeFontFamilyHbFontCache() const {
3240f2a025d135f9ca52cc3cf917fffc29d6c126094Seigo Nonaka    assertMinikinLocked();
3250f2a025d135f9ca52cc3cf917fffc29d6c126094Seigo Nonaka    for (size_t i = 0; i < mFamilies.size(); ++i) {
3260f2a025d135f9ca52cc3cf917fffc29d6c126094Seigo Nonaka        mFamilies[i]->purgeHbFontCache();
3270f2a025d135f9ca52cc3cf917fffc29d6c126094Seigo Nonaka    }
3280f2a025d135f9ca52cc3cf917fffc29d6c126094Seigo Nonaka}
3290f2a025d135f9ca52cc3cf917fffc29d6c126094Seigo Nonaka
3309cc9bbe1461f359f0b27c5e7645c17dda001ab1dRaph Levien}  // namespace android
331