1//
2// Copyright 2006 The Android Open Source Project
3//
4// Build resource files from raw assets.
5//
6#include "StringPool.h"
7
8#include <utils/ByteOrder.h>
9#include <utils/SortedVector.h>
10
11#include <algorithm>
12
13#include "ResourceTable.h"
14
15// SSIZE: mingw does not have signed size_t == ssize_t.
16#if !defined(_WIN32)
17#  define SSIZE(x) x
18#else
19#  define SSIZE(x) (signed size_t)x
20#endif
21
22// Set to true for noisy debug output.
23static const bool kIsDebug = false;
24
25#if __cplusplus >= 201103L
26void strcpy16_htod(char16_t* dst, const char16_t* src)
27{
28    while (*src) {
29        char16_t s = htods(*src);
30        *dst++ = s;
31        src++;
32    }
33    *dst = 0;
34}
35#endif
36
37void strcpy16_htod(uint16_t* dst, const char16_t* src)
38{
39    while (*src) {
40        uint16_t s = htods(static_cast<uint16_t>(*src));
41        *dst++ = s;
42        src++;
43    }
44    *dst = 0;
45}
46
47void printStringPool(const ResStringPool* pool)
48{
49    if (pool->getError() == NO_INIT) {
50        printf("String pool is unitialized.\n");
51        return;
52    } else if (pool->getError() != NO_ERROR) {
53        printf("String pool is corrupt/invalid.\n");
54        return;
55    }
56
57    SortedVector<const void*> uniqueStrings;
58    const size_t N = pool->size();
59    for (size_t i=0; i<N; i++) {
60        size_t len;
61        if (pool->isUTF8()) {
62            uniqueStrings.add(pool->string8At(i, &len));
63        } else {
64            uniqueStrings.add(pool->stringAt(i, &len));
65        }
66    }
67
68    printf("String pool of " ZD " unique %s %s strings, " ZD " entries and "
69            ZD " styles using " ZD " bytes:\n",
70            (ZD_TYPE)uniqueStrings.size(), pool->isUTF8() ? "UTF-8" : "UTF-16",
71            pool->isSorted() ? "sorted" : "non-sorted",
72            (ZD_TYPE)N, (ZD_TYPE)pool->styleCount(), (ZD_TYPE)pool->bytes());
73
74    const size_t NS = pool->size();
75    for (size_t s=0; s<NS; s++) {
76        String8 str = pool->string8ObjectAt(s);
77        printf("String #" ZD ": %s\n", (ZD_TYPE) s, str.string());
78    }
79}
80
81String8 StringPool::entry::makeConfigsString() const {
82    String8 configStr(configTypeName);
83    if (configStr.size() > 0) configStr.append(" ");
84    if (configs.size() > 0) {
85        for (size_t j=0; j<configs.size(); j++) {
86            if (j > 0) configStr.append(", ");
87            configStr.append(configs[j].toString());
88        }
89    } else {
90        configStr = "(none)";
91    }
92    return configStr;
93}
94
95int StringPool::entry::compare(const entry& o) const {
96    // Strings with styles go first, to reduce the size of the styles array.
97    // We don't care about the relative order of these strings.
98    if (hasStyles) {
99        return o.hasStyles ? 0 : -1;
100    }
101    if (o.hasStyles) {
102        return 1;
103    }
104
105    // Sort unstyled strings by type, then by logical configuration.
106    int comp = configTypeName.compare(o.configTypeName);
107    if (comp != 0) {
108        return comp;
109    }
110    const size_t LHN = configs.size();
111    const size_t RHN = o.configs.size();
112    size_t i=0;
113    while (i < LHN && i < RHN) {
114        comp = configs[i].compareLogical(o.configs[i]);
115        if (comp != 0) {
116            return comp;
117        }
118        i++;
119    }
120    if (LHN < RHN) return -1;
121    else if (LHN > RHN) return 1;
122    return 0;
123}
124
125StringPool::StringPool(bool utf8) :
126        mUTF8(utf8), mValues(-1)
127{
128}
129
130ssize_t StringPool::add(const String16& value, const Vector<entry_style_span>& spans,
131        const String8* configTypeName, const ResTable_config* config)
132{
133    ssize_t res = add(value, false, configTypeName, config);
134    if (res >= 0) {
135        addStyleSpans(res, spans);
136    }
137    return res;
138}
139
140ssize_t StringPool::add(const String16& value,
141        bool mergeDuplicates, const String8* configTypeName, const ResTable_config* config)
142{
143    ssize_t vidx = mValues.indexOfKey(value);
144    ssize_t pos = vidx >= 0 ? mValues.valueAt(vidx) : -1;
145    ssize_t eidx = pos >= 0 ? mEntryArray.itemAt(pos) : -1;
146    if (eidx < 0) {
147        eidx = mEntries.add(entry(value));
148        if (eidx < 0) {
149            fprintf(stderr, "Failure adding string %s\n", String8(value).string());
150            return eidx;
151        }
152    }
153
154    if (configTypeName != NULL) {
155        entry& ent = mEntries.editItemAt(eidx);
156        if (kIsDebug) {
157            printf("*** adding config type name %s, was %s\n",
158                    configTypeName->string(), ent.configTypeName.string());
159        }
160        if (ent.configTypeName.size() <= 0) {
161            ent.configTypeName = *configTypeName;
162        } else if (ent.configTypeName != *configTypeName) {
163            ent.configTypeName = " ";
164        }
165    }
166
167    if (config != NULL) {
168        // Add this to the set of configs associated with the string.
169        entry& ent = mEntries.editItemAt(eidx);
170        size_t addPos;
171        for (addPos=0; addPos<ent.configs.size(); addPos++) {
172            int cmp = ent.configs.itemAt(addPos).compareLogical(*config);
173            if (cmp >= 0) {
174                if (cmp > 0) {
175                    if (kIsDebug) {
176                        printf("*** inserting config: %s\n", config->toString().string());
177                    }
178                    ent.configs.insertAt(*config, addPos);
179                }
180                break;
181            }
182        }
183        if (addPos >= ent.configs.size()) {
184            if (kIsDebug) {
185                printf("*** adding config: %s\n", config->toString().string());
186            }
187            ent.configs.add(*config);
188        }
189    }
190
191    const bool first = vidx < 0;
192    const bool styled = (pos >= 0 && (size_t)pos < mEntryStyleArray.size()) ?
193        mEntryStyleArray[pos].spans.size() : 0;
194    if (first || styled || !mergeDuplicates) {
195        pos = mEntryArray.add(eidx);
196        if (first) {
197            vidx = mValues.add(value, pos);
198        }
199        entry& ent = mEntries.editItemAt(eidx);
200        ent.indices.add(pos);
201    }
202
203    if (kIsDebug) {
204        printf("Adding string %s to pool: pos=%zd eidx=%zd vidx=%zd\n",
205                String8(value).string(), SSIZE(pos), SSIZE(eidx), SSIZE(vidx));
206    }
207
208    return pos;
209}
210
211status_t StringPool::addStyleSpan(size_t idx, const String16& name,
212                                  uint32_t start, uint32_t end)
213{
214    entry_style_span span;
215    span.name = name;
216    span.span.firstChar = start;
217    span.span.lastChar = end;
218    return addStyleSpan(idx, span);
219}
220
221status_t StringPool::addStyleSpans(size_t idx, const Vector<entry_style_span>& spans)
222{
223    const size_t N=spans.size();
224    for (size_t i=0; i<N; i++) {
225        status_t err = addStyleSpan(idx, spans[i]);
226        if (err != NO_ERROR) {
227            return err;
228        }
229    }
230    return NO_ERROR;
231}
232
233status_t StringPool::addStyleSpan(size_t idx, const entry_style_span& span)
234{
235    // Place blank entries in the span array up to this index.
236    while (mEntryStyleArray.size() <= idx) {
237        mEntryStyleArray.add();
238    }
239
240    entry_style& style = mEntryStyleArray.editItemAt(idx);
241    style.spans.add(span);
242    mEntries.editItemAt(mEntryArray[idx]).hasStyles = true;
243    return NO_ERROR;
244}
245
246StringPool::ConfigSorter::ConfigSorter(const StringPool& pool) : pool(pool)
247{
248}
249
250bool StringPool::ConfigSorter::operator()(size_t l, size_t r)
251{
252    const StringPool::entry& lhe = pool.mEntries[pool.mEntryArray[l]];
253    const StringPool::entry& rhe = pool.mEntries[pool.mEntryArray[r]];
254    return lhe.compare(rhe) < 0;
255}
256
257void StringPool::sortByConfig()
258{
259    LOG_ALWAYS_FATAL_IF(mOriginalPosToNewPos.size() > 0, "Can't sort string pool after already sorted.");
260
261    const size_t N = mEntryArray.size();
262
263    // This is a vector that starts out with a 1:1 mapping to entries
264    // in the array, which we will sort to come up with the desired order.
265    // At that point it maps from the new position in the array to the
266    // original position the entry appeared.
267    Vector<size_t> newPosToOriginalPos;
268    newPosToOriginalPos.setCapacity(N);
269    for (size_t i=0; i < N; i++) {
270        newPosToOriginalPos.add(i);
271    }
272
273    // Sort the array.
274    if (kIsDebug) {
275        printf("SORTING STRINGS BY CONFIGURATION...\n");
276    }
277    ConfigSorter sorter(*this);
278    std::sort(newPosToOriginalPos.begin(), newPosToOriginalPos.end(), sorter);
279    if (kIsDebug) {
280        printf("DONE SORTING STRINGS BY CONFIGURATION.\n");
281    }
282
283    // Create the reverse mapping from the original position in the array
284    // to the new position where it appears in the sorted array.  This is
285    // so that clients can re-map any positions they had previously stored.
286    mOriginalPosToNewPos = newPosToOriginalPos;
287    for (size_t i=0; i<N; i++) {
288        mOriginalPosToNewPos.editItemAt(newPosToOriginalPos[i]) = i;
289    }
290
291#if 0
292    SortedVector<entry> entries;
293
294    for (size_t i=0; i<N; i++) {
295        printf("#%d was %d: %s\n", i, newPosToOriginalPos[i],
296                mEntries[mEntryArray[newPosToOriginalPos[i]]].makeConfigsString().string());
297        entries.add(mEntries[mEntryArray[i]]);
298    }
299
300    for (size_t i=0; i<entries.size(); i++) {
301        printf("Sorted config #%d: %s\n", i,
302                entries[i].makeConfigsString().string());
303    }
304#endif
305
306    // Now we rebuild the arrays.
307    Vector<entry> newEntries;
308    Vector<size_t> newEntryArray;
309    Vector<entry_style> newEntryStyleArray;
310    DefaultKeyedVector<size_t, size_t> origOffsetToNewOffset;
311
312    for (size_t i=0; i<N; i++) {
313        // We are filling in new offset 'i'; oldI is where we can find it
314        // in the original data structure.
315        size_t oldI = newPosToOriginalPos[i];
316        // This is the actual entry associated with the old offset.
317        const entry& oldEnt = mEntries[mEntryArray[oldI]];
318        // This is the same entry the last time we added it to the
319        // new entry array, if any.
320        ssize_t newIndexOfOffset = origOffsetToNewOffset.indexOfKey(oldI);
321        size_t newOffset;
322        if (newIndexOfOffset < 0) {
323            // This is the first time we have seen the entry, so add
324            // it.
325            newOffset = newEntries.add(oldEnt);
326            newEntries.editItemAt(newOffset).indices.clear();
327        } else {
328            // We have seen this entry before, use the existing one
329            // instead of adding it again.
330            newOffset = origOffsetToNewOffset.valueAt(newIndexOfOffset);
331        }
332        // Update the indices to include this new position.
333        newEntries.editItemAt(newOffset).indices.add(i);
334        // And add the offset of the entry to the new entry array.
335        newEntryArray.add(newOffset);
336        // Add any old style to the new style array.
337        if (mEntryStyleArray.size() > 0) {
338            if (oldI < mEntryStyleArray.size()) {
339                newEntryStyleArray.add(mEntryStyleArray[oldI]);
340            } else {
341                newEntryStyleArray.add(entry_style());
342            }
343        }
344    }
345
346    // Now trim any entries at the end of the new style array that are
347    // not needed.
348    for (ssize_t i=newEntryStyleArray.size()-1; i>=0; i--) {
349        const entry_style& style = newEntryStyleArray[i];
350        if (style.spans.size() > 0) {
351            // That's it.
352            break;
353        }
354        // This one is not needed; remove.
355        newEntryStyleArray.removeAt(i);
356    }
357
358    // All done, install the new data structures and upate mValues with
359    // the new positions.
360    mEntries = newEntries;
361    mEntryArray = newEntryArray;
362    mEntryStyleArray = newEntryStyleArray;
363    mValues.clear();
364    for (size_t i=0; i<mEntries.size(); i++) {
365        const entry& ent = mEntries[i];
366        mValues.add(ent.value, ent.indices[0]);
367    }
368
369#if 0
370    printf("FINAL SORTED STRING CONFIGS:\n");
371    for (size_t i=0; i<mEntries.size(); i++) {
372        const entry& ent = mEntries[i];
373        printf("#" ZD " %s: %s\n", (ZD_TYPE)i, ent.makeConfigsString().string(),
374                String8(ent.value).string());
375    }
376#endif
377}
378
379sp<AaptFile> StringPool::createStringBlock()
380{
381    sp<AaptFile> pool = new AaptFile(String8(), AaptGroupEntry(),
382                                     String8());
383    status_t err = writeStringBlock(pool);
384    return err == NO_ERROR ? pool : NULL;
385}
386
387#define ENCODE_LENGTH(str, chrsz, strSize) \
388{ \
389    size_t maxMask = 1 << (((chrsz)*8)-1); \
390    size_t maxSize = maxMask-1; \
391    if ((strSize) > maxSize) { \
392        *(str)++ = maxMask | (((strSize)>>((chrsz)*8))&maxSize); \
393    } \
394    *(str)++ = strSize; \
395}
396
397status_t StringPool::writeStringBlock(const sp<AaptFile>& pool)
398{
399    // Allow appending.  Sorry this is a little wacky.
400    if (pool->getSize() > 0) {
401        sp<AaptFile> block = createStringBlock();
402        if (block == NULL) {
403            return UNKNOWN_ERROR;
404        }
405        ssize_t res = pool->writeData(block->getData(), block->getSize());
406        return (res >= 0) ? (status_t)NO_ERROR : res;
407    }
408
409    // First we need to add all style span names to the string pool.
410    // We do this now (instead of when the span is added) so that these
411    // will appear at the end of the pool, not disrupting the order
412    // our client placed their own strings in it.
413
414    const size_t STYLES = mEntryStyleArray.size();
415    size_t i;
416
417    for (i=0; i<STYLES; i++) {
418        entry_style& style = mEntryStyleArray.editItemAt(i);
419        const size_t N = style.spans.size();
420        for (size_t i=0; i<N; i++) {
421            entry_style_span& span = style.spans.editItemAt(i);
422            ssize_t idx = add(span.name, true);
423            if (idx < 0) {
424                fprintf(stderr, "Error adding span for style tag '%s'\n",
425                        String8(span.name).string());
426                return idx;
427            }
428            span.span.name.index = (uint32_t)idx;
429        }
430    }
431
432    const size_t ENTRIES = mEntryArray.size();
433
434    // Now build the pool of unique strings.
435
436    const size_t STRINGS = mEntries.size();
437    const size_t preSize = sizeof(ResStringPool_header)
438                         + (sizeof(uint32_t)*ENTRIES)
439                         + (sizeof(uint32_t)*STYLES);
440    if (pool->editData(preSize) == NULL) {
441        fprintf(stderr, "ERROR: Out of memory for string pool\n");
442        return NO_MEMORY;
443    }
444
445    const size_t charSize = mUTF8 ? sizeof(uint8_t) : sizeof(uint16_t);
446
447    size_t strPos = 0;
448    for (i=0; i<STRINGS; i++) {
449        entry& ent = mEntries.editItemAt(i);
450        const size_t strSize = (ent.value.size());
451        const size_t lenSize = strSize > (size_t)(1<<((charSize*8)-1))-1 ?
452            charSize*2 : charSize;
453
454        String8 encStr;
455        if (mUTF8) {
456            encStr = String8(ent.value);
457        }
458
459        const size_t encSize = mUTF8 ? encStr.size() : 0;
460        const size_t encLenSize = mUTF8 ?
461            (encSize > (size_t)(1<<((charSize*8)-1))-1 ?
462                charSize*2 : charSize) : 0;
463
464        ent.offset = strPos;
465
466        const size_t totalSize = lenSize + encLenSize +
467            ((mUTF8 ? encSize : strSize)+1)*charSize;
468
469        void* dat = (void*)pool->editData(preSize + strPos + totalSize);
470        if (dat == NULL) {
471            fprintf(stderr, "ERROR: Out of memory for string pool\n");
472            return NO_MEMORY;
473        }
474        dat = (uint8_t*)dat + preSize + strPos;
475        if (mUTF8) {
476            uint8_t* strings = (uint8_t*)dat;
477
478            ENCODE_LENGTH(strings, sizeof(uint8_t), strSize)
479
480            ENCODE_LENGTH(strings, sizeof(uint8_t), encSize)
481
482            strncpy((char*)strings, encStr, encSize+1);
483        } else {
484            char16_t* strings = (char16_t*)dat;
485
486            ENCODE_LENGTH(strings, sizeof(char16_t), strSize)
487
488            strcpy16_htod(strings, ent.value);
489        }
490
491        strPos += totalSize;
492    }
493
494    // Pad ending string position up to a uint32_t boundary.
495
496    if (strPos&0x3) {
497        size_t padPos = ((strPos+3)&~0x3);
498        uint8_t* dat = (uint8_t*)pool->editData(preSize + padPos);
499        if (dat == NULL) {
500            fprintf(stderr, "ERROR: Out of memory padding string pool\n");
501            return NO_MEMORY;
502        }
503        memset(dat+preSize+strPos, 0, padPos-strPos);
504        strPos = padPos;
505    }
506
507    // Build the pool of style spans.
508
509    size_t styPos = strPos;
510    for (i=0; i<STYLES; i++) {
511        entry_style& ent = mEntryStyleArray.editItemAt(i);
512        const size_t N = ent.spans.size();
513        const size_t totalSize = (N*sizeof(ResStringPool_span))
514                               + sizeof(ResStringPool_ref);
515
516        ent.offset = styPos-strPos;
517        uint8_t* dat = (uint8_t*)pool->editData(preSize + styPos + totalSize);
518        if (dat == NULL) {
519            fprintf(stderr, "ERROR: Out of memory for string styles\n");
520            return NO_MEMORY;
521        }
522        ResStringPool_span* span = (ResStringPool_span*)(dat+preSize+styPos);
523        for (size_t i=0; i<N; i++) {
524            span->name.index = htodl(ent.spans[i].span.name.index);
525            span->firstChar = htodl(ent.spans[i].span.firstChar);
526            span->lastChar = htodl(ent.spans[i].span.lastChar);
527            span++;
528        }
529        span->name.index = htodl(ResStringPool_span::END);
530
531        styPos += totalSize;
532    }
533
534    if (STYLES > 0) {
535        // Add full terminator at the end (when reading we validate that
536        // the end of the pool is fully terminated to simplify error
537        // checking).
538        size_t extra = sizeof(ResStringPool_span)-sizeof(ResStringPool_ref);
539        uint8_t* dat = (uint8_t*)pool->editData(preSize + styPos + extra);
540        if (dat == NULL) {
541            fprintf(stderr, "ERROR: Out of memory for string styles\n");
542            return NO_MEMORY;
543        }
544        uint32_t* p = (uint32_t*)(dat+preSize+styPos);
545        while (extra > 0) {
546            *p++ = htodl(ResStringPool_span::END);
547            extra -= sizeof(uint32_t);
548        }
549        styPos += extra;
550    }
551
552    // Write header.
553
554    ResStringPool_header* header =
555        (ResStringPool_header*)pool->padData(sizeof(uint32_t));
556    if (header == NULL) {
557        fprintf(stderr, "ERROR: Out of memory for string pool\n");
558        return NO_MEMORY;
559    }
560    memset(header, 0, sizeof(*header));
561    header->header.type = htods(RES_STRING_POOL_TYPE);
562    header->header.headerSize = htods(sizeof(*header));
563    header->header.size = htodl(pool->getSize());
564    header->stringCount = htodl(ENTRIES);
565    header->styleCount = htodl(STYLES);
566    if (mUTF8) {
567        header->flags |= htodl(ResStringPool_header::UTF8_FLAG);
568    }
569    header->stringsStart = htodl(preSize);
570    header->stylesStart = htodl(STYLES > 0 ? (preSize+strPos) : 0);
571
572    // Write string index array.
573
574    uint32_t* index = (uint32_t*)(header+1);
575    for (i=0; i<ENTRIES; i++) {
576        entry& ent = mEntries.editItemAt(mEntryArray[i]);
577        *index++ = htodl(ent.offset);
578        if (kIsDebug) {
579            printf("Writing entry #%zu: \"%s\" ent=%zu off=%zu\n",
580                    i,
581                    String8(ent.value).string(),
582                    mEntryArray[i],
583                    ent.offset);
584        }
585    }
586
587    // Write style index array.
588
589    for (i=0; i<STYLES; i++) {
590        *index++ = htodl(mEntryStyleArray[i].offset);
591    }
592
593    return NO_ERROR;
594}
595
596ssize_t StringPool::offsetForString(const String16& val) const
597{
598    const Vector<size_t>* indices = offsetsForString(val);
599    ssize_t res = indices != NULL && indices->size() > 0 ? indices->itemAt(0) : -1;
600    if (kIsDebug) {
601        printf("Offset for string %s: %zd (%s)\n", String8(val).string(), SSIZE(res),
602                res >= 0 ? String8(mEntries[mEntryArray[res]].value).string() : String8());
603    }
604    return res;
605}
606
607const Vector<size_t>* StringPool::offsetsForString(const String16& val) const
608{
609    ssize_t pos = mValues.valueFor(val);
610    if (pos < 0) {
611        return NULL;
612    }
613    return &mEntries[mEntryArray[pos]].indices;
614}
615