1// Copyright (C) 2016 and later: Unicode, Inc. and others.
2// License & terms of use: http://www.unicode.org/copyright.html
3/*
4*******************************************************************************
5* Copyright (C) 2013-2015, International Business Machines
6* Corporation and others.  All Rights Reserved.
7*******************************************************************************
8* collationinfo.cpp
9*
10* created on: 2013aug05
11* created by: Markus W. Scherer
12*/
13
14#include <stdio.h>
15#include <string.h>
16
17#include "unicode/utypes.h"
18
19#if !UCONFIG_NO_COLLATION
20
21#include "collationdata.h"
22#include "collationdatareader.h"
23#include "collationinfo.h"
24#include "uassert.h"
25#include "uvectr32.h"
26
27U_NAMESPACE_BEGIN
28
29void
30CollationInfo::printSizes(int32_t sizeWithHeader, const int32_t indexes[]) {
31    int32_t totalSize = indexes[CollationDataReader::IX_TOTAL_SIZE];
32    if(sizeWithHeader > totalSize) {
33        printf("  header size:                  %6ld\n", (long)(sizeWithHeader - totalSize));
34    }
35
36    int32_t length = indexes[CollationDataReader::IX_INDEXES_LENGTH];
37    printf("  indexes:          %6ld *4 = %6ld\n", (long)length, (long)length * 4);
38
39    length = getDataLength(indexes, CollationDataReader::IX_REORDER_CODES_OFFSET);
40    if(length != 0) {
41        printf("  reorder codes:    %6ld *4 = %6ld\n", (long)length / 4, (long)length);
42    }
43
44    length = getDataLength(indexes, CollationDataReader::IX_REORDER_TABLE_OFFSET);
45    if(length != 0) {
46        U_ASSERT(length >= 256);
47        printf("  reorder table:                %6ld\n", (long)length);
48    }
49
50    length = getDataLength(indexes, CollationDataReader::IX_TRIE_OFFSET);
51    if(length != 0) {
52        printf("  trie size:                    %6ld\n", (long)length);
53    }
54
55    length = getDataLength(indexes, CollationDataReader::IX_RESERVED8_OFFSET);
56    if(length != 0) {
57        printf("  reserved (offset 8):          %6ld\n", (long)length);
58    }
59
60    length = getDataLength(indexes, CollationDataReader::IX_CES_OFFSET);
61    if(length != 0) {
62        printf("  CEs:              %6ld *8 = %6ld\n", (long)length / 8, (long)length);
63    }
64
65    length = getDataLength(indexes, CollationDataReader::IX_RESERVED10_OFFSET);
66    if(length != 0) {
67        printf("  reserved (offset 10):         %6ld\n", (long)length);
68    }
69
70    length = getDataLength(indexes, CollationDataReader::IX_CE32S_OFFSET);
71    if(length != 0) {
72        printf("  CE32s:            %6ld *4 = %6ld\n", (long)length / 4, (long)length);
73    }
74
75    length = getDataLength(indexes, CollationDataReader::IX_ROOT_ELEMENTS_OFFSET);
76    if(length != 0) {
77        printf("  rootElements:     %6ld *4 = %6ld\n", (long)length / 4, (long)length);
78    }
79
80    length = getDataLength(indexes, CollationDataReader::IX_CONTEXTS_OFFSET);
81    if(length != 0) {
82        printf("  contexts:         %6ld *2 = %6ld\n", (long)length / 2, (long)length);
83    }
84
85    length = getDataLength(indexes, CollationDataReader::IX_UNSAFE_BWD_OFFSET);
86    if(length != 0) {
87        printf("  unsafeBwdSet:     %6ld *2 = %6ld\n", (long)length / 2, (long)length);
88    }
89
90    length = getDataLength(indexes, CollationDataReader::IX_FAST_LATIN_TABLE_OFFSET);
91    if(length != 0) {
92        printf("  fastLatin table:  %6ld *2 = %6ld\n", (long)length / 2, (long)length);
93    }
94
95    length = getDataLength(indexes, CollationDataReader::IX_SCRIPTS_OFFSET);
96    if(length != 0) {
97        printf("  scripts data:     %6ld *2 = %6ld\n", (long)length / 2, (long)length);
98    }
99
100    length = getDataLength(indexes, CollationDataReader::IX_COMPRESSIBLE_BYTES_OFFSET);
101    if(length != 0) {
102        U_ASSERT(length >= 256);
103        printf("  compressibleBytes:            %6ld\n", (long)length);
104    }
105
106    length = getDataLength(indexes, CollationDataReader::IX_RESERVED18_OFFSET);
107    if(length != 0) {
108        printf("  reserved (offset 18):         %6ld\n", (long)length);
109    }
110
111    printf(" collator binary total size:    %6ld\n", (long)sizeWithHeader);
112}
113
114int32_t
115CollationInfo::getDataLength(const int32_t indexes[], int32_t startIndex) {
116    return indexes[startIndex + 1] - indexes[startIndex];
117}
118
119void
120CollationInfo::printReorderRanges(const CollationData &data, const int32_t *codes, int32_t length) {
121    UErrorCode errorCode = U_ZERO_ERROR;
122    UVector32 ranges(errorCode);
123    data.makeReorderRanges(codes, length, ranges, errorCode);
124    if(U_FAILURE(errorCode)) {
125        printf("  error building reorder ranges: %s\n", u_errorName(errorCode));
126        return;
127    }
128
129    int32_t start = 0;
130    for(int32_t i = 0; i < ranges.size(); ++i) {
131        int32_t pair = ranges.elementAti(i);
132        int32_t limit = (pair >> 16) & 0xffff;
133        int16_t offset = (int16_t)pair;
134        if(offset == 0) {
135            // [inclusive-start, exclusive-limit[
136            printf("          [%04x, %04x[\n", start, limit);
137        } else if(offset > 0) {
138            printf("  reorder [%04x, %04x[ by offset  %02x to [%04x, %04x[\n",
139                    start, limit, offset,
140                    start + (offset << 8), limit + (offset << 8));
141        } else /* offset < 0 */ {
142            printf("  reorder [%04x, %04x[ by offset -%02x to [%04x, %04x[\n",
143                    start, limit, -offset,
144                    start + (offset << 8), limit + (offset << 8));
145        }
146        start = limit;
147    }
148}
149
150U_NAMESPACE_END
151
152#endif  // !UCONFIG_NO_COLLATION
153