1/*
2 * Copyright (C) 2013 Google Inc. All rights reserved.
3 *
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions are
6 * met:
7 *
8 *     * Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 *     * Redistributions in binary form must reproduce the above
11 * copyright notice, this list of conditions and the following disclaimer
12 * in the documentation and/or other materials provided with the
13 * distribution.
14 *     * Neither the name of Google Inc. nor the names of its
15 * contributors may be used to endorse or promote products derived from
16 * this software without specific prior written permission.
17 *
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 */
30
31#include "config.h"
32
33#include "wtf/text/TextCodecUTF8.h"
34
35#include "wtf/OwnPtr.h"
36#include "wtf/text/TextCodec.h"
37#include "wtf/text/TextEncoding.h"
38#include "wtf/text/TextEncodingRegistry.h"
39#include "wtf/text/WTFString.h"
40#include <gtest/gtest.h>
41
42namespace WTF {
43
44namespace {
45
46TEST(TextCodecUTF8, DecodeAscii)
47{
48    TextEncoding encoding("UTF-8");
49    OwnPtr<TextCodec> codec(newTextCodec(encoding));
50
51    const char testCase[] = "HelloWorld";
52    size_t testCaseSize = sizeof(testCase) - 1;
53
54    bool sawError = false;
55    const String& result = codec->decode(testCase, testCaseSize, DataEOF, false, sawError);
56    EXPECT_FALSE(sawError);
57    ASSERT_EQ(testCaseSize, result.length());
58    for (size_t i = 0; i < testCaseSize; ++i) {
59        EXPECT_EQ(testCase[i], result[i]);
60    }
61}
62
63TEST(TextCodecUTF8, DecodeChineseCharacters)
64{
65    TextEncoding encoding("UTF-8");
66    OwnPtr<TextCodec> codec(newTextCodec(encoding));
67
68    // "Kanji" in Chinese characters.
69    const char testCase[] = "\xe6\xbc\xa2\xe5\xad\x97";
70    size_t testCaseSize = sizeof(testCase) - 1;
71
72    bool sawError = false;
73    const String& result = codec->decode(testCase, testCaseSize, DataEOF, false, sawError);
74    EXPECT_FALSE(sawError);
75    ASSERT_EQ(2u, result.length());
76    EXPECT_EQ(0x6f22U, result[0]);
77    EXPECT_EQ(0x5b57U, result[1]);
78}
79
80TEST(TextCodecUTF8, Decode0xFF)
81{
82    TextEncoding encoding("UTF-8");
83    OwnPtr<TextCodec> codec(newTextCodec(encoding));
84
85    bool sawError = false;
86    const String& result = codec->decode("\xff", 1, DataEOF, false, sawError);
87    EXPECT_TRUE(sawError);
88    ASSERT_EQ(1u, result.length());
89    EXPECT_EQ(0xFFFDU, result[0]);
90}
91
92} // namespace
93
94} // namespace WTF
95