15c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)/* 25c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * Copyright (C) 2007, 2008 Apple, Inc. All rights reserved. 35c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * 45c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * Redistribution and use in source and binary forms, with or without 55c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * modification, are permitted provided that the following conditions 65c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * are met: 75c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * 1. Redistributions of source code must retain the above copyright 85c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * notice, this list of conditions and the following disclaimer. 95c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * 2. Redistributions in binary form must reproduce the above copyright 105c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * notice, this list of conditions and the following disclaimer in the 115c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * documentation and/or other materials provided with the distribution. 125c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * 135c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * THIS SOFTWARE IS PROVIDED BY APPLE COMPUTER, INC. ``AS IS'' AND ANY 145c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 155c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 165c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE COMPUTER, INC. OR 175c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 185c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 195c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 205c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY 215c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 225c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 2302772c6a72f1ee0b226341a4f4439970c29fc861Ben Murdoch * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 245c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) */ 255c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 265c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)#include "config.h" 2781a5157921f1d2a7ff6aae115bfe3c139b38a5c8Torne (Richard Coles)#include "wtf/text/TextCodecUserDefined.h" 285c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 29591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch#include "wtf/PassOwnPtr.h" 30591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch#include "wtf/text/CString.h" 31591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch#include "wtf/text/StringBuffer.h" 32591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch#include "wtf/text/StringBuilder.h" 33591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch#include "wtf/text/WTFString.h" 345c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 3581a5157921f1d2a7ff6aae115bfe3c139b38a5c8Torne (Richard Coles)namespace WTF { 365c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 375c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)void TextCodecUserDefined::registerEncodingNames(EncodingNameRegistrar registrar) 385c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles){ 395c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) registrar("x-user-defined", "x-user-defined"); 405c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)} 415c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 425c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)static PassOwnPtr<TextCodec> newStreamingTextDecoderUserDefined(const TextEncoding&, const void*) 435c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles){ 445c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) return adoptPtr(new TextCodecUserDefined); 455c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)} 465c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 475c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)void TextCodecUserDefined::registerCodecs(TextCodecRegistrar registrar) 485c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles){ 495c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) registrar("x-user-defined", newStreamingTextDecoderUserDefined, 0); 505c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)} 515c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 52d5428f32f5d1719f774f62e19147104ca245a3abTorne (Richard Coles)String TextCodecUserDefined::decode(const char* bytes, size_t length, FlushBehavior, bool, bool&) 535c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles){ 545c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) StringBuilder result; 555c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) result.reserveCapacity(length); 565c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 575c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) for (size_t i = 0; i < length; ++i) { 585c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) signed char c = bytes[i]; 595c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) result.append(static_cast<UChar>(c & 0xF7FF)); 605c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) } 615c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 625c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) return result.toString(); 635c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)} 645c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 65591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdochtemplate<typename CharType> 66591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdochstatic CString encodeComplexUserDefined(const CharType* characters, size_t length, UnencodableHandling handling) 675c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles){ 685c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) Vector<char> result(length); 695c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) char* bytes = result.data(); 705c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 715c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) size_t resultLength = 0; 725c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) for (size_t i = 0; i < length; ) { 735c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) UChar32 c; 745c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) U16_NEXT(characters, i, length, c); 755c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) signed char signedByte = c; 765c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) if ((signedByte & 0xF7FF) == c) 775c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) bytes[resultLength++] = signedByte; 785c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) else { 795c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) // No way to encode this character with x-user-defined. 805c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) UnencodableReplacementArray replacement; 815c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) int replacementLength = TextCodec::getUnencodableReplacement(c, handling, replacement); 825c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) result.grow(resultLength + replacementLength + length - i); 835c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) bytes = result.data(); 845c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) memcpy(bytes + resultLength, replacement, replacementLength); 855c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) resultLength += replacementLength; 865c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) } 875c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) } 885c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 895c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) return CString(bytes, resultLength); 905c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)} 915c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 92591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdochtemplate<typename CharType> 93591b958dee2cf159d33a0b931e6231072eaf38d5Ben MurdochCString TextCodecUserDefined::encodeCommon(const CharType* characters, size_t length, UnencodableHandling handling) 945c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles){ 955c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) char* bytes; 96591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch CString result = CString::newUninitialized(length, bytes); 975c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 985c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) // Convert the string a fast way and simultaneously do an efficient check to see if it's all ASCII. 995c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) UChar ored = 0; 1005c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) for (size_t i = 0; i < length; ++i) { 1015c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) UChar c = characters[i]; 1025c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) bytes[i] = c; 1035c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) ored |= c; 1045c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) } 1055c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 1065c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) if (!(ored & 0xFF80)) 107591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch return result; 1085c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 1095c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) // If it wasn't all ASCII, call the function that handles more-complex cases. 1105c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) return encodeComplexUserDefined(characters, length, handling); 1115c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles)} 1125c87bf8b86a7c82ef50fb7a89697d8e02e2553beTorne (Richard Coles) 113591b958dee2cf159d33a0b931e6231072eaf38d5Ben MurdochCString TextCodecUserDefined::encode(const UChar* characters, size_t length, UnencodableHandling handling) 114591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch{ 115591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch return encodeCommon(characters, length, handling); 116591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch} 117591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch 118591b958dee2cf159d33a0b931e6231072eaf38d5Ben MurdochCString TextCodecUserDefined::encode(const LChar* characters, size_t length, UnencodableHandling handling) 119591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch{ 120591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch return encodeCommon(characters, length, handling); 121591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch} 122591b958dee2cf159d33a0b931e6231072eaf38d5Ben Murdoch 12381a5157921f1d2a7ff6aae115bfe3c139b38a5c8Torne (Richard Coles)} // namespace WTF 124