1 | /* |
2 | * Copyright (C) 2007-2017 Apple, Inc. All rights reserved. |
3 | * |
4 | * Redistribution and use in source and binary forms, with or without |
5 | * modification, are permitted provided that the following conditions |
6 | * are met: |
7 | * 1. Redistributions of source code must retain the above copyright |
8 | * notice, this list of conditions and the following disclaimer. |
9 | * 2. Redistributions in binary form must reproduce the above copyright |
10 | * notice, this list of conditions and the following disclaimer in the |
11 | * documentation and/or other materials provided with the distribution. |
12 | * |
13 | * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY |
14 | * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
15 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
16 | * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR |
17 | * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
18 | * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
19 | * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
20 | * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY |
21 | * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
22 | * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
23 | * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
24 | */ |
25 | |
26 | #include "config.h" |
27 | #include "TextCodecUserDefined.h" |
28 | |
29 | #include <array> |
30 | #include <wtf/text/CString.h> |
31 | #include <wtf/text/StringBuilder.h> |
32 | #include <wtf/text/WTFString.h> |
33 | |
34 | namespace WebCore { |
35 | |
36 | void TextCodecUserDefined::registerEncodingNames(EncodingNameRegistrar registrar) |
37 | { |
38 | registrar("x-user-defined" , "x-user-defined" ); |
39 | } |
40 | |
41 | void TextCodecUserDefined::registerCodecs(TextCodecRegistrar registrar) |
42 | { |
43 | registrar("x-user-defined" , [] { |
44 | return std::make_unique<TextCodecUserDefined>(); |
45 | }); |
46 | } |
47 | |
48 | String TextCodecUserDefined::decode(const char* bytes, size_t length, bool, bool, bool&) |
49 | { |
50 | StringBuilder result; |
51 | result.reserveCapacity(length); |
52 | for (size_t i = 0; i < length; ++i) { |
53 | signed char c = bytes[i]; |
54 | result.append(static_cast<UChar>(c & 0xF7FF)); |
55 | } |
56 | return result.toString(); |
57 | } |
58 | |
59 | static Vector<uint8_t> encodeComplexUserDefined(StringView string, UnencodableHandling handling) |
60 | { |
61 | Vector<uint8_t> result; |
62 | |
63 | for (auto character : string.codePoints()) { |
64 | int8_t signedByte = character; |
65 | if ((signedByte & 0xF7FF) == character) |
66 | result.append(signedByte); |
67 | else { |
68 | // No way to encode this character with x-user-defined. |
69 | UnencodableReplacementArray replacement; |
70 | int replacementLength = TextCodec::getUnencodableReplacement(character, handling, replacement); |
71 | result.append(replacement.data(), replacementLength); |
72 | } |
73 | } |
74 | |
75 | return result; |
76 | } |
77 | |
78 | Vector<uint8_t> TextCodecUserDefined::encode(StringView string, UnencodableHandling handling) |
79 | { |
80 | { |
81 | Vector<uint8_t> result(string.length()); |
82 | auto* bytes = result.data(); |
83 | |
84 | // Convert and simultaneously do a check to see if it's all ASCII. |
85 | UChar ored = 0; |
86 | for (auto character : string.codeUnits()) { |
87 | *bytes++ = character; |
88 | ored |= character; |
89 | } |
90 | |
91 | if (!(ored & 0xFF80)) |
92 | return result; |
93 | } |
94 | |
95 | // If it wasn't all ASCII, call the function that handles more-complex cases. |
96 | return encodeComplexUserDefined(string, handling); |
97 | } |
98 | |
99 | } // namespace WebCore |
100 | |