1 | /* |
2 | * Copyright (C) 2017 Apple Inc. All rights reserved. |
3 | * |
4 | * Redistribution and use in source and binary forms, with or without |
5 | * modification, are permitted provided that the following conditions |
6 | * are met: |
7 | * 1. Redistributions of source code must retain the above copyright |
8 | * notice, this list of conditions and the following disclaimer. |
9 | * 2. Redistributions in binary form must reproduce the above copyright |
10 | * notice, this list of conditions and the following disclaimer in the |
11 | * documentation and/or other materials provided with the distribution. |
12 | * |
13 | * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY |
14 | * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
15 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
16 | * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR |
17 | * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
18 | * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
19 | * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
20 | * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY |
21 | * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
22 | * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
23 | * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
24 | */ |
25 | |
26 | #include "config.h" |
27 | #include "YarrUnicodeProperties.h" |
28 | |
29 | #include "Yarr.h" |
30 | #include "YarrPattern.h" |
31 | #include <wtf/Optional.h> |
32 | #include <wtf/text/WTFString.h> |
33 | |
34 | namespace JSC { namespace Yarr { |
35 | |
// One slot of a HashTable's index array.
struct HashIndex {
    // Position in HashTable::values of the entry stored in this slot,
    // or -1 when the slot is empty.
    int16_t value;
    // Position in HashTable::index of the next slot in this collision chain,
    // or -1 when this slot ends the chain.
    int16_t next;
};
40 | |
// One key/result pair stored in a HashTable.
struct HashValue {
    // Name that lookup strings are compared against.
    const char* key;
    // Result that HashTable::entry() returns when `key` matches.
    int index;
};
45 | |
46 | struct HashTable { |
47 | int numberOfValues; |
48 | int indexMask; |
49 | const HashValue* values; |
50 | const HashIndex* index; |
51 | |
52 | ALWAYS_INLINE int entry(WTF::String& key) const |
53 | { |
54 | int indexEntry = key.impl()->hash() & indexMask; |
55 | int valueIndex = index[indexEntry].value; |
56 | |
57 | if (valueIndex == -1) |
58 | return -1; |
59 | |
60 | while (true) { |
61 | if (WTF::equal(key, values[valueIndex].key)) |
62 | return values[valueIndex].index; |
63 | |
64 | indexEntry = index[indexEntry].next; |
65 | if (indexEntry == -1) |
66 | return -1; |
67 | valueIndex = index[indexEntry].value; |
68 | ASSERT(valueIndex != -1); |
69 | }; |
70 | } |
71 | }; |
72 | |
73 | #include "UnicodePatternTables.h" |
74 | |
75 | Optional<BuiltInCharacterClassID> unicodeMatchPropertyValue(WTF::String unicodePropertyName, WTF::String unicodePropertyValue) |
76 | { |
77 | int propertyIndex = -1; |
78 | |
79 | if (unicodePropertyName == "Script" || unicodePropertyName == "sc" ) |
80 | propertyIndex = scriptHashTable.entry(unicodePropertyValue); |
81 | else if (unicodePropertyName == "Script_Extensions" || unicodePropertyName == "scx" ) |
82 | propertyIndex = scriptExtensionHashTable.entry(unicodePropertyValue); |
83 | else if (unicodePropertyName == "General_Category" || unicodePropertyName == "gc" ) |
84 | propertyIndex = generalCategoryHashTable.entry(unicodePropertyValue); |
85 | |
86 | if (propertyIndex == -1) |
87 | return WTF::nullopt; |
88 | |
89 | return Optional<BuiltInCharacterClassID>(static_cast<BuiltInCharacterClassID>(static_cast<int>(BuiltInCharacterClassID::BaseUnicodePropertyID) + propertyIndex)); |
90 | } |
91 | |
92 | Optional<BuiltInCharacterClassID> unicodeMatchProperty(WTF::String unicodePropertyValue) |
93 | { |
94 | int propertyIndex = -1; |
95 | |
96 | propertyIndex = binaryPropertyHashTable.entry(unicodePropertyValue); |
97 | if (propertyIndex == -1) |
98 | propertyIndex = generalCategoryHashTable.entry(unicodePropertyValue); |
99 | |
100 | if (propertyIndex == -1) |
101 | return WTF::nullopt; |
102 | |
103 | return Optional<BuiltInCharacterClassID>(static_cast<BuiltInCharacterClassID>(static_cast<int>(BuiltInCharacterClassID::BaseUnicodePropertyID) + propertyIndex)); |
104 | } |
105 | |
106 | std::unique_ptr<CharacterClass> createUnicodeCharacterClassFor(BuiltInCharacterClassID unicodeClassID) |
107 | { |
108 | unsigned unicodePropertyIndex = static_cast<unsigned>(unicodeClassID) - static_cast<unsigned>(BuiltInCharacterClassID::BaseUnicodePropertyID); |
109 | |
110 | return createFunctions[unicodePropertyIndex](); |
111 | } |
112 | |
113 | } } // namespace JSC::Yarr |
114 | |