Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2015 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
Adam Lesinski | 52364f7 | 2016-01-11 13:10:24 -0800 | [diff] [blame] | 17 | #include "StringPool.h" |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 18 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 19 | #include <algorithm> |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 20 | #include <memory> |
| 21 | #include <string> |
| 22 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 23 | #include "android-base/logging.h" |
| 24 | #include "androidfw/ResourceTypes.h" |
Adam Lesinski | d5083f6 | 2017-01-16 15:07:21 -0800 | [diff] [blame] | 25 | #include "androidfw/StringPiece.h" |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 26 | |
| 27 | #include "util/BigBuffer.h" |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 28 | #include "util/Util.h" |
| 29 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 30 | using ::android::StringPiece; |
Adam Lesinski | d5083f6 | 2017-01-16 15:07:21 -0800 | [diff] [blame] | 31 | |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 32 | namespace aapt { |
| 33 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 34 | StringPool::Ref::Ref() : entry_(nullptr) {} |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 35 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 36 | StringPool::Ref::Ref(const StringPool::Ref& rhs) : entry_(rhs.entry_) { |
| 37 | if (entry_ != nullptr) { |
| 38 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 39 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 40 | } |
| 41 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 42 | StringPool::Ref::Ref(StringPool::Entry* entry) : entry_(entry) { |
| 43 | if (entry_ != nullptr) { |
| 44 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 45 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 46 | } |
| 47 | |
| 48 | StringPool::Ref::~Ref() { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 49 | if (entry_ != nullptr) { |
| 50 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 51 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 52 | } |
| 53 | |
| 54 | StringPool::Ref& StringPool::Ref::operator=(const StringPool::Ref& rhs) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 55 | if (rhs.entry_ != nullptr) { |
| 56 | rhs.entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 57 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 58 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 59 | if (entry_ != nullptr) { |
| 60 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 61 | } |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 62 | entry_ = rhs.entry_; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 63 | return *this; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 64 | } |
| 65 | |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 66 | bool StringPool::Ref::operator==(const Ref& rhs) const { |
| 67 | return entry_->value == rhs.entry_->value; |
| 68 | } |
| 69 | |
| 70 | bool StringPool::Ref::operator!=(const Ref& rhs) const { |
| 71 | return entry_->value != rhs.entry_->value; |
| 72 | } |
| 73 | |
Adam Lesinski | d0f116b | 2016-07-08 15:00:32 -0700 | [diff] [blame] | 74 | const std::string* StringPool::Ref::operator->() const { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 75 | return &entry_->value; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 76 | } |
| 77 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 78 | const std::string& StringPool::Ref::operator*() const { |
| 79 | return entry_->value; |
| 80 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 81 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 82 | size_t StringPool::Ref::index() const { |
| 83 | // Account for the styles, which *always* come first. |
| 84 | return entry_->pool_->styles_.size() + entry_->index_; |
| 85 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 86 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 87 | const StringPool::Context& StringPool::Ref::GetContext() const { |
| 88 | return entry_->context; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 89 | } |
| 90 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 91 | StringPool::StyleRef::StyleRef() : entry_(nullptr) {} |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 92 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 93 | StringPool::StyleRef::StyleRef(const StringPool::StyleRef& rhs) |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 94 | : entry_(rhs.entry_) { |
| 95 | if (entry_ != nullptr) { |
| 96 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 97 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 98 | } |
| 99 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 100 | StringPool::StyleRef::StyleRef(StringPool::StyleEntry* entry) : entry_(entry) { |
| 101 | if (entry_ != nullptr) { |
| 102 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 103 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 104 | } |
| 105 | |
| 106 | StringPool::StyleRef::~StyleRef() { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 107 | if (entry_ != nullptr) { |
| 108 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 109 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 110 | } |
| 111 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 112 | StringPool::StyleRef& StringPool::StyleRef::operator=(const StringPool::StyleRef& rhs) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 113 | if (rhs.entry_ != nullptr) { |
| 114 | rhs.entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 115 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 116 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 117 | if (entry_ != nullptr) { |
| 118 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 119 | } |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 120 | entry_ = rhs.entry_; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 121 | return *this; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 122 | } |
| 123 | |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 124 | bool StringPool::StyleRef::operator==(const StyleRef& rhs) const { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 125 | if (entry_->value != rhs.entry_->value) { |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 126 | return false; |
| 127 | } |
| 128 | |
| 129 | if (entry_->spans.size() != rhs.entry_->spans.size()) { |
| 130 | return false; |
| 131 | } |
| 132 | |
| 133 | auto rhs_iter = rhs.entry_->spans.begin(); |
| 134 | for (const Span& span : entry_->spans) { |
| 135 | const Span& rhs_span = *rhs_iter; |
| 136 | if (span.first_char != rhs_span.first_char || span.last_char != rhs_span.last_char || |
| 137 | span.name != rhs_span.name) { |
| 138 | return false; |
| 139 | } |
| 140 | } |
| 141 | return true; |
| 142 | } |
| 143 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 144 | bool StringPool::StyleRef::operator!=(const StyleRef& rhs) const { |
| 145 | return !operator==(rhs); |
| 146 | } |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 147 | |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 148 | const StringPool::StyleEntry* StringPool::StyleRef::operator->() const { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 149 | return entry_; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 150 | } |
| 151 | |
| 152 | const StringPool::StyleEntry& StringPool::StyleRef::operator*() const { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 153 | return *entry_; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 154 | } |
| 155 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 156 | size_t StringPool::StyleRef::index() const { |
| 157 | return entry_->index_; |
| 158 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 159 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 160 | const StringPool::Context& StringPool::StyleRef::GetContext() const { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 161 | return entry_->context; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 162 | } |
| 163 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 164 | StringPool::Ref StringPool::MakeRef(const StringPiece& str) { |
| 165 | return MakeRefImpl(str, Context{}, true); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 166 | } |
| 167 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 168 | StringPool::Ref StringPool::MakeRef(const StringPiece& str, const Context& context) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 169 | return MakeRefImpl(str, context, true); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 170 | } |
| 171 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 172 | StringPool::Ref StringPool::MakeRefImpl(const StringPiece& str, const Context& context, |
| 173 | bool unique) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 174 | if (unique) { |
y | 4602926 | 2018-04-16 18:13:14 -0700 | [diff] [blame] | 175 | auto range = indexed_strings_.equal_range(str); |
| 176 | for (auto iter = range.first; iter != range.second; ++iter) { |
| 177 | if (context.priority == iter->second->context.priority) { |
| 178 | return Ref(iter->second); |
| 179 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 180 | } |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 181 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 182 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 183 | std::unique_ptr<Entry> entry(new Entry()); |
Adam Lesinski | d5083f6 | 2017-01-16 15:07:21 -0800 | [diff] [blame] | 184 | entry->value = str.to_string(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 185 | entry->context = context; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 186 | entry->index_ = strings_.size(); |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 187 | entry->ref_ = 0; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 188 | entry->pool_ = this; |
| 189 | |
| 190 | Entry* borrow = entry.get(); |
| 191 | strings_.emplace_back(std::move(entry)); |
| 192 | indexed_strings_.insert(std::make_pair(StringPiece(borrow->value), borrow)); |
| 193 | return Ref(borrow); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 194 | } |
| 195 | |
Adam Lesinski | 8a0b238 | 2017-10-18 15:07:33 -0700 | [diff] [blame] | 196 | StringPool::Ref StringPool::MakeRef(const Ref& ref) { |
| 197 | if (ref.entry_->pool_ == this) { |
| 198 | return ref; |
| 199 | } |
| 200 | return MakeRef(ref.entry_->value, ref.entry_->context); |
| 201 | } |
| 202 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 203 | StringPool::StyleRef StringPool::MakeRef(const StyleString& str) { |
| 204 | return MakeRef(str, Context{}); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 205 | } |
| 206 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 207 | StringPool::StyleRef StringPool::MakeRef(const StyleString& str, const Context& context) { |
| 208 | std::unique_ptr<StyleEntry> entry(new StyleEntry()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 209 | entry->value = str.str; |
| 210 | entry->context = context; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 211 | entry->index_ = styles_.size(); |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 212 | entry->ref_ = 0; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 213 | for (const aapt::Span& span : str.spans) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 214 | entry->spans.emplace_back(Span{MakeRef(span.name), span.first_char, span.last_char}); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 215 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 216 | |
| 217 | StyleEntry* borrow = entry.get(); |
| 218 | styles_.emplace_back(std::move(entry)); |
| 219 | return StyleRef(borrow); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 220 | } |
| 221 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 222 | StringPool::StyleRef StringPool::MakeRef(const StyleRef& ref) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 223 | std::unique_ptr<StyleEntry> entry(new StyleEntry()); |
| 224 | entry->value = ref.entry_->value; |
| 225 | entry->context = ref.entry_->context; |
| 226 | entry->index_ = styles_.size(); |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 227 | entry->ref_ = 0; |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 228 | for (const Span& span : ref.entry_->spans) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 229 | entry->spans.emplace_back(Span{MakeRef(*span.name), span.first_char, span.last_char}); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 230 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 231 | |
| 232 | StyleEntry* borrow = entry.get(); |
| 233 | styles_.emplace_back(std::move(entry)); |
| 234 | return StyleRef(borrow); |
| 235 | } |
| 236 | |
| 237 | void StringPool::ReAssignIndices() { |
| 238 | // Assign the style indices. |
| 239 | const size_t style_len = styles_.size(); |
| 240 | for (size_t index = 0; index < style_len; index++) { |
| 241 | styles_[index]->index_ = index; |
| 242 | } |
| 243 | |
| 244 | // Assign the string indices. |
| 245 | const size_t string_len = strings_.size(); |
| 246 | for (size_t index = 0; index < string_len; index++) { |
| 247 | strings_[index]->index_ = index; |
| 248 | } |
Adam Lesinski | 769de98 | 2015-04-10 19:43:55 -0700 | [diff] [blame] | 249 | } |
| 250 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 251 | void StringPool::Merge(StringPool&& pool) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 252 | // First, change the owning pool for the incoming strings. |
| 253 | for (std::unique_ptr<Entry>& entry : pool.strings_) { |
| 254 | entry->pool_ = this; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 255 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 256 | |
| 257 | // Now move the styles, strings, and indices over. |
| 258 | std::move(pool.styles_.begin(), pool.styles_.end(), std::back_inserter(styles_)); |
| 259 | pool.styles_.clear(); |
| 260 | std::move(pool.strings_.begin(), pool.strings_.end(), std::back_inserter(strings_)); |
| 261 | pool.strings_.clear(); |
| 262 | indexed_strings_.insert(pool.indexed_strings_.begin(), pool.indexed_strings_.end()); |
| 263 | pool.indexed_strings_.clear(); |
| 264 | |
| 265 | ReAssignIndices(); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 266 | } |
| 267 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 268 | void StringPool::HintWillAdd(size_t string_count, size_t style_count) { |
| 269 | strings_.reserve(strings_.size() + string_count); |
| 270 | styles_.reserve(styles_.size() + style_count); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 271 | } |
| 272 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 273 | void StringPool::Prune() { |
| 274 | const auto iter_end = indexed_strings_.end(); |
| 275 | auto index_iter = indexed_strings_.begin(); |
| 276 | while (index_iter != iter_end) { |
| 277 | if (index_iter->second->ref_ <= 0) { |
| 278 | index_iter = indexed_strings_.erase(index_iter); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 279 | } else { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 280 | ++index_iter; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 281 | } |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 282 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 283 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 284 | auto end_iter2 = |
| 285 | std::remove_if(strings_.begin(), strings_.end(), |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 286 | [](const std::unique_ptr<Entry>& entry) -> bool { return entry->ref_ <= 0; }); |
| 287 | auto end_iter3 = std::remove_if( |
| 288 | styles_.begin(), styles_.end(), |
| 289 | [](const std::unique_ptr<StyleEntry>& entry) -> bool { return entry->ref_ <= 0; }); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 290 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 291 | // Remove the entries at the end or else we'll be accessing a deleted string from the StyleEntry. |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 292 | strings_.erase(end_iter2, strings_.end()); |
| 293 | styles_.erase(end_iter3, styles_.end()); |
Adam Lesinski | 1ab598f | 2015-08-14 14:26:04 -0700 | [diff] [blame] | 294 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 295 | ReAssignIndices(); |
| 296 | } |
| 297 | |
| 298 | template <typename E> |
| 299 | static void SortEntries( |
| 300 | std::vector<std::unique_ptr<E>>& entries, |
| 301 | const std::function<int(const StringPool::Context&, const StringPool::Context&)>& cmp) { |
| 302 | using UEntry = std::unique_ptr<E>; |
| 303 | |
| 304 | if (cmp != nullptr) { |
| 305 | std::sort(entries.begin(), entries.end(), [&cmp](const UEntry& a, const UEntry& b) -> bool { |
| 306 | int r = cmp(a->context, b->context); |
| 307 | if (r == 0) { |
| 308 | r = a->value.compare(b->value); |
| 309 | } |
| 310 | return r < 0; |
| 311 | }); |
| 312 | } else { |
| 313 | std::sort(entries.begin(), entries.end(), |
| 314 | [](const UEntry& a, const UEntry& b) -> bool { return a->value < b->value; }); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 315 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 316 | } |
| 317 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 318 | void StringPool::Sort(const std::function<int(const Context&, const Context&)>& cmp) { |
| 319 | SortEntries(styles_, cmp); |
| 320 | SortEntries(strings_, cmp); |
| 321 | ReAssignIndices(); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 322 | } |
| 323 | |
// Writes `length` at `data` using one or two units of T and returns the
// position just past what was written.
//
// A length that fits in all but the top bit of T takes a single unit.
// Otherwise a leading unit is written first, with the top bit set and the
// high part of the length in the remaining bits, followed by a unit holding
// the low part.
template <typename T>
static T* EncodeLength(T* data, size_t length) {
  static_assert(std::is_integral<T>::value, "wat.");

  constexpr size_t kBitsPerUnit = sizeof(T) * 8;
  constexpr size_t kMask = 1 << (kBitsPerUnit - 1);
  constexpr size_t kMaxSize = kMask - 1;

  const bool needs_high_unit = length > kMaxSize;
  if (needs_high_unit) {
    data[0] = kMask | (kMaxSize & (length >> kBitsPerUnit));
    ++data;
  }
  data[0] = length;
  return data + 1;
}
| 336 | |
/**
 * Returns the maximum possible string length that can be successfully encoded
 * using 2 units of the specified T.
 *    EncodeLengthMax<char> -> maximum unit length of 0x7FFF
 *    EncodeLengthMax<char16_t> -> maximum unit length of 0x7FFFFFFF
 *
 * The mask is computed in size_t rather than int: with an int operand,
 * `1 << 31` lands on the sign bit and sign-extends when widened to a 64-bit
 * size_t, which produced a bogus, enormous limit for char16_t.
 **/
template <typename T>
static size_t EncodeLengthMax() {
  static_assert(std::is_integral<T>::value, "wat.");

  // Two units of T carry (2 * bits - 1) length bits; the top bit is the flag.
  constexpr size_t kLengthBits = (sizeof(T) * 8 * 2) - 1;
  static_assert(kLengthBits < sizeof(size_t) * 8, "two units of T do not fit in size_t");

  constexpr size_t kMask = static_cast<size_t>(1) << kLengthBits;
  constexpr size_t max = kMask - 1;
  return max;
}
| 351 | |
/**
 * Returns how many units of T (1 or 2) the length prefix occupies for a
 * string of the given length: one unit when the length fits in all but the
 * top bit of T, two units otherwise.
 */
template <typename T>
static size_t EncodedLengthUnits(size_t length) {
  static_assert(std::is_integral<T>::value, "wat.");

  constexpr size_t kMask = 1 << ((sizeof(T) * 8) - 1);
  constexpr size_t kMaxSize = kMask - 1;
  if (length <= kMaxSize) {
    return 1;
  }
  return 2;
}
| 364 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 365 | const std::string kStringTooLarge = "STRING_TOO_LARGE"; |
| 366 | |
| 367 | static bool EncodeString(const std::string& str, const bool utf8, BigBuffer* out, |
| 368 | IDiagnostics* diag) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 369 | if (utf8) { |
Ryan Mitchell | d86ea58 | 2018-06-27 11:57:18 -0700 | [diff] [blame] | 370 | const std::string& encoded = util::Utf8ToModifiedUtf8(str); |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 371 | const ssize_t utf16_length = utf8_to_utf16_length( |
| 372 | reinterpret_cast<const uint8_t*>(encoded.data()), encoded.size()); |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 373 | CHECK(utf16_length >= 0); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 374 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 375 | // Make sure the lengths to be encoded do not exceed the maximum length that |
| 376 | // can be encoded using chars |
| 377 | if ((((size_t)encoded.size()) > EncodeLengthMax<char>()) |
| 378 | || (((size_t)utf16_length) > EncodeLengthMax<char>())) { |
| 379 | |
| 380 | diag->Error(DiagMessage() << "string too large to encode using UTF-8 " |
| 381 | << "written instead as '" << kStringTooLarge << "'"); |
| 382 | |
| 383 | EncodeString(kStringTooLarge, utf8, out, diag); |
| 384 | return false; |
| 385 | } |
| 386 | |
| 387 | const size_t total_size = EncodedLengthUnits<char>(utf16_length) |
| 388 | + EncodedLengthUnits<char>(encoded.size()) + encoded.size() + 1; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 389 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 390 | char* data = out->NextBlock<char>(total_size); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 391 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 392 | // First encode the UTF16 string length. |
| 393 | data = EncodeLength(data, utf16_length); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 394 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 395 | // Now encode the size of the real UTF8 string. |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 396 | data = EncodeLength(data, encoded.size()); |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 397 | strncpy(data, encoded.data(), encoded.size()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 398 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 399 | } else { |
| 400 | const std::u16string encoded = util::Utf8ToUtf16(str); |
| 401 | const ssize_t utf16_length = encoded.size(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 402 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 403 | // Make sure the length to be encoded does not exceed the maximum possible |
| 404 | // length that can be encoded |
| 405 | if (((size_t)utf16_length) > EncodeLengthMax<char16_t>()) { |
| 406 | diag->Error(DiagMessage() << "string too large to encode using UTF-16 " |
| 407 | << "written instead as '" << kStringTooLarge << "'"); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 408 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 409 | EncodeString(kStringTooLarge, utf8, out, diag); |
| 410 | return false; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 411 | } |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 412 | |
| 413 | // Total number of 16-bit words to write. |
| 414 | const size_t total_size = EncodedLengthUnits<char16_t>(utf16_length) |
| 415 | + encoded.size() + 1; |
| 416 | |
| 417 | char16_t* data = out->NextBlock<char16_t>(total_size); |
| 418 | |
| 419 | // Encode the actual UTF16 string length. |
| 420 | data = EncodeLength(data, utf16_length); |
| 421 | const size_t byte_length = encoded.size() * sizeof(char16_t); |
| 422 | |
| 423 | // NOTE: For some reason, strncpy16(data, entry->value.data(), |
| 424 | // entry->value.size()) truncates the string. |
| 425 | memcpy(data, encoded.data(), byte_length); |
| 426 | |
| 427 | // The null-terminating character is already here due to the block of data |
| 428 | // being set to 0s on allocation. |
| 429 | } |
| 430 | |
| 431 | return true; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 432 | } |
| 433 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 434 | bool StringPool::Flatten(BigBuffer* out, const StringPool& pool, bool utf8, |
| 435 | IDiagnostics* diag) { |
| 436 | bool no_error = true; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 437 | const size_t start_index = out->size(); |
| 438 | android::ResStringPool_header* header = out->NextBlock<android::ResStringPool_header>(); |
| 439 | header->header.type = util::HostToDevice16(android::RES_STRING_POOL_TYPE); |
| 440 | header->header.headerSize = util::HostToDevice16(sizeof(*header)); |
| 441 | header->stringCount = util::HostToDevice32(pool.size()); |
| 442 | header->styleCount = util::HostToDevice32(pool.styles_.size()); |
| 443 | if (utf8) { |
| 444 | header->flags |= android::ResStringPool_header::UTF8_FLAG; |
| 445 | } |
| 446 | |
| 447 | uint32_t* indices = pool.size() != 0 ? out->NextBlock<uint32_t>(pool.size()) : nullptr; |
| 448 | uint32_t* style_indices = |
| 449 | pool.styles_.size() != 0 ? out->NextBlock<uint32_t>(pool.styles_.size()) : nullptr; |
| 450 | |
| 451 | const size_t before_strings_index = out->size(); |
| 452 | header->stringsStart = before_strings_index - start_index; |
| 453 | |
| 454 | // Styles always come first. |
| 455 | for (const std::unique_ptr<StyleEntry>& entry : pool.styles_) { |
| 456 | *indices++ = out->size() - before_strings_index; |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 457 | no_error = EncodeString(entry->value, utf8, out, diag) && no_error; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 458 | } |
| 459 | |
| 460 | for (const std::unique_ptr<Entry>& entry : pool.strings_) { |
| 461 | *indices++ = out->size() - before_strings_index; |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 462 | no_error = EncodeString(entry->value, utf8, out, diag) && no_error; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 463 | } |
| 464 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 465 | out->Align4(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 466 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 467 | if (style_indices != nullptr) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 468 | const size_t before_styles_index = out->size(); |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 469 | header->stylesStart = util::HostToDevice32(before_styles_index - start_index); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 470 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 471 | for (const std::unique_ptr<StyleEntry>& entry : pool.styles_) { |
| 472 | *style_indices++ = out->size() - before_styles_index; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 473 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 474 | if (!entry->spans.empty()) { |
| 475 | android::ResStringPool_span* span = |
| 476 | out->NextBlock<android::ResStringPool_span>(entry->spans.size()); |
| 477 | for (const Span& s : entry->spans) { |
| 478 | span->name.index = util::HostToDevice32(s.name.index()); |
| 479 | span->firstChar = util::HostToDevice32(s.first_char); |
| 480 | span->lastChar = util::HostToDevice32(s.last_char); |
| 481 | span++; |
| 482 | } |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 483 | } |
| 484 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 485 | uint32_t* spanEnd = out->NextBlock<uint32_t>(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 486 | *spanEnd = android::ResStringPool_span::END; |
Adam Lesinski | 24aad16 | 2015-04-24 19:19:30 -0700 | [diff] [blame] | 487 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 488 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 489 | // The error checking code in the platform looks for an entire |
| 490 | // ResStringPool_span structure worth of 0xFFFFFFFF at the end |
| 491 | // of the style block, so fill in the remaining 2 32bit words |
| 492 | // with 0xFFFFFFFF. |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 493 | const size_t padding_length = sizeof(android::ResStringPool_span) - |
| 494 | sizeof(android::ResStringPool_span::name); |
| 495 | uint8_t* padding = out->NextBlock<uint8_t>(padding_length); |
| 496 | memset(padding, 0xff, padding_length); |
| 497 | out->Align4(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 498 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 499 | header->header.size = util::HostToDevice32(out->size() - start_index); |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 500 | return no_error; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 501 | } |
| 502 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 503 | bool StringPool::FlattenUtf8(BigBuffer* out, const StringPool& pool, IDiagnostics* diag) { |
| 504 | return Flatten(out, pool, true, diag); |
Adam Lesinski | 24aad16 | 2015-04-24 19:19:30 -0700 | [diff] [blame] | 505 | } |
| 506 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame] | 507 | bool StringPool::FlattenUtf16(BigBuffer* out, const StringPool& pool, IDiagnostics* diag) { |
| 508 | return Flatten(out, pool, false, diag); |
Adam Lesinski | 24aad16 | 2015-04-24 19:19:30 -0700 | [diff] [blame] | 509 | } |
| 510 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 511 | } // namespace aapt |