Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2015 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
Adam Lesinski | 52364f7 | 2016-01-11 13:10:24 -0800 | [diff] [blame] | 17 | #include "StringPool.h" |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 18 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 19 | #include <algorithm> |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 20 | #include <memory> |
| 21 | #include <string> |
| 22 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 23 | #include "android-base/logging.h" |
| 24 | #include "androidfw/ResourceTypes.h" |
Adam Lesinski | d5083f6 | 2017-01-16 15:07:21 -0800 | [diff] [blame] | 25 | #include "androidfw/StringPiece.h" |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 26 | |
| 27 | #include "util/BigBuffer.h" |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 28 | #include "util/Util.h" |
| 29 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 30 | using ::android::StringPiece; |
Adam Lesinski | d5083f6 | 2017-01-16 15:07:21 -0800 | [diff] [blame] | 31 | |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 32 | namespace aapt { |
| 33 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 34 | StringPool::Ref::Ref() : entry_(nullptr) {} |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 35 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 36 | StringPool::Ref::Ref(const StringPool::Ref& rhs) : entry_(rhs.entry_) { |
| 37 | if (entry_ != nullptr) { |
| 38 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 39 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 40 | } |
| 41 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 42 | StringPool::Ref::Ref(StringPool::Entry* entry) : entry_(entry) { |
| 43 | if (entry_ != nullptr) { |
| 44 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 45 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 46 | } |
| 47 | |
| 48 | StringPool::Ref::~Ref() { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 49 | if (entry_ != nullptr) { |
| 50 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 51 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 52 | } |
| 53 | |
| 54 | StringPool::Ref& StringPool::Ref::operator=(const StringPool::Ref& rhs) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 55 | if (rhs.entry_ != nullptr) { |
| 56 | rhs.entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 57 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 58 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 59 | if (entry_ != nullptr) { |
| 60 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 61 | } |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 62 | entry_ = rhs.entry_; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 63 | return *this; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 64 | } |
| 65 | |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 66 | bool StringPool::Ref::operator==(const Ref& rhs) const { |
| 67 | return entry_->value == rhs.entry_->value; |
| 68 | } |
| 69 | |
| 70 | bool StringPool::Ref::operator!=(const Ref& rhs) const { |
| 71 | return entry_->value != rhs.entry_->value; |
| 72 | } |
| 73 | |
Adam Lesinski | d0f116b | 2016-07-08 15:00:32 -0700 | [diff] [blame] | 74 | const std::string* StringPool::Ref::operator->() const { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 75 | return &entry_->value; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 76 | } |
| 77 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 78 | const std::string& StringPool::Ref::operator*() const { |
| 79 | return entry_->value; |
| 80 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 81 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 82 | size_t StringPool::Ref::index() const { |
| 83 | // Account for the styles, which *always* come first. |
| 84 | return entry_->pool_->styles_.size() + entry_->index_; |
| 85 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 86 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 87 | const StringPool::Context& StringPool::Ref::GetContext() const { |
| 88 | return entry_->context; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 89 | } |
| 90 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 91 | StringPool::StyleRef::StyleRef() : entry_(nullptr) {} |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 92 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 93 | StringPool::StyleRef::StyleRef(const StringPool::StyleRef& rhs) |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 94 | : entry_(rhs.entry_) { |
| 95 | if (entry_ != nullptr) { |
| 96 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 97 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 98 | } |
| 99 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 100 | StringPool::StyleRef::StyleRef(StringPool::StyleEntry* entry) : entry_(entry) { |
| 101 | if (entry_ != nullptr) { |
| 102 | entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 103 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 104 | } |
| 105 | |
| 106 | StringPool::StyleRef::~StyleRef() { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 107 | if (entry_ != nullptr) { |
| 108 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 109 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 110 | } |
| 111 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 112 | StringPool::StyleRef& StringPool::StyleRef::operator=(const StringPool::StyleRef& rhs) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 113 | if (rhs.entry_ != nullptr) { |
| 114 | rhs.entry_->ref_++; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 115 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 116 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 117 | if (entry_ != nullptr) { |
| 118 | entry_->ref_--; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 119 | } |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 120 | entry_ = rhs.entry_; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 121 | return *this; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 122 | } |
| 123 | |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 124 | bool StringPool::StyleRef::operator==(const StyleRef& rhs) const { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 125 | if (entry_->value != rhs.entry_->value) { |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 126 | return false; |
| 127 | } |
| 128 | |
| 129 | if (entry_->spans.size() != rhs.entry_->spans.size()) { |
| 130 | return false; |
| 131 | } |
| 132 | |
| 133 | auto rhs_iter = rhs.entry_->spans.begin(); |
| 134 | for (const Span& span : entry_->spans) { |
| 135 | const Span& rhs_span = *rhs_iter; |
| 136 | if (span.first_char != rhs_span.first_char || span.last_char != rhs_span.last_char || |
| 137 | span.name != rhs_span.name) { |
| 138 | return false; |
| 139 | } |
| 140 | } |
| 141 | return true; |
| 142 | } |
| 143 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 144 | bool StringPool::StyleRef::operator!=(const StyleRef& rhs) const { |
| 145 | return !operator==(rhs); |
| 146 | } |
Adam Lesinski | 7542162 | 2017-01-06 15:20:04 -0800 | [diff] [blame] | 147 | |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 148 | const StringPool::StyleEntry* StringPool::StyleRef::operator->() const { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 149 | return entry_; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 150 | } |
| 151 | |
| 152 | const StringPool::StyleEntry& StringPool::StyleRef::operator*() const { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 153 | return *entry_; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 154 | } |
| 155 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 156 | size_t StringPool::StyleRef::index() const { |
| 157 | return entry_->index_; |
| 158 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 159 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 160 | const StringPool::Context& StringPool::StyleRef::GetContext() const { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 161 | return entry_->context; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 162 | } |
| 163 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 164 | StringPool::Ref StringPool::MakeRef(const StringPiece& str) { |
| 165 | return MakeRefImpl(str, Context{}, true); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 166 | } |
| 167 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 168 | StringPool::Ref StringPool::MakeRef(const StringPiece& str, const Context& context) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 169 | return MakeRefImpl(str, context, true); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 170 | } |
| 171 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 172 | StringPool::Ref StringPool::MakeRefImpl(const StringPiece& str, const Context& context, |
| 173 | bool unique) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 174 | if (unique) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 175 | auto iter = indexed_strings_.find(str); |
| 176 | if (iter != std::end(indexed_strings_)) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 177 | return Ref(iter->second); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 178 | } |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 179 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 180 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 181 | std::unique_ptr<Entry> entry(new Entry()); |
Adam Lesinski | d5083f6 | 2017-01-16 15:07:21 -0800 | [diff] [blame] | 182 | entry->value = str.to_string(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 183 | entry->context = context; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 184 | entry->index_ = strings_.size(); |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 185 | entry->ref_ = 0; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 186 | entry->pool_ = this; |
| 187 | |
| 188 | Entry* borrow = entry.get(); |
| 189 | strings_.emplace_back(std::move(entry)); |
| 190 | indexed_strings_.insert(std::make_pair(StringPiece(borrow->value), borrow)); |
| 191 | return Ref(borrow); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 192 | } |
| 193 | |
Adam Lesinski | 8a0b238 | 2017-10-18 15:07:33 -0700 | [diff] [blame] | 194 | StringPool::Ref StringPool::MakeRef(const Ref& ref) { |
| 195 | if (ref.entry_->pool_ == this) { |
| 196 | return ref; |
| 197 | } |
| 198 | return MakeRef(ref.entry_->value, ref.entry_->context); |
| 199 | } |
| 200 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 201 | StringPool::StyleRef StringPool::MakeRef(const StyleString& str) { |
| 202 | return MakeRef(str, Context{}); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 203 | } |
| 204 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 205 | StringPool::StyleRef StringPool::MakeRef(const StyleString& str, const Context& context) { |
| 206 | std::unique_ptr<StyleEntry> entry(new StyleEntry()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 207 | entry->value = str.str; |
| 208 | entry->context = context; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 209 | entry->index_ = styles_.size(); |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 210 | entry->ref_ = 0; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 211 | for (const aapt::Span& span : str.spans) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 212 | entry->spans.emplace_back(Span{MakeRef(span.name), span.first_char, span.last_char}); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 213 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 214 | |
| 215 | StyleEntry* borrow = entry.get(); |
| 216 | styles_.emplace_back(std::move(entry)); |
| 217 | return StyleRef(borrow); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 218 | } |
| 219 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 220 | StringPool::StyleRef StringPool::MakeRef(const StyleRef& ref) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 221 | std::unique_ptr<StyleEntry> entry(new StyleEntry()); |
| 222 | entry->value = ref.entry_->value; |
| 223 | entry->context = ref.entry_->context; |
| 224 | entry->index_ = styles_.size(); |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 225 | entry->ref_ = 0; |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 226 | for (const Span& span : ref.entry_->spans) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 227 | entry->spans.emplace_back(Span{MakeRef(*span.name), span.first_char, span.last_char}); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 228 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 229 | |
| 230 | StyleEntry* borrow = entry.get(); |
| 231 | styles_.emplace_back(std::move(entry)); |
| 232 | return StyleRef(borrow); |
| 233 | } |
| 234 | |
| 235 | void StringPool::ReAssignIndices() { |
| 236 | // Assign the style indices. |
| 237 | const size_t style_len = styles_.size(); |
| 238 | for (size_t index = 0; index < style_len; index++) { |
| 239 | styles_[index]->index_ = index; |
| 240 | } |
| 241 | |
| 242 | // Assign the string indices. |
| 243 | const size_t string_len = strings_.size(); |
| 244 | for (size_t index = 0; index < string_len; index++) { |
| 245 | strings_[index]->index_ = index; |
| 246 | } |
Adam Lesinski | 769de98 | 2015-04-10 19:43:55 -0700 | [diff] [blame] | 247 | } |
| 248 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 249 | void StringPool::Merge(StringPool&& pool) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 250 | // First, change the owning pool for the incoming strings. |
| 251 | for (std::unique_ptr<Entry>& entry : pool.strings_) { |
| 252 | entry->pool_ = this; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 253 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 254 | |
| 255 | // Now move the styles, strings, and indices over. |
| 256 | std::move(pool.styles_.begin(), pool.styles_.end(), std::back_inserter(styles_)); |
| 257 | pool.styles_.clear(); |
| 258 | std::move(pool.strings_.begin(), pool.strings_.end(), std::back_inserter(strings_)); |
| 259 | pool.strings_.clear(); |
| 260 | indexed_strings_.insert(pool.indexed_strings_.begin(), pool.indexed_strings_.end()); |
| 261 | pool.indexed_strings_.clear(); |
| 262 | |
| 263 | ReAssignIndices(); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 264 | } |
| 265 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 266 | void StringPool::HintWillAdd(size_t string_count, size_t style_count) { |
| 267 | strings_.reserve(strings_.size() + string_count); |
| 268 | styles_.reserve(styles_.size() + style_count); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 269 | } |
| 270 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 271 | void StringPool::Prune() { |
| 272 | const auto iter_end = indexed_strings_.end(); |
| 273 | auto index_iter = indexed_strings_.begin(); |
| 274 | while (index_iter != iter_end) { |
| 275 | if (index_iter->second->ref_ <= 0) { |
| 276 | index_iter = indexed_strings_.erase(index_iter); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 277 | } else { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 278 | ++index_iter; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 279 | } |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 280 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 281 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 282 | auto end_iter2 = |
| 283 | std::remove_if(strings_.begin(), strings_.end(), |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 284 | [](const std::unique_ptr<Entry>& entry) -> bool { return entry->ref_ <= 0; }); |
| 285 | auto end_iter3 = std::remove_if( |
| 286 | styles_.begin(), styles_.end(), |
| 287 | [](const std::unique_ptr<StyleEntry>& entry) -> bool { return entry->ref_ <= 0; }); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 288 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 289 | // Remove the entries at the end or else we'll be accessing a deleted string from the StyleEntry. |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 290 | strings_.erase(end_iter2, strings_.end()); |
| 291 | styles_.erase(end_iter3, styles_.end()); |
Adam Lesinski | 1ab598f | 2015-08-14 14:26:04 -0700 | [diff] [blame] | 292 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 293 | ReAssignIndices(); |
| 294 | } |
| 295 | |
| 296 | template <typename E> |
| 297 | static void SortEntries( |
| 298 | std::vector<std::unique_ptr<E>>& entries, |
| 299 | const std::function<int(const StringPool::Context&, const StringPool::Context&)>& cmp) { |
| 300 | using UEntry = std::unique_ptr<E>; |
| 301 | |
| 302 | if (cmp != nullptr) { |
| 303 | std::sort(entries.begin(), entries.end(), [&cmp](const UEntry& a, const UEntry& b) -> bool { |
| 304 | int r = cmp(a->context, b->context); |
| 305 | if (r == 0) { |
| 306 | r = a->value.compare(b->value); |
| 307 | } |
| 308 | return r < 0; |
| 309 | }); |
| 310 | } else { |
| 311 | std::sort(entries.begin(), entries.end(), |
| 312 | [](const UEntry& a, const UEntry& b) -> bool { return a->value < b->value; }); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 313 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 314 | } |
| 315 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 316 | void StringPool::Sort(const std::function<int(const Context&, const Context&)>& cmp) { |
| 317 | SortEntries(styles_, cmp); |
| 318 | SortEntries(strings_, cmp); |
| 319 | ReAssignIndices(); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 320 | } |
| 321 | |
// Writes `length` at `data` using the pool's one-or-two-unit length encoding
// and returns the position just past the last unit written.
//
// A length that fits in the low (bits - 1) bits of T is written as one unit.
// A larger length is written as two units: first the high part with T's top
// bit set as a marker, then the low part (the length truncated to T's width).
template <typename T>
static T* EncodeLength(T* data, size_t length) {
  static_assert(std::is_integral<T>::value, "wat.");
  static_assert(sizeof(T) < sizeof(size_t), "length unit must be narrower than size_t");

  constexpr size_t kBits = sizeof(T) * 8;
  // Build the mask in size_t; shifting an int literal overflows once T is 4 bytes wide.
  constexpr size_t kMask = static_cast<size_t>(1) << (kBits - 1);
  constexpr size_t kMaxSize = kMask - 1;
  if (length > kMaxSize) {
    *data++ = static_cast<T>(kMask | (kMaxSize & (length >> kBits)));
  }
  // Deliberate truncation: only the low kBits of the length go in this unit.
  *data++ = static_cast<T>(length);
  return data;
}
| 334 | |
/**
 * Returns the maximum possible string length that can be successfully encoded
 * using 2 units of the specified T.
 *    EncodeLengthMax<char> -> maximum unit length of 0x7FFF
 *    EncodeLengthMax<char16_t> -> maximum unit length of 0x7FFFFFFF
 *
 * The mask is built in size_t. Shifting an int literal by 31 (the char16_t
 * case) produces a negative int that sign-extends when widened to a 64-bit
 * size_t, which would make the reported maximum far too large.
 **/
template <typename T>
static size_t EncodeLengthMax() {
  static_assert(std::is_integral<T>::value, "wat.");
  static_assert(sizeof(T) * 2 <= sizeof(size_t), "two units of T must fit in size_t");

  constexpr size_t kMask = static_cast<size_t>(1) << ((sizeof(T) * 8 * 2) - 1);
  constexpr size_t max = kMask - 1;
  return max;
}
| 349 | |
/**
 * Returns the number of units (1 or 2) needed to encode the string length
 * before writing the string.
 *
 * One unit is enough when the length fits in the low (bits - 1) bits of T;
 * anything larger needs two. The threshold is computed in size_t so the
 * shift cannot overflow int for wider T.
 */
template <typename T>
static size_t EncodedLengthUnits(size_t length) {
  static_assert(std::is_integral<T>::value, "wat.");
  static_assert(sizeof(T) <= sizeof(size_t), "length unit must fit in size_t");

  constexpr size_t kMask = static_cast<size_t>(1) << ((sizeof(T) * 8) - 1);
  constexpr size_t kMaxSize = kMask - 1;
  return length > kMaxSize ? 2 : 1;
}
| 362 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 363 | const std::string kStringTooLarge = "STRING_TOO_LARGE"; |
| 364 | |
| 365 | static bool EncodeString(const std::string& str, const bool utf8, BigBuffer* out, |
| 366 | IDiagnostics* diag) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 367 | if (utf8) { |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 368 | const std::string& encoded = str; |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 369 | const ssize_t utf16_length = utf8_to_utf16_length( |
| 370 | reinterpret_cast<const uint8_t*>(encoded.data()), encoded.size()); |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 371 | CHECK(utf16_length >= 0); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 372 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 373 | // Make sure the lengths to be encoded do not exceed the maximum length that |
| 374 | // can be encoded using chars |
| 375 | if ((((size_t)encoded.size()) > EncodeLengthMax<char>()) |
| 376 | || (((size_t)utf16_length) > EncodeLengthMax<char>())) { |
| 377 | |
| 378 | diag->Error(DiagMessage() << "string too large to encode using UTF-8 " |
| 379 | << "written instead as '" << kStringTooLarge << "'"); |
| 380 | |
| 381 | EncodeString(kStringTooLarge, utf8, out, diag); |
| 382 | return false; |
| 383 | } |
| 384 | |
| 385 | const size_t total_size = EncodedLengthUnits<char>(utf16_length) |
| 386 | + EncodedLengthUnits<char>(encoded.size()) + encoded.size() + 1; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 387 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 388 | char* data = out->NextBlock<char>(total_size); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 389 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 390 | // First encode the UTF16 string length. |
| 391 | data = EncodeLength(data, utf16_length); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 392 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 393 | // Now encode the size of the real UTF8 string. |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 394 | data = EncodeLength(data, encoded.size()); |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 395 | strncpy(data, encoded.data(), encoded.size()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 396 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 397 | } else { |
| 398 | const std::u16string encoded = util::Utf8ToUtf16(str); |
| 399 | const ssize_t utf16_length = encoded.size(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 400 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 401 | // Make sure the length to be encoded does not exceed the maximum possible |
| 402 | // length that can be encoded |
| 403 | if (((size_t)utf16_length) > EncodeLengthMax<char16_t>()) { |
| 404 | diag->Error(DiagMessage() << "string too large to encode using UTF-16 " |
| 405 | << "written instead as '" << kStringTooLarge << "'"); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 406 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 407 | EncodeString(kStringTooLarge, utf8, out, diag); |
| 408 | return false; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 409 | } |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 410 | |
| 411 | // Total number of 16-bit words to write. |
| 412 | const size_t total_size = EncodedLengthUnits<char16_t>(utf16_length) |
| 413 | + encoded.size() + 1; |
| 414 | |
| 415 | char16_t* data = out->NextBlock<char16_t>(total_size); |
| 416 | |
| 417 | // Encode the actual UTF16 string length. |
| 418 | data = EncodeLength(data, utf16_length); |
| 419 | const size_t byte_length = encoded.size() * sizeof(char16_t); |
| 420 | |
| 421 | // NOTE: For some reason, strncpy16(data, entry->value.data(), |
| 422 | // entry->value.size()) truncates the string. |
| 423 | memcpy(data, encoded.data(), byte_length); |
| 424 | |
| 425 | // The null-terminating character is already here due to the block of data |
| 426 | // being set to 0s on allocation. |
| 427 | } |
| 428 | |
| 429 | return true; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 430 | } |
| 431 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 432 | bool StringPool::Flatten(BigBuffer* out, const StringPool& pool, bool utf8, |
| 433 | IDiagnostics* diag) { |
| 434 | bool no_error = true; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 435 | const size_t start_index = out->size(); |
| 436 | android::ResStringPool_header* header = out->NextBlock<android::ResStringPool_header>(); |
| 437 | header->header.type = util::HostToDevice16(android::RES_STRING_POOL_TYPE); |
| 438 | header->header.headerSize = util::HostToDevice16(sizeof(*header)); |
| 439 | header->stringCount = util::HostToDevice32(pool.size()); |
| 440 | header->styleCount = util::HostToDevice32(pool.styles_.size()); |
| 441 | if (utf8) { |
| 442 | header->flags |= android::ResStringPool_header::UTF8_FLAG; |
| 443 | } |
| 444 | |
| 445 | uint32_t* indices = pool.size() != 0 ? out->NextBlock<uint32_t>(pool.size()) : nullptr; |
| 446 | uint32_t* style_indices = |
| 447 | pool.styles_.size() != 0 ? out->NextBlock<uint32_t>(pool.styles_.size()) : nullptr; |
| 448 | |
| 449 | const size_t before_strings_index = out->size(); |
| 450 | header->stringsStart = before_strings_index - start_index; |
| 451 | |
| 452 | // Styles always come first. |
| 453 | for (const std::unique_ptr<StyleEntry>& entry : pool.styles_) { |
| 454 | *indices++ = out->size() - before_strings_index; |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 455 | no_error = EncodeString(entry->value, utf8, out, diag) && no_error; |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 456 | } |
| 457 | |
| 458 | for (const std::unique_ptr<Entry>& entry : pool.strings_) { |
| 459 | *indices++ = out->size() - before_strings_index; |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 460 | no_error = EncodeString(entry->value, utf8, out, diag) && no_error; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 461 | } |
| 462 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 463 | out->Align4(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 464 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 465 | if (style_indices != nullptr) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 466 | const size_t before_styles_index = out->size(); |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 467 | header->stylesStart = util::HostToDevice32(before_styles_index - start_index); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 468 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 469 | for (const std::unique_ptr<StyleEntry>& entry : pool.styles_) { |
| 470 | *style_indices++ = out->size() - before_styles_index; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 471 | |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 472 | if (!entry->spans.empty()) { |
| 473 | android::ResStringPool_span* span = |
| 474 | out->NextBlock<android::ResStringPool_span>(entry->spans.size()); |
| 475 | for (const Span& s : entry->spans) { |
| 476 | span->name.index = util::HostToDevice32(s.name.index()); |
| 477 | span->firstChar = util::HostToDevice32(s.first_char); |
| 478 | span->lastChar = util::HostToDevice32(s.last_char); |
| 479 | span++; |
| 480 | } |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 481 | } |
| 482 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 483 | uint32_t* spanEnd = out->NextBlock<uint32_t>(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 484 | *spanEnd = android::ResStringPool_span::END; |
Adam Lesinski | 24aad16 | 2015-04-24 19:19:30 -0700 | [diff] [blame] | 485 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 486 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 487 | // The error checking code in the platform looks for an entire |
| 488 | // ResStringPool_span structure worth of 0xFFFFFFFF at the end |
| 489 | // of the style block, so fill in the remaining 2 32bit words |
| 490 | // with 0xFFFFFFFF. |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 491 | const size_t padding_length = sizeof(android::ResStringPool_span) - |
| 492 | sizeof(android::ResStringPool_span::name); |
| 493 | uint8_t* padding = out->NextBlock<uint8_t>(padding_length); |
| 494 | memset(padding, 0xff, padding_length); |
| 495 | out->Align4(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 496 | } |
Adam Lesinski | 5b6ee11 | 2017-07-28 17:10:35 -0700 | [diff] [blame] | 497 | header->header.size = util::HostToDevice32(out->size() - start_index); |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 498 | return no_error; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 499 | } |
| 500 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 501 | bool StringPool::FlattenUtf8(BigBuffer* out, const StringPool& pool, IDiagnostics* diag) { |
| 502 | return Flatten(out, pool, true, diag); |
Adam Lesinski | 24aad16 | 2015-04-24 19:19:30 -0700 | [diff] [blame] | 503 | } |
| 504 | |
Ryan Mitchell | 70414f2 | 2018-03-26 11:05:31 -0700 | [diff] [blame^] | 505 | bool StringPool::FlattenUtf16(BigBuffer* out, const StringPool& pool, IDiagnostics* diag) { |
| 506 | return Flatten(out, pool, false, diag); |
Adam Lesinski | 24aad16 | 2015-04-24 19:19:30 -0700 | [diff] [blame] | 507 | } |
| 508 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 509 | } // namespace aapt |