Blame - tools/aapt2/util/Util.cpp - platform_frameworks_base

blob: b0bec624cc9cd065a968fa95c41482cc560778cc [file] [log] [blame]

Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	1	/*
				2	* Copyright (C) 2015 The Android Open Source Project
				3	*
				4	* Licensed under the Apache License, Version 2.0 (the "License");
				5	* you may not use this file except in compliance with the License.
				6	* You may obtain a copy of the License at
				7	*
				8	* http://www.apache.org/licenses/LICENSE-2.0
				9	*
				10	* Unless required by applicable law or agreed to in writing, software
				11	* distributed under the License is distributed on an "AS IS" BASIS,
				12	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
				13	* See the License for the specific language governing permissions and
				14	* limitations under the License.
				15	*/
				16
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	17	#include "util/BigBuffer.h"
				18	#include "util/Maybe.h"
				19	#include "util/StringPiece.h"
				20	#include "util/Util.h"
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	21
				22	#include <algorithm>
				23	#include <ostream>
				24	#include <string>
				25	#include <utils/Unicode.h>
				26	#include <vector>
				27
				28	namespace aapt {
				29	namespace util {
				30
				31	static std::vector<std::string> splitAndTransform(const StringPiece& str, char sep,
				32	const std::function<char(char)>& f) {
				33	std::vector<std::string> parts;
				34	const StringPiece::const_iterator end = std::end(str);
				35	StringPiece::const_iterator start = std::begin(str);
				36	StringPiece::const_iterator current;
				37	do {
				38	current = std::find(start, end, sep);
				39	parts.emplace_back(str.substr(start, current).toString());
				40	if (f) {
				41	std::string& part = parts.back();
				42	std::transform(part.begin(), part.end(), part.begin(), f);
				43	}
				44	start = current + 1;
				45	} while (current != end);
				46	return parts;
				47	}
				48
				49	std::vector<std::string> split(const StringPiece& str, char sep) {
				50	return splitAndTransform(str, sep, nullptr);
				51	}
				52
				53	std::vector<std::string> splitAndLowercase(const StringPiece& str, char sep) {
				54	return splitAndTransform(str, sep, ::tolower);
				55	}
				56
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	57	bool stringStartsWith(const StringPiece& str, const StringPiece& prefix) {
				58	if (str.size() < prefix.size()) {
				59	return false;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	60	}
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	61	return str.substr(0, prefix.size()) == prefix;
				62	}
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	63
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	64	bool stringEndsWith(const StringPiece& str, const StringPiece& suffix) {
				65	if (str.size() < suffix.size()) {
				66	return false;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	67	}
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	68	return str.substr(str.size() - suffix.size(), suffix.size()) == suffix;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	69	}
				70
Adam Lesinski	3b4cd94	2015-10-30 16:31:42 -0700	[diff] [blame]	71	StringPiece trimWhitespace(const StringPiece& str) {
				72	if (str.size() == 0 \|\| str.data() == nullptr) {
				73	return str;
				74	}
				75
				76	const char* start = str.data();
				77	const char* end = str.data() + str.length();
				78
				79	while (start != end && isspace(*start)) {
				80	start++;
				81	}
				82
				83	while (end != start && isspace(*(end - 1))) {
				84	end--;
				85	}
				86
				87	return StringPiece(start, end - start);
				88	}
				89
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	90	StringPiece::const_iterator findNonAlphaNumericAndNotInSet(const StringPiece& str,
				91	const StringPiece& allowedChars) {
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	92	const auto endIter = str.end();
				93	for (auto iter = str.begin(); iter != endIter; ++iter) {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	94	char c = *iter;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	95	if ((c >= u'a' && c <= u'z') \|\|
				96	(c >= u'A' && c <= u'Z') \|\|
				97	(c >= u'0' && c <= u'9')) {
				98	continue;
				99	}
				100
				101	bool match = false;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	102	for (char i : allowedChars) {
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	103	if (c == i) {
				104	match = true;
				105	break;
				106	}
				107	}
				108
				109	if (!match) {
				110	return iter;
				111	}
				112	}
				113	return endIter;
				114	}
				115
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	116	bool isJavaClassName(const StringPiece& str) {
Adam Lesinski	a1ad4a8	2015-06-08 11:41:09 -0700	[diff] [blame]	117	size_t pieces = 0;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	118	for (const StringPiece& piece : tokenize(str, '.')) {
Adam Lesinski	a1ad4a8	2015-06-08 11:41:09 -0700	[diff] [blame]	119	pieces++;
				120	if (piece.empty()) {
				121	return false;
				122	}
				123
				124	// Can't have starting or trailing $ character.
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	125	if (piece.data()[0] == '$' \|\| piece.data()[piece.size() - 1] == '$') {
Adam Lesinski	a1ad4a8	2015-06-08 11:41:09 -0700	[diff] [blame]	126	return false;
				127	}
				128
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	129	if (findNonAlphaNumericAndNotInSet(piece, "$_") != piece.end()) {
Adam Lesinski	a1ad4a8	2015-06-08 11:41:09 -0700	[diff] [blame]	130	return false;
				131	}
				132	}
				133	return pieces >= 2;
				134	}
				135
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	136	bool isJavaPackageName(const StringPiece& str) {
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	137	if (str.empty()) {
				138	return false;
				139	}
				140
				141	size_t pieces = 0;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	142	for (const StringPiece& piece : tokenize(str, '.')) {
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	143	pieces++;
				144	if (piece.empty()) {
				145	return false;
				146	}
				147
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	148	if (piece.data()[0] == '_' \|\| piece.data()[piece.size() - 1] == '_') {
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	149	return false;
				150	}
				151
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	152	if (findNonAlphaNumericAndNotInSet(piece, "_") != piece.end()) {
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	153	return false;
				154	}
				155	}
				156	return pieces >= 1;
				157	}
				158
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	159	Maybe<std::string> getFullyQualifiedClassName(const StringPiece& package,
				160	const StringPiece& className) {
Adam Lesinski	a1ad4a8	2015-06-08 11:41:09 -0700	[diff] [blame]	161	if (className.empty()) {
				162	return {};
				163	}
				164
				165	if (util::isJavaClassName(className)) {
				166	return className.toString();
				167	}
				168
				169	if (package.empty()) {
				170	return {};
				171	}
				172
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	173	std::string result(package.data(), package.size());
				174	if (className.data()[0] != '.') {
				175	result += '.';
Adam Lesinski	a1ad4a8	2015-06-08 11:41:09 -0700	[diff] [blame]	176	}
Adam Lesinski	52364f7	2016-01-11 13:10:24 -0800	[diff] [blame]	177
Adam Lesinski	a1ad4a8	2015-06-08 11:41:09 -0700	[diff] [blame]	178	result.append(className.data(), className.size());
				179	if (!isJavaClassName(result)) {
				180	return {};
				181	}
				182	return result;
				183	}
				184
/**
 * Counts the run of ASCII decimal digits at the beginning of [start, end).
 *
 * @param start first character to inspect.
 * @param end   one past the last character that may be inspected.
 * @return the number of leading characters in '0'..'9'; 0 if the range is empty or does
 *         not begin with a digit.
 */
static size_t consumeDigits(const char* start, const char* end) {
    const char* c = start;
    // Compare the character that is pointed at, not the pointer itself.
    while (c != end && *c >= '0' && *c <= '9') {
        ++c;
    }
    return static_cast<size_t>(c - start);
}
				190
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	191	bool verifyJavaStringFormat(const StringPiece& str) {
				192	const char* c = str.begin();
				193	const char* const end = str.end();
Adam Lesinski	b23f1e0	2015-11-03 12:24:17 -0800	[diff] [blame]	194
				195	size_t argCount = 0;
				196	bool nonpositional = false;
				197	while (c != end) {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	198	if (*c == '%' && c + 1 < end) {
Adam Lesinski	b23f1e0	2015-11-03 12:24:17 -0800	[diff] [blame]	199	c++;
				200
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	201	if (*c == '%') {
Adam Lesinski	b23f1e0	2015-11-03 12:24:17 -0800	[diff] [blame]	202	c++;
				203	continue;
				204	}
				205
				206	argCount++;
				207
				208	size_t numDigits = consumeDigits(c, end);
				209	if (numDigits > 0) {
				210	c += numDigits;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	211	if (c != end && *c != '$') {
Adam Lesinski	b23f1e0	2015-11-03 12:24:17 -0800	[diff] [blame]	212	// The digits were a size, but not a positional argument.
				213	nonpositional = true;
				214	}
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	215	} else if (*c == '<') {
Adam Lesinski	b23f1e0	2015-11-03 12:24:17 -0800	[diff] [blame]	216	// Reusing last argument, bad idea since positions can be moved around
				217	// during translation.
				218	nonpositional = true;
				219
				220	c++;
				221
				222	// Optionally we can have a $ after
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	223	if (c != end && *c == '$') {
Adam Lesinski	b23f1e0	2015-11-03 12:24:17 -0800	[diff] [blame]	224	c++;
				225	}
				226	} else {
				227	nonpositional = true;
				228	}
				229
				230	// Ignore size, width, flags, etc.
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	231	while (c != end && (*c == '-' \|\|
				232	*c == '#' \|\|
				233	*c == '+' \|\|
				234	*c == ' ' \|\|
				235	*c == ',' \|\|
				236	*c == '(' \|\|
				237	(c >= '0' && c <= '9'))) {
Adam Lesinski	b23f1e0	2015-11-03 12:24:17 -0800	[diff] [blame]	238	c++;
				239	}
				240
				241	/*
				242	* This is a shortcut to detect strings that are going to Time.format()
				243	* instead of String.format()
				244	*
				245	* Comparison of String.format() and Time.format() args:
				246	*
				247	* String: ABC E GH ST X abcdefgh nost x
				248	* Time: DEFGHKMS W Za d hkm s w yz
				249	*
				250	* Therefore we know it's definitely Time if we have:
				251	* DFKMWZkmwyz
				252	*/
				253	if (c != end) {
				254	switch (*c) {
				255	case 'D':
				256	case 'F':
				257	case 'K':
				258	case 'M':
				259	case 'W':
				260	case 'Z':
				261	case 'k':
				262	case 'm':
				263	case 'w':
				264	case 'y':
				265	case 'z':
				266	return true;
				267	}
				268	}
				269	}
				270
				271	if (c != end) {
				272	c++;
				273	}
				274	}
				275
				276	if (argCount > 1 && nonpositional) {
				277	// Multiple arguments were specified, but some or all were non positional. Translated
				278	// strings may rearrange the order of the arguments, which will break the string.
				279	return false;
				280	}
				281	return true;
				282	}
				283
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	284	static Maybe<std::string> parseUnicodeCodepoint(const char** start, const char* end) {
				285	char32_t code = 0;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	286	for (size_t i = 0; i < 4 && start != end; i++, (start)++) {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	287	char c = **start;
				288	char32_t a;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	289	if (c >= '0' && c <= '9') {
				290	a = c - '0';
				291	} else if (c >= 'a' && c <= 'f') {
				292	a = c - 'a' + 10;
				293	} else if (c >= 'A' && c <= 'F') {
				294	a = c - 'A' + 10;
				295	} else {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	296	return {};
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	297	}
				298	code = (code << 4) \| a;
				299	}
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	300
				301	ssize_t len = utf32_to_utf8_length(&code, 1);
				302	if (len < 0) {
				303	return {};
				304	}
				305
				306	std::string resultUtf8;
				307	resultUtf8.resize(len);
				308	utf32_to_utf8(&code, 1, &*resultUtf8.begin(), len + 1);
				309	return resultUtf8;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	310	}
				311
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	312	StringBuilder& StringBuilder::append(const StringPiece& str) {
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	313	if (!mError.empty()) {
				314	return *this;
				315	}
				316
Adam Lesinski	8c3f31f	2016-09-07 13:45:13 -0700	[diff] [blame^]	317	// Where the new data will be appended to.
				318	size_t newDataIndex = mStr.size();
				319
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	320	const char* const end = str.end();
				321	const char* start = str.begin();
				322	const char* current = start;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	323	while (current != end) {
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	324	if (mLastCharWasEscape) {
				325	switch (*current) {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	326	case 't':
				327	mStr += '\t';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	328	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	329	case 'n':
				330	mStr += '\n';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	331	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	332	case '#':
				333	mStr += '#';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	334	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	335	case '@':
				336	mStr += '@';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	337	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	338	case '?':
				339	mStr += '?';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	340	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	341	case '"':
				342	mStr += '"';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	343	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	344	case '\'':
				345	mStr += '\'';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	346	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	347	case '\\':
				348	mStr += '\\';
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	349	break;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	350	case 'u': {
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	351	current++;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	352	Maybe<std::string> c = parseUnicodeCodepoint(&current, end);
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	353	if (!c) {
				354	mError = "invalid unicode escape sequence";
				355	return *this;
				356	}
				357	mStr += c.value();
				358	current -= 1;
				359	break;
				360	}
				361
				362	default:
				363	// Ignore.
				364	break;
				365	}
				366	mLastCharWasEscape = false;
				367	start = current + 1;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	368	} else if (*current == '"') {
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	369	if (!mQuote && mTrailingSpace) {
				370	// We found an opening quote, and we have
				371	// trailing space, so we should append that
				372	// space now.
				373	if (mTrailingSpace) {
				374	// We had trailing whitespace, so
				375	// replace with a single space.
				376	if (!mStr.empty()) {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	377	mStr += ' ';
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	378	}
				379	mTrailingSpace = false;
				380	}
				381	}
				382	mQuote = !mQuote;
				383	mStr.append(start, current - start);
				384	start = current + 1;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	385	} else if (*current == '\'' && !mQuote) {
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	386	// This should be escaped.
				387	mError = "unescaped apostrophe";
				388	return *this;
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	389	} else if (*current == '\\') {
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	390	// This is an escape sequence, convert to the real value.
				391	if (!mQuote && mTrailingSpace) {
				392	// We had trailing whitespace, so
				393	// replace with a single space.
				394	if (!mStr.empty()) {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	395	mStr += ' ';
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	396	}
				397	mTrailingSpace = false;
				398	}
				399	mStr.append(start, current - start);
				400	start = current + 1;
Adam Lesinski	9095988	2015-07-06 18:09:18 -0700	[diff] [blame]	401	mLastCharWasEscape = true;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	402	} else if (!mQuote) {
				403	// This is not quoted text, so look for whitespace.
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	404	if (isspace(*current)) {
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	405	// We found whitespace, see if we have seen some
				406	// before.
				407	if (!mTrailingSpace) {
				408	// We didn't see a previous adjacent space,
				409	// so mark that we did.
				410	mTrailingSpace = true;
				411	mStr.append(start, current - start);
				412	}
				413
				414	// Keep skipping whitespace.
				415	start = current + 1;
				416	} else if (mTrailingSpace) {
				417	// We saw trailing space before, so replace all
				418	// that trailing space with one space.
				419	if (!mStr.empty()) {
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	420	mStr += ' ';
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	421	}
				422	mTrailingSpace = false;
				423	}
				424	}
				425	current++;
				426	}
				427	mStr.append(start, end - start);
Adam Lesinski	8c3f31f	2016-09-07 13:45:13 -0700	[diff] [blame^]	428
				429	// Accumulate the added string's UTF-16 length.
				430	ssize_t len = utf8_to_utf16_length(
				431	reinterpret_cast<const uint8_t*>(mStr.data()) + newDataIndex,
				432	mStr.size() - newDataIndex);
				433	if (len < 0) {
				434	mError = "invalid unicode code point";
				435	return *this;
				436	}
				437	mUtf16Len += len;
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	438	return *this;
				439	}
				440
				441	std::u16string utf8ToUtf16(const StringPiece& utf8) {
				442	ssize_t utf16Length = utf8_to_utf16_length(reinterpret_cast<const uint8_t*>(utf8.data()),
				443	utf8.length());
				444	if (utf16Length <= 0) {
				445	return {};
				446	}
				447
				448	std::u16string utf16;
				449	utf16.resize(utf16Length);
Adam Lesinski	8c3f31f	2016-09-07 13:45:13 -0700	[diff] [blame^]	450	utf8_to_utf16(reinterpret_cast<const uint8_t*>(utf8.data()), utf8.length(),
				451	&*utf16.begin(), utf16Length + 1);
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	452	return utf16;
				453	}
				454
				455	std::string utf16ToUtf8(const StringPiece16& utf16) {
				456	ssize_t utf8Length = utf16_to_utf8_length(utf16.data(), utf16.length());
				457	if (utf8Length <= 0) {
				458	return {};
				459	}
				460
				461	std::string utf8;
				462	utf8.resize(utf8Length);
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	463	utf16_to_utf8(utf16.data(), utf16.length(), &*utf8.begin(), utf8Length + 1);
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	464	return utf8;
				465	}
				466
				467	bool writeAll(std::ostream& out, const BigBuffer& buffer) {
				468	for (const auto& b : buffer) {
				469	if (!out.write(reinterpret_cast<const char*>(b.buffer.get()), b.size)) {
				470	return false;
				471	}
				472	}
				473	return true;
				474	}
				475
				476	std::unique_ptr<uint8_t[]> copy(const BigBuffer& buffer) {
				477	std::unique_ptr<uint8_t[]> data = std::unique_ptr<uint8_t[]>(new uint8_t[buffer.size()]);
				478	uint8_t* p = data.get();
				479	for (const auto& block : buffer) {
				480	memcpy(p, block.buffer.get(), block.size);
				481	p += block.size;
				482	}
				483	return data;
				484	}
				485
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	486	typename Tokenizer::iterator& Tokenizer::iterator::operator++() {
				487	const char* start = mToken.end();
				488	const char* end = mStr.end();
				489	if (start == end) {
				490	mEnd = true;
				491	mToken.assign(mToken.end(), 0);
				492	return *this;
				493	}
				494
				495	start += 1;
				496	const char* current = start;
				497	while (current != end) {
				498	if (*current == mSeparator) {
				499	mToken.assign(start, current - start);
				500	return *this;
				501	}
				502	++current;
				503	}
				504	mToken.assign(start, end - start);
				505	return *this;
				506	}
				507
				508	bool Tokenizer::iterator::operator==(const iterator& rhs) const {
				509	// We check equality here a bit differently.
				510	// We need to know that the addresses are the same.
				511	return mToken.begin() == rhs.mToken.begin() && mToken.end() == rhs.mToken.end() &&
				512	mEnd == rhs.mEnd;
				513	}
				514
				515	bool Tokenizer::iterator::operator!=(const iterator& rhs) const {
				516	return !(*this == rhs);
				517	}
				518
				519	Tokenizer::iterator::iterator(StringPiece s, char sep, StringPiece tok, bool end) :
				520	mStr(s), mSeparator(sep), mToken(tok), mEnd(end) {
				521	}
				522
				523	Tokenizer::Tokenizer(StringPiece str, char sep) :
				524	mBegin(++iterator(str, sep, StringPiece(str.begin() - 1, 0), false)),
				525	mEnd(str, sep, StringPiece(str.end(), 0), true) {
				526	}
				527
				528	bool extractResFilePathParts(const StringPiece& path, StringPiece* outPrefix,
				529	StringPiece* outEntry, StringPiece* outSuffix) {
				530	const StringPiece resPrefix("res/");
				531	if (!stringStartsWith(path, resPrefix)) {
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	532	return false;
				533	}
				534
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	535	StringPiece::const_iterator lastOccurence = path.end();
				536	for (auto iter = path.begin() + resPrefix.size(); iter != path.end(); ++iter) {
				537	if (*iter == '/') {
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	538	lastOccurence = iter;
				539	}
				540	}
				541
				542	if (lastOccurence == path.end()) {
				543	return false;
				544	}
				545
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	546	auto iter = std::find(lastOccurence, path.end(), '.');
				547	*outSuffix = StringPiece(iter, path.end() - iter);
				548	*outEntry = StringPiece(lastOccurence + 1, iter - lastOccurence - 1);
				549	*outPrefix = StringPiece(path.begin(), lastOccurence - path.begin() + 1);
Adam Lesinski	1ab598f	2015-08-14 14:26:04 -0700	[diff] [blame]	550	return true;
				551	}
				552
Adam Lesinski	d0f116b	2016-07-08 15:00:32 -0700	[diff] [blame]	553	StringPiece16 getString16(const android::ResStringPool& pool, size_t idx) {
				554	size_t len;
				555	const char16_t* str = pool.stringAt(idx, &len);
				556	if (str != nullptr) {
				557	return StringPiece16(str, len);
				558	}
				559	return StringPiece16();
				560	}
				561
				562	std::string getString(const android::ResStringPool& pool, size_t idx) {
				563	size_t len;
				564	const char* str = pool.string8At(idx, &len);
				565	if (str != nullptr) {
				566	return std::string(str, len);
				567	}
				568	return utf16ToUtf8(getString16(pool, idx));
				569	}
				570
Adam Lesinski	6f6ceb7	2014-11-14 14:48:12 -0800	[diff] [blame]	571	} // namespace util
				572	} // namespace aapt