1 /*
2 * Copyright (C) 2015 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 #ifndef AAPT_UTIL_H
18 #define AAPT_UTIL_H
19
20 #include "util/BigBuffer.h"
21 #include "util/Maybe.h"
22 #include "util/StringPiece.h"
23
24 #include <androidfw/ResourceTypes.h>
25 #include <functional>
26 #include <memory>
27 #include <ostream>
28 #include <string>
29 #include <vector>
30
31 namespace aapt {
32 namespace util {
33
/**
 * Splits `str` into pieces using `sep` as the delimiter and returns the pieces
 * as owned strings.
 * NOTE(review): the implementation is not in this header; how empty pieces
 * (leading/trailing/adjacent separators) are handled should be confirmed there.
 */
34 std::vector<std::string> split(const StringPiece& str, char sep);
/**
 * Like split(), but presumably also lowercases every piece (inferred from the
 * name only; confirm against the implementation).
 */
35 std::vector<std::string> splitAndLowercase(const StringPiece& str, char sep);
36
37 /**
38 * Returns true if the string starts with prefix.
39 */
40 template <typename T>
stringStartsWith(const BasicStringPiece<T> & str,const BasicStringPiece<T> & prefix)41 bool stringStartsWith(const BasicStringPiece<T>& str, const BasicStringPiece<T>& prefix) {
42 if (str.size() < prefix.size()) {
43 return false;
44 }
45 return str.substr(0, prefix.size()) == prefix;
46 }
47
48 /**
49 * Returns true if the string ends with suffix.
50 */
51 template <typename T>
stringEndsWith(const BasicStringPiece<T> & str,const BasicStringPiece<T> & suffix)52 bool stringEndsWith(const BasicStringPiece<T>& str, const BasicStringPiece<T>& suffix) {
53 if (str.size() < suffix.size()) {
54 return false;
55 }
56 return str.substr(str.size() - suffix.size(), suffix.size()) == suffix;
57 }
58
59 /**
60 * Creates a new StringPiece16 that points to a substring
61 * of the original string without leading or trailing whitespace.
62 */
63 StringPiece16 trimWhitespace(const StringPiece16& str);
64
65 StringPiece trimWhitespace(const StringPiece& str);
66
/**
 * isspace() for UTF-16 code units. Only code units below 0x0080 are handed to
 * isspace(); anything at or above that value is reported as non-whitespace
 * without consulting isspace().
 */
inline bool isspace16(char16_t c) {
    if (c >= 0x0080) {
        return false;
    }
    return isspace(c) != 0;
}
74
75 /**
76 * Returns an iterator to the first character that is not alpha-numeric and that
77 * is not in the allowedChars set.
78 */
79 StringPiece16::const_iterator findNonAlphaNumericAndNotInSet(const StringPiece16& str,
80 const StringPiece16& allowedChars);
81
82 /**
83 * Tests that the string is a valid Java class name.
84 */
85 bool isJavaClassName(const StringPiece16& str);
86
87 /**
88 * Tests that the string is a valid Java package name.
89 */
90 bool isJavaPackageName(const StringPiece16& str);
91
92 /**
93 * Converts the class name to a fully qualified class name from the given `package`. Ex:
94 *
95 * asdf --> package.asdf
96 * .asdf --> package.asdf
97 * .a.b --> package.a.b
98 * asdf.adsf --> asdf.adsf
99 */
100 Maybe<std::u16string> getFullyQualifiedClassName(const StringPiece16& package,
101 const StringPiece16& className);
102
103
/**
 * Allocates a T on the heap and hands ownership to a std::unique_ptr<T>.
 * Stand-in for std::make_unique, which arrives in C++14; this can be removed then.
 *
 * Note that the object is brace-initialized (`T{args...}`), so aggregates can be
 * constructed and initializer_list constructors are preferred when they apply.
 */
template <typename T, class... Args>
std::unique_ptr<T> make_unique(Args&&... args) {
    T* const raw = new T{std::forward<Args>(args)...};
    return std::unique_ptr<T>(raw);
}
112
/**
 * Builds a stream manipulator-like function that writes every item in
 * [begin, end) to a std::ostream, placing `sep` between consecutive items.
 *
 * The iterators and the `sep` pointer are captured by value, so the underlying
 * range and separator string must still be alive when the returned function runs.
 * An empty range writes nothing.
 */
template <typename Iterator>
::std::function<::std::ostream&(::std::ostream&)> joiner(Iterator begin, Iterator end,
                                                         const char* sep) {
    return [begin, end, sep](::std::ostream& out) -> ::std::ostream& {
        auto cursor = begin;
        if (cursor == end) {
            return out;
        }

        // The first item is written bare; every later item is preceded by the separator.
        out << *cursor;
        for (++cursor; cursor != end; ++cursor) {
            out << sep;
            out << *cursor;
        }
        return out;
    };
}
130
/**
 * Builds a function that writes `size` (a byte count) to a std::ostream in a
 * human-readable unit: plain bytes below 1024 ("<n>B"), otherwise the value
 * divided by the largest fitting power of 1024 followed by " KiB", " MiB" or
 * " GiB". Scaled values are streamed as doubles using the stream's current
 * floating-point formatting.
 */
inline ::std::function<::std::ostream&(::std::ostream&)> formatSize(size_t size) {
    return [size](::std::ostream& out) -> ::std::ostream& {
        constexpr size_t kKibi = 1024u;
        constexpr size_t kMebi = kKibi * kKibi;
        constexpr size_t kGibi = kMebi * kKibi;

        if (size < kKibi) {
            // Small values stay integral and carry no space before the unit.
            return out << size << "B";
        }

        const double bytes = double(size);
        if (size < kMebi) {
            return out << (bytes / kKibi) << " KiB";
        }
        if (size < kGibi) {
            return out << (bytes / kMebi) << " MiB";
        }
        return out << (bytes / kGibi) << " GiB";
    };
}
148
149 /**
150 * Helper method to extract a string from a StringPool.
151 */
getString(const android::ResStringPool & pool,size_t idx)152 inline StringPiece16 getString(const android::ResStringPool& pool, size_t idx) {
153 size_t len;
154 const char16_t* str = pool.stringAt(idx, &len);
155 if (str != nullptr) {
156 return StringPiece16(str, len);
157 }
158 return StringPiece16();
159 }
160
getString8(const android::ResStringPool & pool,size_t idx)161 inline StringPiece getString8(const android::ResStringPool& pool, size_t idx) {
162 size_t len;
163 const char* str = pool.string8At(idx, &len);
164 if (str != nullptr) {
165 return StringPiece(str, len);
166 }
167 return StringPiece();
168 }
169
170 /**
171 * Checks that the Java string format contains no non-positional arguments (arguments without
172 * explicitly specifying an index) when there are more than one argument. This is an error
173 * because translations may rearrange the order of the arguments in the string, which will
174 * break the string interpolation.
175 */
176 bool verifyJavaStringFormat(const StringPiece16& str);
177
178 class StringBuilder {
179 public:
180 StringBuilder& append(const StringPiece16& str);
181 const std::u16string& str() const;
182 const std::string& error() const;
183 operator bool() const;
184
185 private:
186 std::u16string mStr;
187 bool mQuote = false;
188 bool mTrailingSpace = false;
189 bool mLastCharWasEscape = false;
190 std::string mError;
191 };
192
str()193 inline const std::u16string& StringBuilder::str() const {
194 return mStr;
195 }
196
error()197 inline const std::string& StringBuilder::error() const {
198 return mError;
199 }
200
201 inline StringBuilder::operator bool() const {
202 return mError.empty();
203 }
204
205 /**
206 * Converts a UTF-8 string to UTF-16 (utf8ToUtf16) and a UTF-16 string to UTF-8 (utf16ToUtf8).
207 */
208 std::u16string utf8ToUtf16(const StringPiece& utf8);
209 std::string utf16ToUtf8(const StringPiece16& utf8);
210
211 /**
212 * Writes the entire BigBuffer to the output stream.
213 */
214 bool writeAll(std::ostream& out, const BigBuffer& buffer);
215
216 /**
217 * Copies the entire BigBuffer into a single buffer.
218 */
219 std::unique_ptr<uint8_t[]> copy(const BigBuffer& buffer);
220
221 /**
222 * A Tokenizer implemented as an iterable collection. It does not allocate
223 * any memory on the heap nor use standard containers.
224 */
225 template <typename Char>
226 class Tokenizer {
227 public:
228 class iterator {
229 public:
230 iterator(const iterator&) = default;
231 iterator& operator=(const iterator&) = default;
232
233 iterator& operator++();
234 BasicStringPiece<Char> operator*();
235 bool operator==(const iterator& rhs) const;
236 bool operator!=(const iterator& rhs) const;
237
238 private:
239 friend class Tokenizer<Char>;
240
241 iterator(BasicStringPiece<Char> s, Char sep, BasicStringPiece<Char> tok, bool end);
242
243 BasicStringPiece<Char> mStr;
244 Char mSeparator;
245 BasicStringPiece<Char> mToken;
246 bool mEnd;
247 };
248
249 Tokenizer(BasicStringPiece<Char> str, Char sep);
250 iterator begin();
251 iterator end();
252
253 private:
254 const iterator mBegin;
255 const iterator mEnd;
256 };
257
258 template <typename Char>
tokenize(BasicStringPiece<Char> str,Char sep)259 inline Tokenizer<Char> tokenize(BasicStringPiece<Char> str, Char sep) {
260 return Tokenizer<Char>(str, sep);
261 }
262
263 template <typename Char>
264 typename Tokenizer<Char>::iterator& Tokenizer<Char>::iterator::operator++() {
265 const Char* start = mToken.end();
266 const Char* end = mStr.end();
267 if (start == end) {
268 mEnd = true;
269 mToken.assign(mToken.end(), 0);
270 return *this;
271 }
272
273 start += 1;
274 const Char* current = start;
275 while (current != end) {
276 if (*current == mSeparator) {
277 mToken.assign(start, current - start);
278 return *this;
279 }
280 ++current;
281 }
282 mToken.assign(start, end - start);
283 return *this;
284 }
285
286 template <typename Char>
287 inline BasicStringPiece<Char> Tokenizer<Char>::iterator::operator*() {
288 return mToken;
289 }
290
291 template <typename Char>
292 inline bool Tokenizer<Char>::iterator::operator==(const iterator& rhs) const {
293 // We check equality here a bit differently.
294 // We need to know that the addresses are the same.
295 return mToken.begin() == rhs.mToken.begin() && mToken.end() == rhs.mToken.end() &&
296 mEnd == rhs.mEnd;
297 }
298
299 template <typename Char>
300 inline bool Tokenizer<Char>::iterator::operator!=(const iterator& rhs) const {
301 return !(*this == rhs);
302 }
303
304 template <typename Char>
iterator(BasicStringPiece<Char> s,Char sep,BasicStringPiece<Char> tok,bool end)305 inline Tokenizer<Char>::iterator::iterator(BasicStringPiece<Char> s, Char sep,
306 BasicStringPiece<Char> tok, bool end) :
307 mStr(s), mSeparator(sep), mToken(tok), mEnd(end) {
308 }
309
310 template <typename Char>
begin()311 inline typename Tokenizer<Char>::iterator Tokenizer<Char>::begin() {
312 return mBegin;
313 }
314
315 template <typename Char>
end()316 inline typename Tokenizer<Char>::iterator Tokenizer<Char>::end() {
317 return mEnd;
318 }
319
320 template <typename Char>
Tokenizer(BasicStringPiece<Char> str,Char sep)321 inline Tokenizer<Char>::Tokenizer(BasicStringPiece<Char> str, Char sep) :
322 mBegin(++iterator(str, sep, BasicStringPiece<Char>(str.begin() - 1, 0), false)),
323 mEnd(str, sep, BasicStringPiece<Char>(str.end(), 0), true) {
324 }
325
hostToDevice16(uint16_t value)326 inline uint16_t hostToDevice16(uint16_t value) {
327 return htods(value);
328 }
329
hostToDevice32(uint32_t value)330 inline uint32_t hostToDevice32(uint32_t value) {
331 return htodl(value);
332 }
333
deviceToHost16(uint16_t value)334 inline uint16_t deviceToHost16(uint16_t value) {
335 return dtohs(value);
336 }
337
deviceToHost32(uint32_t value)338 inline uint32_t deviceToHost32(uint32_t value) {
339 return dtohl(value);
340 }
341
342 /**
343 * Given a path like: res/xml-sw600dp/foo.xml
344 *
345 * Extracts "res/xml-sw600dp/" into outPrefix.
346 * Extracts "foo" into outEntry.
347 * Extracts ".xml" into outSuffix.
348 *
349 * Returns true if successful.
350 */
351 bool extractResFilePathParts(const StringPiece16& path, StringPiece16* outPrefix,
352 StringPiece16* outEntry, StringPiece16* outSuffix);
353
354 } // namespace util
355
/**
 * Stream insertion for stream-transforming functions: `out << f` invokes
 * `f(out)` and yields the stream reference that `f` returns. This is what lets
 * the function objects produced by helpers such as util::joiner() and
 * util::formatSize() be chained into an output expression.
 * Declared in the aapt namespace for lookup.
 */
inline ::std::ostream& operator<<(::std::ostream& out,
                                  ::std::function<::std::ostream&(::std::ostream&)> f) {
    ::std::ostream& result = f(out);
    return result;
}
364
365 } // namespace aapt
366
367 #endif // AAPT_UTIL_H
368