1 /*
2 * Copyright (C) 2017 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 #include "dex_file_loader.h"
18
19 #include "android-base/stringprintf.h"
20
21 #include "base/stl_util.h"
22 #include "compact_dex_file.h"
23 #include "dex_file.h"
24 #include "dex_file_verifier.h"
25 #include "standard_dex_file.h"
26 #include "ziparchive/zip_archive.h"
27
28 namespace art {
29
30 namespace {
31
32 class VectorContainer : public DexFileContainer {
33 public:
VectorContainer(std::vector<uint8_t> && vector)34 explicit VectorContainer(std::vector<uint8_t>&& vector) : vector_(std::move(vector)) { }
~VectorContainer()35 ~VectorContainer() override { }
36
GetPermissions()37 int GetPermissions() override {
38 return 0;
39 }
40
IsReadOnly()41 bool IsReadOnly() override {
42 return true;
43 }
44
EnableWrite()45 bool EnableWrite() override {
46 return false;
47 }
48
DisableWrite()49 bool DisableWrite() override {
50 return false;
51 }
52
53 private:
54 std::vector<uint8_t> vector_;
55 DISALLOW_COPY_AND_ASSIGN(VectorContainer);
56 };
57
58 } // namespace
59
60 using android::base::StringPrintf;
61
62 class DexZipArchive;
63
64 class DexZipEntry {
65 public:
66 // Extract this entry to memory.
67 // Returns null on failure and sets error_msg.
Extract(std::string * error_msg)68 const std::vector<uint8_t> Extract(std::string* error_msg) {
69 std::vector<uint8_t> map(GetUncompressedLength());
70 if (map.size() == 0) {
71 DCHECK(!error_msg->empty());
72 return map;
73 }
74 const int32_t error = ExtractToMemory(handle_, zip_entry_, map.data(), map.size());
75 if (error) {
76 *error_msg = std::string(ErrorCodeString(error));
77 }
78 return map;
79 }
80
~DexZipEntry()81 virtual ~DexZipEntry() {
82 delete zip_entry_;
83 }
84
GetUncompressedLength()85 uint32_t GetUncompressedLength() {
86 return zip_entry_->uncompressed_length;
87 }
88
GetCrc32()89 uint32_t GetCrc32() {
90 return zip_entry_->crc32;
91 }
92
93 private:
DexZipEntry(ZipArchiveHandle handle,::ZipEntry * zip_entry,const std::string & entry_name)94 DexZipEntry(ZipArchiveHandle handle,
95 ::ZipEntry* zip_entry,
96 const std::string& entry_name)
97 : handle_(handle), zip_entry_(zip_entry), entry_name_(entry_name) {}
98
99 ZipArchiveHandle handle_;
100 ::ZipEntry* const zip_entry_;
101 std::string const entry_name_;
102
103 friend class DexZipArchive;
104 DISALLOW_COPY_AND_ASSIGN(DexZipEntry);
105 };
106
107 class DexZipArchive {
108 public:
109 // return new DexZipArchive instance on success, null on error.
Open(const uint8_t * base,size_t size,std::string * error_msg)110 static DexZipArchive* Open(const uint8_t* base, size_t size, std::string* error_msg) {
111 ZipArchiveHandle handle;
112 uint8_t* nonconst_base = const_cast<uint8_t*>(base);
113 const int32_t error = OpenArchiveFromMemory(nonconst_base, size, "ZipArchiveMemory", &handle);
114 if (error) {
115 *error_msg = std::string(ErrorCodeString(error));
116 CloseArchive(handle);
117 return nullptr;
118 }
119 return new DexZipArchive(handle);
120 }
121
Find(const char * name,std::string * error_msg) const122 DexZipEntry* Find(const char* name, std::string* error_msg) const {
123 DCHECK(name != nullptr);
124 // Resist the urge to delete the space. <: is a bigraph sequence.
125 std::unique_ptr< ::ZipEntry> zip_entry(new ::ZipEntry);
126 const int32_t error = FindEntry(handle_, name, zip_entry.get());
127 if (error) {
128 *error_msg = std::string(ErrorCodeString(error));
129 return nullptr;
130 }
131 return new DexZipEntry(handle_, zip_entry.release(), name);
132 }
133
~DexZipArchive()134 ~DexZipArchive() {
135 CloseArchive(handle_);
136 }
137
138
139 private:
DexZipArchive(ZipArchiveHandle handle)140 explicit DexZipArchive(ZipArchiveHandle handle) : handle_(handle) {}
141 ZipArchiveHandle handle_;
142
143 friend class DexZipEntry;
144 DISALLOW_COPY_AND_ASSIGN(DexZipArchive);
145 };
146
IsZipMagic(uint32_t magic)147 static bool IsZipMagic(uint32_t magic) {
148 return (('P' == ((magic >> 0) & 0xff)) &&
149 ('K' == ((magic >> 8) & 0xff)));
150 }
151
IsMagicValid(uint32_t magic)152 bool DexFileLoader::IsMagicValid(uint32_t magic) {
153 return IsMagicValid(reinterpret_cast<uint8_t*>(&magic));
154 }
155
IsMagicValid(const uint8_t * magic)156 bool DexFileLoader::IsMagicValid(const uint8_t* magic) {
157 return StandardDexFile::IsMagicValid(magic) ||
158 CompactDexFile::IsMagicValid(magic);
159 }
160
IsVersionAndMagicValid(const uint8_t * magic)161 bool DexFileLoader::IsVersionAndMagicValid(const uint8_t* magic) {
162 if (StandardDexFile::IsMagicValid(magic)) {
163 return StandardDexFile::IsVersionValid(magic);
164 }
165 if (CompactDexFile::IsMagicValid(magic)) {
166 return CompactDexFile::IsVersionValid(magic);
167 }
168 return false;
169 }
170
IsMultiDexLocation(const char * location)171 bool DexFileLoader::IsMultiDexLocation(const char* location) {
172 return strrchr(location, kMultiDexSeparator) != nullptr;
173 }
174
GetMultiDexClassesDexName(size_t index)175 std::string DexFileLoader::GetMultiDexClassesDexName(size_t index) {
176 return (index == 0) ? "classes.dex" : StringPrintf("classes%zu.dex", index + 1);
177 }
178
GetMultiDexLocation(size_t index,const char * dex_location)179 std::string DexFileLoader::GetMultiDexLocation(size_t index, const char* dex_location) {
180 return (index == 0)
181 ? dex_location
182 : StringPrintf("%s%cclasses%zu.dex", dex_location, kMultiDexSeparator, index + 1);
183 }
184
GetDexCanonicalLocation(const char * dex_location)185 std::string DexFileLoader::GetDexCanonicalLocation(const char* dex_location) {
186 CHECK_NE(dex_location, static_cast<const char*>(nullptr));
187 std::string base_location = GetBaseLocation(dex_location);
188 const char* suffix = dex_location + base_location.size();
189 DCHECK(suffix[0] == 0 || suffix[0] == kMultiDexSeparator);
190 #ifdef _WIN32
191 // Warning: No symbolic link processing here.
192 PLOG(WARNING) << "realpath is unsupported on Windows.";
193 #else
194 // Warning: Bionic implementation of realpath() allocates > 12KB on the stack.
195 // Do not run this code on a small stack, e.g. in signal handler.
196 UniqueCPtr<const char[]> path(realpath(base_location.c_str(), nullptr));
197 if (path != nullptr && path.get() != base_location) {
198 return std::string(path.get()) + suffix;
199 }
200 #endif
201 if (suffix[0] == 0) {
202 return base_location;
203 } else {
204 return dex_location;
205 }
206 }
207
208 // All of the implementations here should be independent of the runtime.
209 // TODO: implement all the virtual methods.
210
GetMultiDexChecksums(const char * filename ATTRIBUTE_UNUSED,std::vector<uint32_t> * checksums ATTRIBUTE_UNUSED,std::string * error_msg,int zip_fd ATTRIBUTE_UNUSED,bool * zip_file_only_contains_uncompress_dex ATTRIBUTE_UNUSED) const211 bool DexFileLoader::GetMultiDexChecksums(
212 const char* filename ATTRIBUTE_UNUSED,
213 std::vector<uint32_t>* checksums ATTRIBUTE_UNUSED,
214 std::string* error_msg,
215 int zip_fd ATTRIBUTE_UNUSED,
216 bool* zip_file_only_contains_uncompress_dex ATTRIBUTE_UNUSED) const {
217 *error_msg = "UNIMPLEMENTED";
218 return false;
219 }
220
Open(const uint8_t * base,size_t size,const std::string & location,uint32_t location_checksum,const OatDexFile * oat_dex_file,bool verify,bool verify_checksum,std::string * error_msg,std::unique_ptr<DexFileContainer> container) const221 std::unique_ptr<const DexFile> DexFileLoader::Open(
222 const uint8_t* base,
223 size_t size,
224 const std::string& location,
225 uint32_t location_checksum,
226 const OatDexFile* oat_dex_file,
227 bool verify,
228 bool verify_checksum,
229 std::string* error_msg,
230 std::unique_ptr<DexFileContainer> container) const {
231 return OpenCommon(base,
232 size,
233 /*data_base=*/ nullptr,
234 /*data_size=*/ 0,
235 location,
236 location_checksum,
237 oat_dex_file,
238 verify,
239 verify_checksum,
240 error_msg,
241 std::move(container),
242 /*verify_result=*/ nullptr);
243 }
244
OpenWithDataSection(const uint8_t * base,size_t size,const uint8_t * data_base,size_t data_size,const std::string & location,uint32_t location_checksum,const OatDexFile * oat_dex_file,bool verify,bool verify_checksum,std::string * error_msg) const245 std::unique_ptr<const DexFile> DexFileLoader::OpenWithDataSection(
246 const uint8_t* base,
247 size_t size,
248 const uint8_t* data_base,
249 size_t data_size,
250 const std::string& location,
251 uint32_t location_checksum,
252 const OatDexFile* oat_dex_file,
253 bool verify,
254 bool verify_checksum,
255 std::string* error_msg) const {
256 return OpenCommon(base,
257 size,
258 data_base,
259 data_size,
260 location,
261 location_checksum,
262 oat_dex_file,
263 verify,
264 verify_checksum,
265 error_msg,
266 /*container=*/ nullptr,
267 /*verify_result=*/ nullptr);
268 }
269
OpenAll(const uint8_t * base,size_t size,const std::string & location,bool verify,bool verify_checksum,DexFileLoaderErrorCode * error_code,std::string * error_msg,std::vector<std::unique_ptr<const DexFile>> * dex_files) const270 bool DexFileLoader::OpenAll(
271 const uint8_t* base,
272 size_t size,
273 const std::string& location,
274 bool verify,
275 bool verify_checksum,
276 DexFileLoaderErrorCode* error_code,
277 std::string* error_msg,
278 std::vector<std::unique_ptr<const DexFile>>* dex_files) const {
279 DCHECK(dex_files != nullptr) << "DexFile::Open: out-param is nullptr";
280 uint32_t magic = *reinterpret_cast<const uint32_t*>(base);
281 if (IsZipMagic(magic)) {
282 std::unique_ptr<DexZipArchive> zip_archive(DexZipArchive::Open(base, size, error_msg));
283 if (zip_archive.get() == nullptr) {
284 DCHECK(!error_msg->empty());
285 return false;
286 }
287 return OpenAllDexFilesFromZip(*zip_archive.get(),
288 location,
289 verify,
290 verify_checksum,
291 error_code,
292 error_msg,
293 dex_files);
294 }
295 if (IsMagicValid(magic)) {
296 const DexFile::Header* dex_header = reinterpret_cast<const DexFile::Header*>(base);
297 std::unique_ptr<const DexFile> dex_file(Open(base,
298 size,
299 location,
300 dex_header->checksum_,
301 /*oat_dex_file=*/ nullptr,
302 verify,
303 verify_checksum,
304 error_msg));
305 if (dex_file.get() != nullptr) {
306 dex_files->push_back(std::move(dex_file));
307 return true;
308 } else {
309 return false;
310 }
311 }
312 *error_msg = StringPrintf("Expected valid zip or dex file");
313 return false;
314 }
315
OpenCommon(const uint8_t * base,size_t size,const uint8_t * data_base,size_t data_size,const std::string & location,uint32_t location_checksum,const OatDexFile * oat_dex_file,bool verify,bool verify_checksum,std::string * error_msg,std::unique_ptr<DexFileContainer> container,VerifyResult * verify_result)316 std::unique_ptr<DexFile> DexFileLoader::OpenCommon(const uint8_t* base,
317 size_t size,
318 const uint8_t* data_base,
319 size_t data_size,
320 const std::string& location,
321 uint32_t location_checksum,
322 const OatDexFile* oat_dex_file,
323 bool verify,
324 bool verify_checksum,
325 std::string* error_msg,
326 std::unique_ptr<DexFileContainer> container,
327 VerifyResult* verify_result) {
328 if (verify_result != nullptr) {
329 *verify_result = VerifyResult::kVerifyNotAttempted;
330 }
331 std::unique_ptr<DexFile> dex_file;
332 if (size >= sizeof(StandardDexFile::Header) && StandardDexFile::IsMagicValid(base)) {
333 if (data_size != 0) {
334 CHECK_EQ(base, data_base) << "Unsupported for standard dex";
335 }
336 dex_file.reset(new StandardDexFile(base,
337 size,
338 location,
339 location_checksum,
340 oat_dex_file,
341 std::move(container)));
342 } else if (size >= sizeof(CompactDexFile::Header) && CompactDexFile::IsMagicValid(base)) {
343 if (data_base == nullptr) {
344 // TODO: Is there a clean way to support both an explicit data section and reading the one
345 // from the header.
346 CHECK_EQ(data_size, 0u);
347 const CompactDexFile::Header* const header = CompactDexFile::Header::At(base);
348 data_base = base + header->data_off_;
349 data_size = header->data_size_;
350 }
351 dex_file.reset(new CompactDexFile(base,
352 size,
353 data_base,
354 data_size,
355 location,
356 location_checksum,
357 oat_dex_file,
358 std::move(container)));
359 // Disable verification for CompactDex input.
360 verify = false;
361 } else {
362 *error_msg = "Invalid or truncated dex file";
363 }
364 if (dex_file == nullptr) {
365 *error_msg = StringPrintf("Failed to open dex file '%s' from memory: %s", location.c_str(),
366 error_msg->c_str());
367 return nullptr;
368 }
369 if (!dex_file->Init(error_msg)) {
370 dex_file.reset();
371 return nullptr;
372 }
373 if (verify && !dex::Verify(dex_file.get(),
374 dex_file->Begin(),
375 dex_file->Size(),
376 location.c_str(),
377 verify_checksum,
378 error_msg)) {
379 if (verify_result != nullptr) {
380 *verify_result = VerifyResult::kVerifyFailed;
381 }
382 return nullptr;
383 }
384 if (verify_result != nullptr) {
385 *verify_result = VerifyResult::kVerifySucceeded;
386 }
387 return dex_file;
388 }
389
OpenOneDexFileFromZip(const DexZipArchive & zip_archive,const char * entry_name,const std::string & location,bool verify,bool verify_checksum,DexFileLoaderErrorCode * error_code,std::string * error_msg) const390 std::unique_ptr<const DexFile> DexFileLoader::OpenOneDexFileFromZip(
391 const DexZipArchive& zip_archive,
392 const char* entry_name,
393 const std::string& location,
394 bool verify,
395 bool verify_checksum,
396 DexFileLoaderErrorCode* error_code,
397 std::string* error_msg) const {
398 CHECK(!location.empty());
399 std::unique_ptr<DexZipEntry> zip_entry(zip_archive.Find(entry_name, error_msg));
400 if (zip_entry == nullptr) {
401 *error_code = DexFileLoaderErrorCode::kEntryNotFound;
402 return nullptr;
403 }
404 if (zip_entry->GetUncompressedLength() == 0) {
405 *error_msg = StringPrintf("Dex file '%s' has zero length", location.c_str());
406 *error_code = DexFileLoaderErrorCode::kDexFileError;
407 return nullptr;
408 }
409
410 std::vector<uint8_t> map(zip_entry->Extract(error_msg));
411 if (map.size() == 0) {
412 *error_msg = StringPrintf("Failed to extract '%s' from '%s': %s", entry_name, location.c_str(),
413 error_msg->c_str());
414 *error_code = DexFileLoaderErrorCode::kExtractToMemoryError;
415 return nullptr;
416 }
417 VerifyResult verify_result;
418 auto map_data = map.data();
419 auto map_size = map.size();
420 std::unique_ptr<const DexFile> dex_file = OpenCommon(
421 map_data,
422 map_size,
423 /*data_base=*/ nullptr,
424 /*data_size=*/ 0u,
425 location,
426 zip_entry->GetCrc32(),
427 /*oat_dex_file=*/ nullptr,
428 verify,
429 verify_checksum,
430 error_msg,
431 std::make_unique<VectorContainer>(std::move(map)),
432 &verify_result);
433 if (verify_result != VerifyResult::kVerifySucceeded) {
434 if (verify_result == VerifyResult::kVerifyNotAttempted) {
435 *error_code = DexFileLoaderErrorCode::kDexFileError;
436 } else {
437 *error_code = DexFileLoaderErrorCode::kVerifyError;
438 }
439 return nullptr;
440 }
441 *error_code = DexFileLoaderErrorCode::kNoError;
442 return dex_file;
443 }
444
445 // Technically we do not have a limitation with respect to the number of dex files that can be in a
446 // multidex APK. However, it's bad practice, as each dex file requires its own tables for symbols
447 // (types, classes, methods, ...) and dex caches. So warn the user that we open a zip with what
448 // seems an excessive number.
449 static constexpr size_t kWarnOnManyDexFilesThreshold = 100;
450
OpenAllDexFilesFromZip(const DexZipArchive & zip_archive,const std::string & location,bool verify,bool verify_checksum,DexFileLoaderErrorCode * error_code,std::string * error_msg,std::vector<std::unique_ptr<const DexFile>> * dex_files) const451 bool DexFileLoader::OpenAllDexFilesFromZip(
452 const DexZipArchive& zip_archive,
453 const std::string& location,
454 bool verify,
455 bool verify_checksum,
456 DexFileLoaderErrorCode* error_code,
457 std::string* error_msg,
458 std::vector<std::unique_ptr<const DexFile>>* dex_files) const {
459 DCHECK(dex_files != nullptr) << "DexFile::OpenFromZip: out-param is nullptr";
460 std::unique_ptr<const DexFile> dex_file(OpenOneDexFileFromZip(zip_archive,
461 kClassesDex,
462 location,
463 verify,
464 verify_checksum,
465 error_code,
466 error_msg));
467 if (*error_code != DexFileLoaderErrorCode::kNoError) {
468 return false;
469 } else {
470 // Had at least classes.dex.
471 dex_files->push_back(std::move(dex_file));
472
473 // Now try some more.
474
475 // We could try to avoid std::string allocations by working on a char array directly. As we
476 // do not expect a lot of iterations, this seems too involved and brittle.
477
478 for (size_t i = 1; ; ++i) {
479 std::string name = GetMultiDexClassesDexName(i);
480 std::string fake_location = GetMultiDexLocation(i, location.c_str());
481 std::unique_ptr<const DexFile> next_dex_file(OpenOneDexFileFromZip(zip_archive,
482 name.c_str(),
483 fake_location,
484 verify,
485 verify_checksum,
486 error_code,
487 error_msg));
488 if (next_dex_file.get() == nullptr) {
489 if (*error_code != DexFileLoaderErrorCode::kEntryNotFound) {
490 LOG(WARNING) << "Zip open failed: " << *error_msg;
491 }
492 break;
493 } else {
494 dex_files->push_back(std::move(next_dex_file));
495 }
496
497 if (i == kWarnOnManyDexFilesThreshold) {
498 LOG(WARNING) << location << " has in excess of " << kWarnOnManyDexFilesThreshold
499 << " dex files. Please consider coalescing and shrinking the number to "
500 " avoid runtime overhead.";
501 }
502
503 if (i == std::numeric_limits<size_t>::max()) {
504 LOG(ERROR) << "Overflow in number of dex files!";
505 break;
506 }
507 }
508
509 return true;
510 }
511 }
512 } // namespace art
513