blob: 5f1d280bb4e5fcbd0a4542305939ea2c5bbd0f4a [file] [log] [blame]
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001/*
2 * Copyright (C) 2012 The Android Open Source Project
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * * Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in
12 * the documentation and/or other materials provided with the
13 * distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
18 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
19 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
21 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
22 * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
23 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
25 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 * SUCH DAMAGE.
27 */
28
Elliott Hughes650be4e2013-03-05 18:47:58 -080029#include "linker_phdr.h"
30
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +020031#include <errno.h>
Elliott Hughes05fc1d72015-01-28 18:02:33 -080032#include <string.h>
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +020033#include <sys/mman.h>
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +000034#include <sys/types.h>
35#include <sys/stat.h>
36#include <unistd.h>
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +020037
Elliott Hughes650be4e2013-03-05 18:47:58 -080038#include "linker.h"
Dimitry Ivanov48ec2882016-08-04 11:50:36 -070039#include "linker_globals.h"
Elliott Hughes650be4e2013-03-05 18:47:58 -080040#include "linker_debug.h"
Dmitriy Ivanov3c524812015-11-20 17:28:12 -080041#include "linker_utils.h"
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +020042
Dimitry Ivanov1b84afc2016-01-27 18:12:03 -080043#include "private/bionic_prctl.h"
44
// Returns the ELF e_machine constant (EM_*) that matches the architecture
// this file is being compiled for. VerifyElfHeader() compares it against the
// e_machine field of the file being loaded.
//
// Building for an architecture that is not listed below is a compile-time
// error; previously the function would have had no return statement at all,
// which is undefined behaviour when it is called.
static int GetTargetElfMachine() {
#if defined(__arm__)
  return EM_ARM;
#elif defined(__aarch64__)
  return EM_AARCH64;
#elif defined(__i386__)
  return EM_386;
#elif defined(__mips__)
  return EM_MIPS;
#elif defined(__x86_64__)
  return EM_X86_64;
#else
#error "GetTargetElfMachine: unsupported target architecture"
#endif
}
58
/**
  TECHNICAL NOTE ON ELF LOADING.

  An ELF file's program header table contains one or more PT_LOAD
  segments, which correspond to portions of the file that need to
  be mapped into the process' address space.

  Each loadable segment has the following important properties:

    p_offset  -> segment file offset
    p_filesz  -> segment file size
    p_memsz   -> segment memory size (always >= p_filesz)
    p_vaddr   -> segment's virtual address
    p_flags   -> segment flags (e.g. readable, writable, executable)

  We will ignore the p_paddr and p_align fields of ElfW(Phdr) for now.

  The loadable segments can be seen as a list of [p_vaddr ... p_vaddr+p_memsz)
  ranges of virtual addresses. A few rules apply:

  - the virtual address ranges should not overlap.

  - if a segment's p_filesz is smaller than its p_memsz, the extra bytes
    between them should always be initialized to 0.

  - ranges do not necessarily start or end at page boundaries. Two distinct
    segments can have their start and end on the same page. In this case, the
    page inherits the mapping flags of the latter segment.

  Finally, the real load address of each segment is not p_vaddr. Instead the
  loader decides where to load the first segment, then will load all others
  relative to the first one to respect the initial range layout.

  For example, consider the following list:

    [ offset:0,      filesz:0x4000, memsz:0x4000, vaddr:0x30000 ],
    [ offset:0x4000, filesz:0x2000, memsz:0x8000, vaddr:0x40000 ],

  This corresponds to two segments that cover these virtual address ranges:

       0x30000...0x34000
       0x40000...0x48000

  If the loader decides to load the first segment at address 0xa0000000
  then the segments' load address ranges will be:

       0xa0030000...0xa0034000
       0xa0040000...0xa0048000

  In other words, all segments must be loaded at an address that has the same
  constant offset from their p_vaddr value. This offset is computed as the
  difference between the first segment's load address, and its p_vaddr value.

  However, in practice, segments do _not_ start at page boundaries. Since we
  can only memory-map at page boundaries, this means that the bias is
  computed as:

       load_bias = phdr0_load_address - PAGE_START(phdr0->p_vaddr)

  (NOTE: The value must be used as a 32-bit unsigned integer, to deal with
          possible wrap around UINT32_MAX for possible large p_vaddr values).

  And that the phdr0_load_address must start at a page boundary, with
  the segment's real content starting at:

       phdr0_load_address + PAGE_OFFSET(phdr0->p_vaddr)

  Note that ELF requires the following condition to make the mmap()-ing work:

      PAGE_OFFSET(phdr0->p_vaddr) == PAGE_OFFSET(phdr0->p_offset)

  The load_bias must be added to any p_vaddr value read from the ELF file to
  determine the corresponding memory address.

 **/
134
// MAYBE_MAP_FLAG(value, src_bit, dst_bit): evaluates to `dst_bit` when
// `src_bit` is set in `value`, and to 0 otherwise.
#define MAYBE_MAP_FLAG(value, src_bit, dst_bit) \
    ((((value) & (src_bit)) != 0) ? (dst_bit) : 0)

// PFLAGS_TO_PROT(pflags): translates ELF segment flags (PF_R / PF_W / PF_X)
// into the matching mmap()/mprotect() protection bits (PROT_READ /
// PROT_WRITE / PROT_EXEC).
#define PFLAGS_TO_PROT(pflags) \
    (MAYBE_MAP_FLAG((pflags), PF_R, PROT_READ) | \
     MAYBE_MAP_FLAG((pflags), PF_W, PROT_WRITE) | \
     MAYBE_MAP_FLAG((pflags), PF_X, PROT_EXEC))
139
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700140ElfReader::ElfReader()
141 : did_read_(false), did_load_(false), fd_(-1), file_offset_(0), file_size_(0), phdr_num_(0),
142 phdr_table_(nullptr), shdr_table_(nullptr), shdr_num_(0), dynamic_(nullptr), strtab_(nullptr),
Dimitry Ivanovf45b0e92016-01-15 11:13:35 -0800143 strtab_size_(0), load_start_(nullptr), load_size_(0), load_bias_(0), loaded_phdr_(nullptr),
144 mapped_by_caller_(false) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700145}
146
147bool ElfReader::Read(const char* name, int fd, off64_t file_offset, off64_t file_size) {
148 CHECK(!did_read_);
149 CHECK(!did_load_);
150 name_ = name;
151 fd_ = fd;
152 file_offset_ = file_offset;
153 file_size_ = file_size;
154
155 if (ReadElfHeader() &&
156 VerifyElfHeader() &&
157 ReadProgramHeaders() &&
158 ReadSectionHeaders() &&
159 ReadDynamicSection()) {
160 did_read_ = true;
161 }
162
163 return did_read_;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200164}
165
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000166bool ElfReader::Load(const android_dlextinfo* extinfo) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700167 CHECK(did_read_);
168 CHECK(!did_load_);
169 if (ReserveAddressSpace(extinfo) &&
170 LoadSegments() &&
171 FindPhdr()) {
172 did_load_ = true;
173 }
174
175 return did_load_;
176}
177
178const char* ElfReader::get_string(ElfW(Word) index) const {
179 CHECK(strtab_ != nullptr);
180 CHECK(index < strtab_size_);
181
182 return strtab_ + index;
Elliott Hughes650be4e2013-03-05 18:47:58 -0800183}
184
185bool ElfReader::ReadElfHeader() {
Dmitriy Ivanova6c12792014-10-21 12:09:18 -0700186 ssize_t rc = TEMP_FAILURE_RETRY(pread64(fd_, &header_, sizeof(header_), file_offset_));
Elliott Hughes650be4e2013-03-05 18:47:58 -0800187 if (rc < 0) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700188 DL_ERR("can't read file \"%s\": %s", name_.c_str(), strerror(errno));
Elliott Hughes650be4e2013-03-05 18:47:58 -0800189 return false;
190 }
Dmitriy Ivanova6c12792014-10-21 12:09:18 -0700191
Elliott Hughes650be4e2013-03-05 18:47:58 -0800192 if (rc != sizeof(header_)) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700193 DL_ERR("\"%s\" is too small to be an ELF executable: only found %zd bytes", name_.c_str(),
Elliott Hughesc6200592013-09-30 18:43:46 -0700194 static_cast<size_t>(rc));
Elliott Hughes650be4e2013-03-05 18:47:58 -0800195 return false;
196 }
197 return true;
198}
199
200bool ElfReader::VerifyElfHeader() {
Elliott Hughes625993d2014-07-15 16:53:13 -0700201 if (memcmp(header_.e_ident, ELFMAG, SELFMAG) != 0) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700202 DL_ERR("\"%s\" has bad ELF magic", name_.c_str());
Elliott Hughes650be4e2013-03-05 18:47:58 -0800203 return false;
204 }
205
Elliott Hughesc00f2cb2013-10-04 17:01:33 -0700206 // Try to give a clear diagnostic for ELF class mismatches, since they're
207 // an easy mistake to make during the 32-bit/64-bit transition period.
208 int elf_class = header_.e_ident[EI_CLASS];
209#if defined(__LP64__)
210 if (elf_class != ELFCLASS64) {
211 if (elf_class == ELFCLASS32) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700212 DL_ERR("\"%s\" is 32-bit instead of 64-bit", name_.c_str());
Elliott Hughesc00f2cb2013-10-04 17:01:33 -0700213 } else {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700214 DL_ERR("\"%s\" has unknown ELF class: %d", name_.c_str(), elf_class);
Elliott Hughesc00f2cb2013-10-04 17:01:33 -0700215 }
Elliott Hughes650be4e2013-03-05 18:47:58 -0800216 return false;
217 }
Elliott Hughesc00f2cb2013-10-04 17:01:33 -0700218#else
219 if (elf_class != ELFCLASS32) {
220 if (elf_class == ELFCLASS64) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700221 DL_ERR("\"%s\" is 64-bit instead of 32-bit", name_.c_str());
Elliott Hughesc00f2cb2013-10-04 17:01:33 -0700222 } else {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700223 DL_ERR("\"%s\" has unknown ELF class: %d", name_.c_str(), elf_class);
Elliott Hughesc00f2cb2013-10-04 17:01:33 -0700224 }
225 return false;
226 }
227#endif
228
Elliott Hughes650be4e2013-03-05 18:47:58 -0800229 if (header_.e_ident[EI_DATA] != ELFDATA2LSB) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700230 DL_ERR("\"%s\" not little-endian: %d", name_.c_str(), header_.e_ident[EI_DATA]);
Elliott Hughes650be4e2013-03-05 18:47:58 -0800231 return false;
232 }
233
234 if (header_.e_type != ET_DYN) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700235 DL_ERR("\"%s\" has unexpected e_type: %d", name_.c_str(), header_.e_type);
Elliott Hughes650be4e2013-03-05 18:47:58 -0800236 return false;
237 }
238
239 if (header_.e_version != EV_CURRENT) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700240 DL_ERR("\"%s\" has unexpected e_version: %d", name_.c_str(), header_.e_version);
Elliott Hughes650be4e2013-03-05 18:47:58 -0800241 return false;
242 }
243
Elliott Hughesb5140262014-12-02 16:16:29 -0800244 if (header_.e_machine != GetTargetElfMachine()) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700245 DL_ERR("\"%s\" has unexpected e_machine: %d", name_.c_str(), header_.e_machine);
Elliott Hughes650be4e2013-03-05 18:47:58 -0800246 return false;
247 }
248
Dimitry Ivanovc73eec12016-07-22 12:50:59 -0700249 if (header_.e_shentsize != sizeof(ElfW(Shdr))) {
250 DL_ERR("\"%s\" has unsupported e_shentsize: 0x%x (expected 0x%zx)",
251 name_.c_str(), header_.e_shentsize, sizeof(ElfW(Shdr)));
252 return false;
253 }
254
255 if (header_.e_shstrndx == 0) {
256 DL_ERR("\"%s\" has invalid e_shstrndx", name_.c_str());
257 return false;
258 }
259
Elliott Hughes650be4e2013-03-05 18:47:58 -0800260 return true;
261}
262
Dmitriy Ivanov3c524812015-11-20 17:28:12 -0800263bool ElfReader::CheckFileRange(ElfW(Addr) offset, size_t size) {
264 off64_t range_start;
265 off64_t range_end;
266
Dimitry Ivanov0c9d30f2016-07-13 17:06:36 -0700267 // Only header can be located at the 0 offset... This function called to
268 // check DYNSYM and DYNAMIC sections and phdr/shdr - none of them can be
Dimitry Ivanovebe5af72016-07-14 11:15:44 -0700269 // at offset 0.
Dimitry Ivanov0c9d30f2016-07-13 17:06:36 -0700270
271 return offset > 0 &&
272 safe_add(&range_start, file_offset_, offset) &&
Dmitriy Ivanov3c524812015-11-20 17:28:12 -0800273 safe_add(&range_end, range_start, size) &&
274 range_start < file_size_ &&
275 range_end <= file_size_;
276}
277
Elliott Hughes650be4e2013-03-05 18:47:58 -0800278// Loads the program header table from an ELF file into a read-only private
279// anonymous mmap-ed block.
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700280bool ElfReader::ReadProgramHeaders() {
Elliott Hughes650be4e2013-03-05 18:47:58 -0800281 phdr_num_ = header_.e_phnum;
282
283 // Like the kernel, we only accept program header tables that
284 // are smaller than 64KiB.
Elliott Hughes0266ae52014-02-10 17:46:57 -0800285 if (phdr_num_ < 1 || phdr_num_ > 65536/sizeof(ElfW(Phdr))) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700286 DL_ERR("\"%s\" has invalid e_phnum: %zd", name_.c_str(), phdr_num_);
Elliott Hughes650be4e2013-03-05 18:47:58 -0800287 return false;
288 }
289
Dmitriy Ivanov3c524812015-11-20 17:28:12 -0800290 // Boundary checks
291 size_t size = phdr_num_ * sizeof(ElfW(Phdr));
292 if (!CheckFileRange(header_.e_phoff, size)) {
293 DL_ERR("\"%s\" has invalid phdr offset/size", name_.c_str());
294 return false;
295 }
296
297 if (!phdr_fragment_.Map(fd_, file_offset_, header_.e_phoff, size)) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700298 DL_ERR("\"%s\" phdr mmap failed: %s", name_.c_str(), strerror(errno));
Elliott Hughes650be4e2013-03-05 18:47:58 -0800299 return false;
300 }
301
Dmitriy Ivanovcf1cbbe2015-10-19 16:57:46 -0700302 phdr_table_ = static_cast<ElfW(Phdr)*>(phdr_fragment_.data());
Elliott Hughes650be4e2013-03-05 18:47:58 -0800303 return true;
304}
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200305
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700306bool ElfReader::ReadSectionHeaders() {
307 shdr_num_ = header_.e_shnum;
308
Dmitriy Ivanovb76123f2015-11-20 10:42:02 -0800309 if (shdr_num_ == 0) {
Dmitriy Ivanov3c524812015-11-20 17:28:12 -0800310 DL_ERR("\"%s\" has no section headers", name_.c_str());
Dmitriy Ivanovb76123f2015-11-20 10:42:02 -0800311 return false;
312 }
313
Dmitriy Ivanov3c524812015-11-20 17:28:12 -0800314 size_t size = shdr_num_ * sizeof(ElfW(Shdr));
315 if (!CheckFileRange(header_.e_shoff, size)) {
316 DL_ERR("\"%s\" has invalid shdr offset/size", name_.c_str());
317 return false;
318 }
319
320 if (!shdr_fragment_.Map(fd_, file_offset_, header_.e_shoff, size)) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700321 DL_ERR("\"%s\" shdr mmap failed: %s", name_.c_str(), strerror(errno));
322 return false;
323 }
324
325 shdr_table_ = static_cast<const ElfW(Shdr)*>(shdr_fragment_.data());
326 return true;
327}
328
329bool ElfReader::ReadDynamicSection() {
330 // 1. Find .dynamic section (in section headers)
331 const ElfW(Shdr)* dynamic_shdr = nullptr;
332 for (size_t i = 0; i < shdr_num_; ++i) {
333 if (shdr_table_[i].sh_type == SHT_DYNAMIC) {
334 dynamic_shdr = &shdr_table_ [i];
335 break;
336 }
337 }
338
339 if (dynamic_shdr == nullptr) {
Dmitriy Ivanovb76123f2015-11-20 10:42:02 -0800340 DL_ERR("\"%s\" .dynamic section header was not found", name_.c_str());
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700341 return false;
342 }
343
Dimitry Ivanov0c9d30f2016-07-13 17:06:36 -0700344 // Make sure dynamic_shdr offset and size matches PT_DYNAMIC phdr
345 size_t pt_dynamic_offset = 0;
346 size_t pt_dynamic_filesz = 0;
347 for (size_t i = 0; i < phdr_num_; ++i) {
348 const ElfW(Phdr)* phdr = &phdr_table_[i];
349 if (phdr->p_type == PT_DYNAMIC) {
350 pt_dynamic_offset = phdr->p_offset;
351 pt_dynamic_filesz = phdr->p_filesz;
352 }
353 }
354
355 if (pt_dynamic_offset != dynamic_shdr->sh_offset) {
356 DL_ERR("\"%s\" .dynamic section has invalid offset: 0x%zx, "
357 "expected to match PT_DYNAMIC offset: 0x%zx",
358 name_.c_str(),
359 static_cast<size_t>(dynamic_shdr->sh_offset),
360 pt_dynamic_offset);
361 return false;
362 }
363
364 if (pt_dynamic_filesz != dynamic_shdr->sh_size) {
365 DL_ERR("\"%s\" .dynamic section has invalid size: 0x%zx, "
366 "expected to match PT_DYNAMIC filesz: 0x%zx",
367 name_.c_str(),
368 static_cast<size_t>(dynamic_shdr->sh_size),
369 pt_dynamic_filesz);
370 return false;
371 }
372
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700373 if (dynamic_shdr->sh_link >= shdr_num_) {
374 DL_ERR("\"%s\" .dynamic section has invalid sh_link: %d", name_.c_str(), dynamic_shdr->sh_link);
375 return false;
376 }
377
378 const ElfW(Shdr)* strtab_shdr = &shdr_table_[dynamic_shdr->sh_link];
379
380 if (strtab_shdr->sh_type != SHT_STRTAB) {
381 DL_ERR("\"%s\" .dynamic section has invalid link(%d) sh_type: %d (expected SHT_STRTAB)",
382 name_.c_str(), dynamic_shdr->sh_link, strtab_shdr->sh_type);
383 return false;
384 }
385
Dmitriy Ivanov3c524812015-11-20 17:28:12 -0800386 if (!CheckFileRange(dynamic_shdr->sh_offset, dynamic_shdr->sh_size)) {
387 DL_ERR("\"%s\" has invalid offset/size of .dynamic section", name_.c_str());
388 PRINT("\"%s\" has invalid offset/size of .dynamic section", name_.c_str());
389 return false;
390 }
391
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700392 if (!dynamic_fragment_.Map(fd_, file_offset_, dynamic_shdr->sh_offset, dynamic_shdr->sh_size)) {
393 DL_ERR("\"%s\" dynamic section mmap failed: %s", name_.c_str(), strerror(errno));
394 return false;
395 }
396
397 dynamic_ = static_cast<const ElfW(Dyn)*>(dynamic_fragment_.data());
398
Dmitriy Ivanov3c524812015-11-20 17:28:12 -0800399 if (!CheckFileRange(strtab_shdr->sh_offset, strtab_shdr->sh_size)) {
400 DL_ERR("\"%s\" has invalid offset/size of the .strtab section linked from .dynamic section",
401 name_.c_str());
402 return false;
403 }
404
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700405 if (!strtab_fragment_.Map(fd_, file_offset_, strtab_shdr->sh_offset, strtab_shdr->sh_size)) {
406 DL_ERR("\"%s\" strtab section mmap failed: %s", name_.c_str(), strerror(errno));
407 return false;
408 }
409
410 strtab_ = static_cast<const char*>(strtab_fragment_.data());
411 strtab_size_ = strtab_fragment_.size();
412 return true;
413}
414
Brian Carlstrome7dffe12013-01-10 16:39:58 -0800415/* Returns the size of the extent of all the possibly non-contiguous
416 * loadable segments in an ELF program header table. This corresponds
417 * to the page-aligned size in bytes that needs to be reserved in the
418 * process' address space. If there are no loadable segments, 0 is
419 * returned.
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200420 *
Dmitriy Ivanov851135b2014-08-29 12:02:36 -0700421 * If out_min_vaddr or out_max_vaddr are not null, they will be
Brian Carlstrome7dffe12013-01-10 16:39:58 -0800422 * set to the minimum and maximum addresses of pages to be reserved,
423 * or 0 if there is nothing to load.
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200424 */
Elliott Hughes0266ae52014-02-10 17:46:57 -0800425size_t phdr_table_get_load_size(const ElfW(Phdr)* phdr_table, size_t phdr_count,
426 ElfW(Addr)* out_min_vaddr,
427 ElfW(Addr)* out_max_vaddr) {
428 ElfW(Addr) min_vaddr = UINTPTR_MAX;
429 ElfW(Addr) max_vaddr = 0;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200430
Elliott Hughes0266ae52014-02-10 17:46:57 -0800431 bool found_pt_load = false;
432 for (size_t i = 0; i < phdr_count; ++i) {
433 const ElfW(Phdr)* phdr = &phdr_table[i];
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200434
Elliott Hughes0266ae52014-02-10 17:46:57 -0800435 if (phdr->p_type != PT_LOAD) {
436 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200437 }
Elliott Hughes0266ae52014-02-10 17:46:57 -0800438 found_pt_load = true;
439
440 if (phdr->p_vaddr < min_vaddr) {
441 min_vaddr = phdr->p_vaddr;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200442 }
443
Elliott Hughes0266ae52014-02-10 17:46:57 -0800444 if (phdr->p_vaddr + phdr->p_memsz > max_vaddr) {
445 max_vaddr = phdr->p_vaddr + phdr->p_memsz;
446 }
447 }
448 if (!found_pt_load) {
449 min_vaddr = 0;
450 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200451
Elliott Hughes0266ae52014-02-10 17:46:57 -0800452 min_vaddr = PAGE_START(min_vaddr);
453 max_vaddr = PAGE_END(max_vaddr);
454
Dmitriy Ivanov851135b2014-08-29 12:02:36 -0700455 if (out_min_vaddr != nullptr) {
Elliott Hughes0266ae52014-02-10 17:46:57 -0800456 *out_min_vaddr = min_vaddr;
457 }
Dmitriy Ivanov851135b2014-08-29 12:02:36 -0700458 if (out_max_vaddr != nullptr) {
Elliott Hughes0266ae52014-02-10 17:46:57 -0800459 *out_max_vaddr = max_vaddr;
460 }
461 return max_vaddr - min_vaddr;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200462}
463
Evgenii Stepanovd13e9a62016-07-15 16:31:42 -0700464// Reserve a virtual address range such that if it's limits were extended to the next 2**align
465// boundary, it would not overlap with any existing mappings.
466static void* ReserveAligned(void* hint, size_t size, size_t align) {
467 int mmap_flags = MAP_PRIVATE | MAP_ANONYMOUS;
468 // Address hint is only used in Art for the image mapping, and it is pretty important. Don't mess
469 // with it.
470 // FIXME: try an aligned allocation and fall back to plain mmap() if the former does not provide a
471 // mapping at the requested address?
472 if (align == PAGE_SIZE || hint != nullptr) {
473 void* mmap_ptr = mmap(hint, size, PROT_NONE, mmap_flags, -1, 0);
474 if (mmap_ptr == MAP_FAILED) {
475 return nullptr;
476 }
477 return mmap_ptr;
478 }
479
480 // Allocate enough space so that the end of the desired region aligned up is still inside the
481 // mapping.
482 size_t mmap_size = align_up(size, align) + align - PAGE_SIZE;
483 uint8_t* mmap_ptr =
484 reinterpret_cast<uint8_t*>(mmap(nullptr, mmap_size, PROT_NONE, mmap_flags, -1, 0));
485 if (mmap_ptr == MAP_FAILED) {
486 return nullptr;
487 }
488
489 uint8_t* first = align_up(mmap_ptr, align);
490 uint8_t* last = align_down(mmap_ptr + mmap_size, align) - size;
491 size_t n = arc4random_uniform((last - first) / PAGE_SIZE + 1);
492 uint8_t* start = first + n * PAGE_SIZE;
493 munmap(mmap_ptr, start - mmap_ptr);
494 munmap(start + size, mmap_ptr + mmap_size - (start + size));
495 return start;
496}
497
Elliott Hughes650be4e2013-03-05 18:47:58 -0800498// Reserve a virtual address range big enough to hold all loadable
499// segments of a program header table. This is done by creating a
500// private anonymous mmap() with PROT_NONE.
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000501bool ElfReader::ReserveAddressSpace(const android_dlextinfo* extinfo) {
Elliott Hughes0266ae52014-02-10 17:46:57 -0800502 ElfW(Addr) min_vaddr;
Brian Carlstrome7dffe12013-01-10 16:39:58 -0800503 load_size_ = phdr_table_get_load_size(phdr_table_, phdr_num_, &min_vaddr);
Elliott Hughes650be4e2013-03-05 18:47:58 -0800504 if (load_size_ == 0) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700505 DL_ERR("\"%s\" has no loadable segments", name_.c_str());
Elliott Hughes650be4e2013-03-05 18:47:58 -0800506 return false;
507 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200508
Brian Carlstrome7dffe12013-01-10 16:39:58 -0800509 uint8_t* addr = reinterpret_cast<uint8_t*>(min_vaddr);
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000510 void* start;
511 size_t reserved_size = 0;
512 bool reserved_hint = true;
Dmitriy Ivanov126af752015-10-07 16:34:20 -0700513 bool strict_hint = false;
Dmitriy Ivanov8a116282015-06-05 22:16:23 -0700514 // Assume position independent executable by default.
Dmitriy Ivanov126af752015-10-07 16:34:20 -0700515 void* mmap_hint = nullptr;
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000516
Dmitriy Ivanov851135b2014-08-29 12:02:36 -0700517 if (extinfo != nullptr) {
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000518 if (extinfo->flags & ANDROID_DLEXT_RESERVED_ADDRESS) {
519 reserved_size = extinfo->reserved_size;
520 reserved_hint = false;
521 } else if (extinfo->flags & ANDROID_DLEXT_RESERVED_ADDRESS_HINT) {
522 reserved_size = extinfo->reserved_size;
523 }
Dmitriy Ivanov8a116282015-06-05 22:16:23 -0700524
Dmitriy Ivanov126af752015-10-07 16:34:20 -0700525 if (addr != nullptr && (extinfo->flags & ANDROID_DLEXT_FORCE_FIXED_VADDR) != 0) {
Dmitriy Ivanov8a116282015-06-05 22:16:23 -0700526 mmap_hint = addr;
Dmitriy Ivanov126af752015-10-07 16:34:20 -0700527 } else if ((extinfo->flags & ANDROID_DLEXT_LOAD_AT_FIXED_ADDRESS) != 0) {
528 mmap_hint = extinfo->reserved_addr;
529 strict_hint = true;
Dmitriy Ivanov8a116282015-06-05 22:16:23 -0700530 }
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000531 }
532
533 if (load_size_ > reserved_size) {
534 if (!reserved_hint) {
535 DL_ERR("reserved address space %zd smaller than %zd bytes needed for \"%s\"",
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700536 reserved_size - load_size_, load_size_, name_.c_str());
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000537 return false;
538 }
Evgenii Stepanovd13e9a62016-07-15 16:31:42 -0700539 start = ReserveAligned(mmap_hint, load_size_, kLibraryAlignment);
540 if (start == nullptr) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700541 DL_ERR("couldn't reserve %zd bytes of address space for \"%s\"", load_size_, name_.c_str());
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000542 return false;
543 }
Dmitriy Ivanov126af752015-10-07 16:34:20 -0700544 if (strict_hint && (start != mmap_hint)) {
545 munmap(start, load_size_);
546 DL_ERR("couldn't reserve %zd bytes of address space at %p for \"%s\"",
547 load_size_, mmap_hint, name_.c_str());
548 return false;
549 }
Torne (Richard Coles)12bbb912014-02-06 14:34:21 +0000550 } else {
551 start = extinfo->reserved_addr;
Dimitry Ivanovf45b0e92016-01-15 11:13:35 -0800552 mapped_by_caller_ = true;
Elliott Hughes650be4e2013-03-05 18:47:58 -0800553 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200554
Elliott Hughes650be4e2013-03-05 18:47:58 -0800555 load_start_ = start;
Brian Carlstrome7dffe12013-01-10 16:39:58 -0800556 load_bias_ = reinterpret_cast<uint8_t*>(start) - addr;
Elliott Hughes650be4e2013-03-05 18:47:58 -0800557 return true;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200558}
559
Elliott Hughes650be4e2013-03-05 18:47:58 -0800560bool ElfReader::LoadSegments() {
561 for (size_t i = 0; i < phdr_num_; ++i) {
Elliott Hughes0266ae52014-02-10 17:46:57 -0800562 const ElfW(Phdr)* phdr = &phdr_table_[i];
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200563
Elliott Hughes650be4e2013-03-05 18:47:58 -0800564 if (phdr->p_type != PT_LOAD) {
565 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200566 }
Elliott Hughes650be4e2013-03-05 18:47:58 -0800567
568 // Segment addresses in memory.
Elliott Hughes0266ae52014-02-10 17:46:57 -0800569 ElfW(Addr) seg_start = phdr->p_vaddr + load_bias_;
570 ElfW(Addr) seg_end = seg_start + phdr->p_memsz;
Elliott Hughes650be4e2013-03-05 18:47:58 -0800571
Elliott Hughes0266ae52014-02-10 17:46:57 -0800572 ElfW(Addr) seg_page_start = PAGE_START(seg_start);
573 ElfW(Addr) seg_page_end = PAGE_END(seg_end);
Elliott Hughes650be4e2013-03-05 18:47:58 -0800574
Elliott Hughes0266ae52014-02-10 17:46:57 -0800575 ElfW(Addr) seg_file_end = seg_start + phdr->p_filesz;
Elliott Hughes650be4e2013-03-05 18:47:58 -0800576
577 // File offsets.
Elliott Hughes0266ae52014-02-10 17:46:57 -0800578 ElfW(Addr) file_start = phdr->p_offset;
579 ElfW(Addr) file_end = file_start + phdr->p_filesz;
Elliott Hughes650be4e2013-03-05 18:47:58 -0800580
Elliott Hughes0266ae52014-02-10 17:46:57 -0800581 ElfW(Addr) file_page_start = PAGE_START(file_start);
582 ElfW(Addr) file_length = file_end - file_page_start;
Elliott Hughes650be4e2013-03-05 18:47:58 -0800583
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -0700584 if (file_size_ <= 0) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700585 DL_ERR("\"%s\" invalid file size: %" PRId64, name_.c_str(), file_size_);
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -0700586 return false;
587 }
588
skvalex93ce3542015-08-20 01:06:42 +0300589 if (file_end > static_cast<size_t>(file_size_)) {
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -0700590 DL_ERR("invalid ELF file \"%s\" load segment[%zd]:"
591 " p_offset (%p) + p_filesz (%p) ( = %p) past end of file (0x%" PRIx64 ")",
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700592 name_.c_str(), i, reinterpret_cast<void*>(phdr->p_offset),
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -0700593 reinterpret_cast<void*>(phdr->p_filesz),
594 reinterpret_cast<void*>(file_end), file_size_);
595 return false;
596 }
597
Brian Carlstrom82dcc792013-05-21 16:49:24 -0700598 if (file_length != 0) {
Dmitriy Ivanov07e5bc12014-10-03 17:52:44 -0700599 void* seg_addr = mmap64(reinterpret_cast<void*>(seg_page_start),
Brian Carlstrom82dcc792013-05-21 16:49:24 -0700600 file_length,
601 PFLAGS_TO_PROT(phdr->p_flags),
602 MAP_FIXED|MAP_PRIVATE,
603 fd_,
Dmitriy Ivanov07e5bc12014-10-03 17:52:44 -0700604 file_offset_ + file_page_start);
Brian Carlstrom82dcc792013-05-21 16:49:24 -0700605 if (seg_addr == MAP_FAILED) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700606 DL_ERR("couldn't map \"%s\" segment %zd: %s", name_.c_str(), i, strerror(errno));
Brian Carlstrom82dcc792013-05-21 16:49:24 -0700607 return false;
608 }
Elliott Hughes650be4e2013-03-05 18:47:58 -0800609 }
610
611 // if the segment is writable, and does not end on a page boundary,
612 // zero-fill it until the page limit.
613 if ((phdr->p_flags & PF_W) != 0 && PAGE_OFFSET(seg_file_end) > 0) {
Elliott Hughesfaf05ba2014-02-11 16:59:37 -0800614 memset(reinterpret_cast<void*>(seg_file_end), 0, PAGE_SIZE - PAGE_OFFSET(seg_file_end));
Elliott Hughes650be4e2013-03-05 18:47:58 -0800615 }
616
617 seg_file_end = PAGE_END(seg_file_end);
618
619 // seg_file_end is now the first page address after the file
620 // content. If seg_end is larger, we need to zero anything
621 // between them. This is done by using a private anonymous
622 // map for all extra pages.
623 if (seg_page_end > seg_file_end) {
Dimitry Ivanov1b84afc2016-01-27 18:12:03 -0800624 size_t zeromap_size = seg_page_end - seg_file_end;
Elliott Hughesfaf05ba2014-02-11 16:59:37 -0800625 void* zeromap = mmap(reinterpret_cast<void*>(seg_file_end),
Dimitry Ivanov1b84afc2016-01-27 18:12:03 -0800626 zeromap_size,
Elliott Hughes650be4e2013-03-05 18:47:58 -0800627 PFLAGS_TO_PROT(phdr->p_flags),
628 MAP_FIXED|MAP_ANONYMOUS|MAP_PRIVATE,
629 -1,
630 0);
631 if (zeromap == MAP_FAILED) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -0700632 DL_ERR("couldn't zero fill \"%s\" gap: %s", name_.c_str(), strerror(errno));
Elliott Hughes650be4e2013-03-05 18:47:58 -0800633 return false;
634 }
Dimitry Ivanov1b84afc2016-01-27 18:12:03 -0800635
636 prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, zeromap, zeromap_size, ".bss");
Elliott Hughes650be4e2013-03-05 18:47:58 -0800637 }
638 }
639 return true;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200640}
641
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +0000642/* Used internally. Used to set the protection bits of all loaded segments
643 * with optional extra flags (i.e. really PROT_WRITE). Used by
644 * phdr_table_protect_segments and phdr_table_unprotect_segments.
645 */
646static int _phdr_table_set_load_prot(const ElfW(Phdr)* phdr_table, size_t phdr_count,
647 ElfW(Addr) load_bias, int extra_prot_flags) {
648 const ElfW(Phdr)* phdr = phdr_table;
649 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
650
651 for (; phdr < phdr_limit; phdr++) {
652 if (phdr->p_type != PT_LOAD || (phdr->p_flags & PF_W) != 0) {
653 continue;
654 }
655
656 ElfW(Addr) seg_page_start = PAGE_START(phdr->p_vaddr) + load_bias;
657 ElfW(Addr) seg_page_end = PAGE_END(phdr->p_vaddr + phdr->p_memsz) + load_bias;
658
Nick Kralevich8fdb3412015-04-01 16:57:50 -0700659 int prot = PFLAGS_TO_PROT(phdr->p_flags);
660 if ((extra_prot_flags & PROT_WRITE) != 0) {
661 // make sure we're never simultaneously writable / executable
662 prot &= ~PROT_EXEC;
663 }
664
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +0000665 int ret = mprotect(reinterpret_cast<void*>(seg_page_start),
666 seg_page_end - seg_page_start,
Nick Kralevich8fdb3412015-04-01 16:57:50 -0700667 prot | extra_prot_flags);
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +0000668 if (ret < 0) {
669 return -1;
670 }
671 }
672 return 0;
673}
674
675/* Restore the original protection modes for all loadable segments.
676 * You should only call this after phdr_table_unprotect_segments and
677 * applying all relocations.
678 *
679 * Input:
680 * phdr_table -> program header table
681 * phdr_count -> number of entries in tables
682 * load_bias -> load bias
683 * Return:
684 * 0 on error, -1 on failure (error code in errno).
685 */
686int phdr_table_protect_segments(const ElfW(Phdr)* phdr_table,
687 size_t phdr_count, ElfW(Addr) load_bias) {
688 return _phdr_table_set_load_prot(phdr_table, phdr_count, load_bias, 0);
689}
690
691/* Change the protection of all loaded segments in memory to writable.
692 * This is useful before performing relocations. Once completed, you
693 * will have to call phdr_table_protect_segments to restore the original
694 * protection flags on all segments.
695 *
696 * Note that some writable segments can also have their content turned
697 * to read-only by calling phdr_table_protect_gnu_relro. This is no
698 * performed here.
699 *
700 * Input:
701 * phdr_table -> program header table
702 * phdr_count -> number of entries in tables
703 * load_bias -> load bias
704 * Return:
705 * 0 on error, -1 on failure (error code in errno).
706 */
707int phdr_table_unprotect_segments(const ElfW(Phdr)* phdr_table,
708 size_t phdr_count, ElfW(Addr) load_bias) {
709 return _phdr_table_set_load_prot(phdr_table, phdr_count, load_bias, PROT_WRITE);
710}
711
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200712/* Used internally by phdr_table_protect_gnu_relro and
713 * phdr_table_unprotect_gnu_relro.
714 */
Elliott Hughes0266ae52014-02-10 17:46:57 -0800715static int _phdr_table_set_gnu_relro_prot(const ElfW(Phdr)* phdr_table, size_t phdr_count,
716 ElfW(Addr) load_bias, int prot_flags) {
717 const ElfW(Phdr)* phdr = phdr_table;
718 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200719
Elliott Hughes0266ae52014-02-10 17:46:57 -0800720 for (phdr = phdr_table; phdr < phdr_limit; phdr++) {
721 if (phdr->p_type != PT_GNU_RELRO) {
722 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200723 }
Elliott Hughes0266ae52014-02-10 17:46:57 -0800724
725 // Tricky: what happens when the relro segment does not start
726 // or end at page boundaries? We're going to be over-protective
727 // here and put every page touched by the segment as read-only.
728
729 // This seems to match Ian Lance Taylor's description of the
730 // feature at http://www.airs.com/blog/archives/189.
731
732 // Extract:
733 // Note that the current dynamic linker code will only work
734 // correctly if the PT_GNU_RELRO segment starts on a page
735 // boundary. This is because the dynamic linker rounds the
736 // p_vaddr field down to the previous page boundary. If
737 // there is anything on the page which should not be read-only,
738 // the program is likely to fail at runtime. So in effect the
739 // linker must only emit a PT_GNU_RELRO segment if it ensures
740 // that it starts on a page boundary.
741 ElfW(Addr) seg_page_start = PAGE_START(phdr->p_vaddr) + load_bias;
742 ElfW(Addr) seg_page_end = PAGE_END(phdr->p_vaddr + phdr->p_memsz) + load_bias;
743
Elliott Hughesfaf05ba2014-02-11 16:59:37 -0800744 int ret = mprotect(reinterpret_cast<void*>(seg_page_start),
Elliott Hughes0266ae52014-02-10 17:46:57 -0800745 seg_page_end - seg_page_start,
746 prot_flags);
747 if (ret < 0) {
748 return -1;
749 }
750 }
751 return 0;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200752}
753
754/* Apply GNU relro protection if specified by the program header. This will
755 * turn some of the pages of a writable PT_LOAD segment to read-only, as
756 * specified by one or more PT_GNU_RELRO segments. This must be always
757 * performed after relocations.
758 *
Ard Biesheuvel12c78bb2012-08-14 12:30:09 +0200759 * The areas typically covered are .got and .data.rel.ro, these are
760 * read-only from the program's POV, but contain absolute addresses
761 * that need to be relocated before use.
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200762 *
763 * Input:
764 * phdr_table -> program header table
Elliott Hughes105bc262012-08-15 16:56:00 -0700765 * phdr_count -> number of entries in tables
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200766 * load_bias -> load bias
767 * Return:
768 * 0 on error, -1 on failure (error code in errno).
769 */
Dmitriy Ivanov20d89cb2015-03-30 18:43:38 -0700770int phdr_table_protect_gnu_relro(const ElfW(Phdr)* phdr_table,
771 size_t phdr_count, ElfW(Addr) load_bias) {
Elliott Hughes0266ae52014-02-10 17:46:57 -0800772 return _phdr_table_set_gnu_relro_prot(phdr_table, phdr_count, load_bias, PROT_READ);
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200773}
774
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +0000775/* Serialize the GNU relro segments to the given file descriptor. This can be
776 * performed after relocations to allow another process to later share the
777 * relocated segment, if it was loaded at the same address.
778 *
779 * Input:
780 * phdr_table -> program header table
781 * phdr_count -> number of entries in tables
782 * load_bias -> load bias
783 * fd -> writable file descriptor to use
784 * Return:
785 * 0 on error, -1 on failure (error code in errno).
786 */
Dmitriy Ivanov20d89cb2015-03-30 18:43:38 -0700787int phdr_table_serialize_gnu_relro(const ElfW(Phdr)* phdr_table,
788 size_t phdr_count,
789 ElfW(Addr) load_bias,
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +0000790 int fd) {
791 const ElfW(Phdr)* phdr = phdr_table;
792 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
793 ssize_t file_offset = 0;
794
795 for (phdr = phdr_table; phdr < phdr_limit; phdr++) {
796 if (phdr->p_type != PT_GNU_RELRO) {
797 continue;
798 }
799
800 ElfW(Addr) seg_page_start = PAGE_START(phdr->p_vaddr) + load_bias;
801 ElfW(Addr) seg_page_end = PAGE_END(phdr->p_vaddr + phdr->p_memsz) + load_bias;
802 ssize_t size = seg_page_end - seg_page_start;
803
804 ssize_t written = TEMP_FAILURE_RETRY(write(fd, reinterpret_cast<void*>(seg_page_start), size));
805 if (written != size) {
806 return -1;
807 }
808 void* map = mmap(reinterpret_cast<void*>(seg_page_start), size, PROT_READ,
809 MAP_PRIVATE|MAP_FIXED, fd, file_offset);
810 if (map == MAP_FAILED) {
811 return -1;
812 }
813 file_offset += size;
814 }
815 return 0;
816}
817
818/* Where possible, replace the GNU relro segments with mappings of the given
819 * file descriptor. This can be performed after relocations to allow a file
820 * previously created by phdr_table_serialize_gnu_relro in another process to
821 * replace the dirty relocated pages, saving memory, if it was loaded at the
822 * same address. We have to compare the data before we map over it, since some
823 * parts of the relro segment may not be identical due to other libraries in
824 * the process being loaded at different addresses.
825 *
826 * Input:
827 * phdr_table -> program header table
828 * phdr_count -> number of entries in tables
829 * load_bias -> load bias
830 * fd -> readable file descriptor to use
831 * Return:
832 * 0 on error, -1 on failure (error code in errno).
833 */
Dmitriy Ivanov20d89cb2015-03-30 18:43:38 -0700834int phdr_table_map_gnu_relro(const ElfW(Phdr)* phdr_table,
835 size_t phdr_count,
836 ElfW(Addr) load_bias,
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +0000837 int fd) {
838 // Map the file at a temporary location so we can compare its contents.
839 struct stat file_stat;
840 if (TEMP_FAILURE_RETRY(fstat(fd, &file_stat)) != 0) {
841 return -1;
842 }
843 off_t file_size = file_stat.st_size;
Dmitriy Ivanov851135b2014-08-29 12:02:36 -0700844 void* temp_mapping = nullptr;
Torne (Richard Coles)26ec9672014-04-30 15:48:40 +0100845 if (file_size > 0) {
Dmitriy Ivanov851135b2014-08-29 12:02:36 -0700846 temp_mapping = mmap(nullptr, file_size, PROT_READ, MAP_PRIVATE, fd, 0);
Torne (Richard Coles)26ec9672014-04-30 15:48:40 +0100847 if (temp_mapping == MAP_FAILED) {
848 return -1;
849 }
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +0000850 }
851 size_t file_offset = 0;
852
853 // Iterate over the relro segments and compare/remap the pages.
854 const ElfW(Phdr)* phdr = phdr_table;
855 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
856
857 for (phdr = phdr_table; phdr < phdr_limit; phdr++) {
858 if (phdr->p_type != PT_GNU_RELRO) {
859 continue;
860 }
861
862 ElfW(Addr) seg_page_start = PAGE_START(phdr->p_vaddr) + load_bias;
863 ElfW(Addr) seg_page_end = PAGE_END(phdr->p_vaddr + phdr->p_memsz) + load_bias;
864
865 char* file_base = static_cast<char*>(temp_mapping) + file_offset;
866 char* mem_base = reinterpret_cast<char*>(seg_page_start);
867 size_t match_offset = 0;
868 size_t size = seg_page_end - seg_page_start;
869
Torne (Richard Coles)26ec9672014-04-30 15:48:40 +0100870 if (file_size - file_offset < size) {
871 // File is too short to compare to this segment. The contents are likely
872 // different as well (it's probably for a different library version) so
873 // just don't bother checking.
874 break;
875 }
876
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +0000877 while (match_offset < size) {
878 // Skip over dissimilar pages.
879 while (match_offset < size &&
880 memcmp(mem_base + match_offset, file_base + match_offset, PAGE_SIZE) != 0) {
881 match_offset += PAGE_SIZE;
882 }
883
884 // Count similar pages.
885 size_t mismatch_offset = match_offset;
886 while (mismatch_offset < size &&
887 memcmp(mem_base + mismatch_offset, file_base + mismatch_offset, PAGE_SIZE) == 0) {
888 mismatch_offset += PAGE_SIZE;
889 }
890
891 // Map over similar pages.
892 if (mismatch_offset > match_offset) {
893 void* map = mmap(mem_base + match_offset, mismatch_offset - match_offset,
894 PROT_READ, MAP_PRIVATE|MAP_FIXED, fd, match_offset);
895 if (map == MAP_FAILED) {
896 munmap(temp_mapping, file_size);
897 return -1;
898 }
899 }
900
901 match_offset = mismatch_offset;
902 }
903
904 // Add to the base file offset in case there are multiple relro segments.
905 file_offset += size;
906 }
907 munmap(temp_mapping, file_size);
908 return 0;
909}
910
911
#if defined(__arm__)

#  ifndef PT_ARM_EXIDX
#    define PT_ARM_EXIDX    0x70000001      /* .ARM.exidx segment */
#  endif

/* Look up the .ARM.exidx section in memory and report its address and
 * entry count, if the program header table has a PT_ARM_EXIDX entry.
 *
 * Input:
 *   phdr_table  -> program header table
 *   phdr_count  -> number of entries in tables
 *   load_bias   -> load bias
 * Output:
 *   arm_exidx       -> address of table in memory (null on failure).
 *   arm_exidx_count -> number of items in table (0 on failure); computed as
 *                      the segment's p_memsz divided by 8.
 * Return:
 *   0 on success, -1 on failure (_no_ error code in errno)
 */
int phdr_table_get_arm_exidx(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                             ElfW(Addr) load_bias,
                             ElfW(Addr)** arm_exidx, size_t* arm_exidx_count) {
  for (size_t i = 0; i < phdr_count; ++i) {
    const ElfW(Phdr)& entry = phdr_table[i];
    if (entry.p_type == PT_ARM_EXIDX) {
      // The first matching entry wins.
      *arm_exidx = reinterpret_cast<ElfW(Addr)*>(load_bias + entry.p_vaddr);
      *arm_exidx_count = entry.p_memsz / 8;
      return 0;
    }
  }

  // No PT_ARM_EXIDX entry in the table.
  *arm_exidx = nullptr;
  *arm_exidx_count = 0;
  return -1;
}
#endif
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +0200951
/* Find the ELF file's .dynamic section in memory and report its address and
 * flags. The address is null if there is no PT_DYNAMIC entry.
 *
 * Input:
 *   phdr_table  -> program header table
 *   phdr_count  -> number of entries in tables
 *   load_bias   -> load bias
 * Output:
 *   dynamic       -> address of table in memory (null on failure).
 *   dynamic_flags -> protection flags for section (unset on failure);
 *                    may be null, in which case the flags are not reported.
 * Return:
 *   void
 */
void phdr_table_get_dynamic_section(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                                    ElfW(Addr) load_bias, ElfW(Dyn)** dynamic,
                                    ElfW(Word)* dynamic_flags) {
  *dynamic = nullptr;

  const ElfW(Phdr)* const table_end = phdr_table + phdr_count;
  for (const ElfW(Phdr)* entry = phdr_table; entry != table_end; ++entry) {
    if (entry->p_type != PT_DYNAMIC) {
      continue;
    }

    // The first PT_DYNAMIC entry is the one reported.
    *dynamic = reinterpret_cast<ElfW(Dyn)*>(load_bias + entry->p_vaddr);
    if (dynamic_flags != nullptr) {
      *dynamic_flags = entry->p_flags;
    }
    return;
  }
}
980
/* Return the program interpreter string, or nullptr if the program header
 * table has no PT_INTERP entry.
 *
 * Input:
 *   phdr_table  -> program header table
 *   phdr_count  -> number of entries in tables
 *   load_bias   -> load bias
 * Return:
 *   pointer to the program interpreter string (load_bias plus the p_vaddr
 *   of the first PT_INTERP entry), or nullptr.
 */
const char* phdr_table_get_interpreter_name(const ElfW(Phdr) * phdr_table, size_t phdr_count,
                                            ElfW(Addr) load_bias) {
  const ElfW(Phdr)* const table_end = phdr_table + phdr_count;
  for (const ElfW(Phdr)* entry = phdr_table; entry != table_end; ++entry) {
    if (entry->p_type != PT_INTERP) {
      continue;
    }
    return reinterpret_cast<const char*>(load_bias + entry->p_vaddr);
  }
  return nullptr;
}
1000
Robert Grosse4544d9f2014-10-15 14:32:19 -07001001// Sets loaded_phdr_ to the address of the program header table as it appears
1002// in the loaded segments in memory. This is in contrast with phdr_table_,
1003// which is temporary and will be released before the library is relocated.
Elliott Hughes650be4e2013-03-05 18:47:58 -08001004bool ElfReader::FindPhdr() {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001005 const ElfW(Phdr)* phdr_limit = phdr_table_ + phdr_num_;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001006
Elliott Hughes650be4e2013-03-05 18:47:58 -08001007 // If there is a PT_PHDR, use it directly.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001008 for (const ElfW(Phdr)* phdr = phdr_table_; phdr < phdr_limit; ++phdr) {
Elliott Hughes650be4e2013-03-05 18:47:58 -08001009 if (phdr->p_type == PT_PHDR) {
1010 return CheckPhdr(load_bias_ + phdr->p_vaddr);
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001011 }
Elliott Hughes650be4e2013-03-05 18:47:58 -08001012 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001013
Elliott Hughes650be4e2013-03-05 18:47:58 -08001014 // Otherwise, check the first loadable segment. If its file offset
1015 // is 0, it starts with the ELF header, and we can trivially find the
1016 // loaded program header from it.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001017 for (const ElfW(Phdr)* phdr = phdr_table_; phdr < phdr_limit; ++phdr) {
Elliott Hughes650be4e2013-03-05 18:47:58 -08001018 if (phdr->p_type == PT_LOAD) {
1019 if (phdr->p_offset == 0) {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001020 ElfW(Addr) elf_addr = load_bias_ + phdr->p_vaddr;
Elliott Hughesfaf05ba2014-02-11 16:59:37 -08001021 const ElfW(Ehdr)* ehdr = reinterpret_cast<const ElfW(Ehdr)*>(elf_addr);
Elliott Hughes0266ae52014-02-10 17:46:57 -08001022 ElfW(Addr) offset = ehdr->e_phoff;
Dmitriy Ivanov1649e7e2015-01-22 16:04:25 -08001023 return CheckPhdr(reinterpret_cast<ElfW(Addr)>(ehdr) + offset);
Elliott Hughes650be4e2013-03-05 18:47:58 -08001024 }
1025 break;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001026 }
Elliott Hughes650be4e2013-03-05 18:47:58 -08001027 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001028
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -07001029 DL_ERR("can't find loaded phdr for \"%s\"", name_.c_str());
Elliott Hughes650be4e2013-03-05 18:47:58 -08001030 return false;
1031}
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001032
Elliott Hughes650be4e2013-03-05 18:47:58 -08001033// Ensures that our program header is actually within a loadable
1034// segment. This should help catch badly-formed ELF files that
1035// would cause the linker to crash later when trying to access it.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001036bool ElfReader::CheckPhdr(ElfW(Addr) loaded) {
1037 const ElfW(Phdr)* phdr_limit = phdr_table_ + phdr_num_;
1038 ElfW(Addr) loaded_end = loaded + (phdr_num_ * sizeof(ElfW(Phdr)));
Dmitriy Ivanovcf1cbbe2015-10-19 16:57:46 -07001039 for (const ElfW(Phdr)* phdr = phdr_table_; phdr < phdr_limit; ++phdr) {
Elliott Hughes650be4e2013-03-05 18:47:58 -08001040 if (phdr->p_type != PT_LOAD) {
1041 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001042 }
Elliott Hughes0266ae52014-02-10 17:46:57 -08001043 ElfW(Addr) seg_start = phdr->p_vaddr + load_bias_;
1044 ElfW(Addr) seg_end = phdr->p_filesz + seg_start;
Elliott Hughes650be4e2013-03-05 18:47:58 -08001045 if (seg_start <= loaded && loaded_end <= seg_end) {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001046 loaded_phdr_ = reinterpret_cast<const ElfW(Phdr)*>(loaded);
Elliott Hughes650be4e2013-03-05 18:47:58 -08001047 return true;
1048 }
1049 }
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -07001050 DL_ERR("\"%s\" loaded phdr %p not in loadable segment",
1051 name_.c_str(), reinterpret_cast<void*>(loaded));
Elliott Hughes650be4e2013-03-05 18:47:58 -08001052 return false;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001053}