/*
 * Copyright (C) 2012 The Android Open Source Project
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *  * Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 *  * Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in
 *    the documentation and/or other materials provided with the
 *    distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
 * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include "linker_phdr.h"

#include <errno.h>
#include <string.h>
#include <sys/mman.h>
#include <sys/prctl.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <unistd.h>

#include "linker.h"
#include "linker_debug.h"
#include "linker_dlwarning.h"
#include "linker_globals.h"
#include "linker_logger.h"
#include "linker_main.h"
#include "linker_soinfo.h"
#include "linker_utils.h"

#include "private/bionic_asm_note.h"
#include "private/CFIShadow.h" // For kLibraryAlignment
#include "private/elf_note.h"

#include <android-base/file.h>
#include <android-base/properties.h>

static int GetTargetElfMachine() {
#if defined(__arm__)
  return EM_ARM;
#elif defined(__aarch64__)
  return EM_AARCH64;
#elif defined(__i386__)
  return EM_386;
#elif defined(__riscv)
  return EM_RISCV;
#elif defined(__x86_64__)
  return EM_X86_64;
#endif
}

/**
  TECHNICAL NOTE ON ELF LOADING.

  An ELF file's program header table contains one or more PT_LOAD
  segments, which correspond to the portions of the file that need to
  be mapped into the process' address space.

  Each loadable segment has the following important properties:

    p_offset  -> segment file offset
    p_filesz  -> segment file size
    p_memsz   -> segment memory size (always >= p_filesz)
    p_vaddr   -> segment's virtual address
    p_flags   -> segment flags (e.g. readable, writable, executable)
    p_align   -> segment's in-memory and in-file alignment

  We will ignore the p_paddr field of ElfW(Phdr) for now.

  The loadable segments can be seen as a list of [p_vaddr ... p_vaddr+p_memsz)
  ranges of virtual addresses. A few rules apply:

  - the virtual address ranges should not overlap.

  - if a segment's p_filesz is smaller than its p_memsz, the extra bytes
    between them should always be initialized to 0.

  - ranges do not necessarily start or end at page boundaries. Two distinct
    segments can have their start and end on the same page. In this case, the
    page inherits the mapping flags of the latter segment.

  Finally, the real load address of each segment is not p_vaddr. Instead the
  loader decides where to load the first segment, then loads all others
  relative to the first one to respect the initial range layout.

  For example, consider the following list:

    [ offset:0,      filesz:0x4000, memsz:0x4000, vaddr:0x30000 ],
    [ offset:0x4000, filesz:0x2000, memsz:0x8000, vaddr:0x40000 ],

  This corresponds to two segments that cover these virtual address ranges:

       0x30000...0x34000
       0x40000...0x48000

  If the loader decides to load the first segment at address 0xa0000000
  then the segments' load address ranges will be:

       0xa0030000...0xa0034000
       0xa0040000...0xa0048000

  In other words, all segments must be loaded at an address that has the same
  constant offset from their p_vaddr value. This offset is computed as the
  difference between the first segment's load address and its p_vaddr value.

  However, in practice, segments do _not_ start at page boundaries. Since we
  can only memory-map at page boundaries, this means that the bias is
  computed as:

       load_bias = phdr0_load_address - page_start(phdr0->p_vaddr)

  (NOTE: The value must be used as a 32-bit unsigned integer, to deal with
  possible wrap-around UINT32_MAX for large p_vaddr values).

  Also, phdr0_load_address must start at a page boundary, with
  the segment's real content starting at:

       phdr0_load_address + page_offset(phdr0->p_vaddr)

  Note that ELF requires the following condition to make the mmap()-ing work:

      page_offset(phdr0->p_vaddr) == page_offset(phdr0->p_offset)

  The load_bias must be added to any p_vaddr value read from the ELF file to
  determine the corresponding memory address.

 **/

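/* A minimal worked sketch of the bias computation described above, using the
 * example segments from this note. The values are illustrative only; the
 * real computation happens in ElfReader::ReserveAddressSpace() and
 * ElfReader::LoadSegments() below.
 *
 *   ElfW(Addr) p_vaddr = 0x30000;                // first PT_LOAD's p_vaddr
 *   ElfW(Addr) phdr0_load_address = 0xa0030000;  // chosen by the loader
 *   ElfW(Addr) load_bias = phdr0_load_address - page_start(p_vaddr);
 *   // load_bias == 0xa0030000 - 0x30000 == 0xa0000000; every segment is
 *   // then mapped at page_start(load_bias + p_vaddr).
 */
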
static const size_t kPageSize = page_size();

/*
 * Generic PMD size calculation:
 *  - Each page table (PT) is of size 1 page.
 *  - Each page table entry (PTE) is of size 64 bits.
 *  - Each PTE locates one physical page frame (PFN) of size 1 page.
 *  - A PMD entry locates 1 page table (PT)
 *
 *   PMD size = Num entries in a PT * page_size
 */
static const size_t kPmdSize = (kPageSize / sizeof(uint64_t)) * kPageSize;
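// Worked example of the formula above, assuming 64-bit PTEs:
//   4KiB pages:  (4096 / 8) * 4096   == 512 * 4KiB   == 2MiB
//   16KiB pages: (16384 / 8) * 16384 == 2048 * 16KiB == 32MiB
// kPmdSize is therefore the span of virtual memory covered by one page
// table, i.e. the smallest unit the kernel can back with a huge page.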

ElfReader::ElfReader()
    : did_read_(false), did_load_(false), fd_(-1), file_offset_(0), file_size_(0), phdr_num_(0),
      phdr_table_(nullptr), shdr_table_(nullptr), shdr_num_(0), dynamic_(nullptr), strtab_(nullptr),
      strtab_size_(0), load_start_(nullptr), load_size_(0), load_bias_(0), loaded_phdr_(nullptr),
      mapped_by_caller_(false) {
}

bool ElfReader::Read(const char* name, int fd, off64_t file_offset, off64_t file_size) {
  if (did_read_) {
    return true;
  }
  name_ = name;
  fd_ = fd;
  file_offset_ = file_offset;
  file_size_ = file_size;

  if (ReadElfHeader() &&
      VerifyElfHeader() &&
      ReadProgramHeaders() &&
      ReadSectionHeaders() &&
      ReadDynamicSection() &&
      ReadPadSegmentNote()) {
    did_read_ = true;
  }

  if (kPageSize == 0x4000 && phdr_table_get_minimum_alignment(phdr_table_, phdr_num_) == 0x1000) {
    // This prop needs to be read on 16KiB devices for each ELF where min_palign is 4KiB.
    // It cannot be cached since the developer may toggle app compat on/off.
    // This check will be removed once app compat is made the default on 16KiB devices.
    should_use_16kib_app_compat_ =
        ::android::base::GetBoolProperty("bionic.linker.16kb.app_compat.enabled", false);
  }

  return did_read_;
}

bool ElfReader::Load(address_space_params* address_space) {
  CHECK(did_read_);
  if (did_load_) {
    return true;
  }
  bool reserveSuccess = ReserveAddressSpace(address_space);
  if (reserveSuccess && LoadSegments() && FindPhdr() &&
      FindGnuPropertySection()) {
    did_load_ = true;
#if defined(__aarch64__)
    // For Armv8.5-A loaded executable segments may require PROT_BTI.
    if (note_gnu_property_.IsBTICompatible()) {
      did_load_ =
          (phdr_table_protect_segments(phdr_table_, phdr_num_, load_bias_, should_pad_segments_,
                                       should_use_16kib_app_compat_, &note_gnu_property_) == 0);
    }
#endif
  }
  if (reserveSuccess && !did_load_) {
    if (load_start_ != nullptr && load_size_ != 0) {
      if (!mapped_by_caller_) {
        munmap(load_start_, load_size_);
      }
    }
  }

  return did_load_;
}

const char* ElfReader::get_string(ElfW(Word) index) const {
  CHECK(strtab_ != nullptr);
  CHECK(index < strtab_size_);

  return strtab_ + index;
}

bool ElfReader::ReadElfHeader() {
  ssize_t rc = TEMP_FAILURE_RETRY(pread64(fd_, &header_, sizeof(header_), file_offset_));
  if (rc < 0) {
    DL_ERR("can't read file \"%s\": %s", name_.c_str(), strerror(errno));
    return false;
  }

  if (rc != sizeof(header_)) {
    DL_ERR("\"%s\" is too small to be an ELF executable: only found %zd bytes", name_.c_str(),
           static_cast<size_t>(rc));
    return false;
  }
  return true;
}

static const char* EM_to_string(int em) {
  if (em == EM_386) return "EM_386";
  if (em == EM_AARCH64) return "EM_AARCH64";
  if (em == EM_ARM) return "EM_ARM";
  if (em == EM_RISCV) return "EM_RISCV";
  if (em == EM_X86_64) return "EM_X86_64";
  return "EM_???";
}

bool ElfReader::VerifyElfHeader() {
  if (memcmp(header_.e_ident, ELFMAG, SELFMAG) != 0) {
    DL_ERR("\"%s\" has bad ELF magic: %02x%02x%02x%02x", name_.c_str(),
           header_.e_ident[0], header_.e_ident[1], header_.e_ident[2], header_.e_ident[3]);
    return false;
  }

  // Try to give a clear diagnostic for ELF class mismatches, since they're
  // an easy mistake to make during the 32-bit/64-bit transition period.
  int elf_class = header_.e_ident[EI_CLASS];
#if defined(__LP64__)
  if (elf_class != ELFCLASS64) {
    if (elf_class == ELFCLASS32) {
      DL_ERR("\"%s\" is 32-bit instead of 64-bit", name_.c_str());
    } else {
      DL_ERR("\"%s\" has unknown ELF class: %d", name_.c_str(), elf_class);
    }
    return false;
  }
#else
  if (elf_class != ELFCLASS32) {
    if (elf_class == ELFCLASS64) {
      DL_ERR("\"%s\" is 64-bit instead of 32-bit", name_.c_str());
    } else {
      DL_ERR("\"%s\" has unknown ELF class: %d", name_.c_str(), elf_class);
    }
    return false;
  }
#endif

  if (header_.e_ident[EI_DATA] != ELFDATA2LSB) {
    DL_ERR("\"%s\" not little-endian: %d", name_.c_str(), header_.e_ident[EI_DATA]);
    return false;
  }

  if (header_.e_type != ET_DYN) {
    DL_ERR("\"%s\" has unexpected e_type: %d", name_.c_str(), header_.e_type);
    return false;
  }

  if (header_.e_version != EV_CURRENT) {
    DL_ERR("\"%s\" has unexpected e_version: %d", name_.c_str(), header_.e_version);
    return false;
  }

  if (header_.e_machine != GetTargetElfMachine()) {
    DL_ERR("\"%s\" is for %s (%d) instead of %s (%d)",
           name_.c_str(),
           EM_to_string(header_.e_machine), header_.e_machine,
           EM_to_string(GetTargetElfMachine()), GetTargetElfMachine());
    return false;
  }

  if (header_.e_shentsize != sizeof(ElfW(Shdr))) {
    if (get_application_target_sdk_version() >= 26) {
      DL_ERR_AND_LOG("\"%s\" has unsupported e_shentsize: 0x%x (expected 0x%zx)",
                     name_.c_str(), header_.e_shentsize, sizeof(ElfW(Shdr)));
      return false;
    }
    DL_WARN_documented_change(26,
                              "invalid-elf-header_section-headers-enforced-for-api-level-26",
                              "\"%s\" has unsupported e_shentsize 0x%x (expected 0x%zx)",
                              name_.c_str(), header_.e_shentsize, sizeof(ElfW(Shdr)));
    add_dlwarning(name_.c_str(), "has invalid ELF header");
  }

  if (header_.e_shstrndx == 0) {
    if (get_application_target_sdk_version() >= 26) {
      DL_ERR_AND_LOG("\"%s\" has invalid e_shstrndx", name_.c_str());
      return false;
    }
    DL_WARN_documented_change(26,
                              "invalid-elf-header_section-headers-enforced-for-api-level-26",
                              "\"%s\" has invalid e_shstrndx", name_.c_str());
    add_dlwarning(name_.c_str(), "has invalid ELF header");
  }

  return true;
}

bool ElfReader::CheckFileRange(ElfW(Addr) offset, size_t size, size_t alignment) {
  off64_t range_start;
  off64_t range_end;

  // Only the ELF header can be located at offset 0. This function is called
  // to check the DYNSYM and DYNAMIC sections and phdr/shdr tables - none of
  // them can be at offset 0.

  return offset > 0 &&
         safe_add(&range_start, file_offset_, offset) &&
         safe_add(&range_end, range_start, size) &&
         (range_start < file_size_) &&
         (range_end <= file_size_) &&
         ((offset % alignment) == 0);
}
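
// Illustration of why safe_add() is used above (values are hypothetical):
// with a hostile ELF, `offset` can be chosen so large that
// `file_offset_ + offset` (or `range_start + size`) wraps around off64_t,
// producing a small or negative range_end that would slip past a naive
// `range_end <= file_size_` check. safe_add() reports the overflow instead
// of wrapping, so such headers are rejected.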

// Loads the program header table from an ELF file into a read-only private
// anonymous mmap-ed block.
bool ElfReader::ReadProgramHeaders() {
  phdr_num_ = header_.e_phnum;

  // Like the kernel, we only accept program header tables that
  // are smaller than 64KiB.
  if (phdr_num_ < 1 || phdr_num_ > 65536/sizeof(ElfW(Phdr))) {
    DL_ERR("\"%s\" has invalid e_phnum: %zd", name_.c_str(), phdr_num_);
    return false;
  }

  // Boundary checks
  size_t size = phdr_num_ * sizeof(ElfW(Phdr));
  if (!CheckFileRange(header_.e_phoff, size, alignof(ElfW(Phdr)))) {
    DL_ERR_AND_LOG("\"%s\" has invalid phdr offset/size: %zu/%zu",
                   name_.c_str(),
                   static_cast<size_t>(header_.e_phoff),
                   size);
    return false;
  }

  if (!phdr_fragment_.Map(fd_, file_offset_, header_.e_phoff, size)) {
    DL_ERR("\"%s\" phdr mmap failed: %m", name_.c_str());
    return false;
  }

  phdr_table_ = static_cast<ElfW(Phdr)*>(phdr_fragment_.data());
  return true;
}

bool ElfReader::ReadSectionHeaders() {
  shdr_num_ = header_.e_shnum;

  if (shdr_num_ == 0) {
    DL_ERR_AND_LOG("\"%s\" has no section headers", name_.c_str());
    return false;
  }

  size_t size = shdr_num_ * sizeof(ElfW(Shdr));
  if (!CheckFileRange(header_.e_shoff, size, alignof(const ElfW(Shdr)))) {
    DL_ERR_AND_LOG("\"%s\" has invalid shdr offset/size: %zu/%zu",
                   name_.c_str(),
                   static_cast<size_t>(header_.e_shoff),
                   size);
    return false;
  }

  if (!shdr_fragment_.Map(fd_, file_offset_, header_.e_shoff, size)) {
    DL_ERR("\"%s\" shdr mmap failed: %m", name_.c_str());
    return false;
  }

  shdr_table_ = static_cast<const ElfW(Shdr)*>(shdr_fragment_.data());
  return true;
}

bool ElfReader::ReadDynamicSection() {
  // 1. Find .dynamic section (in section headers)
  const ElfW(Shdr)* dynamic_shdr = nullptr;
  for (size_t i = 0; i < shdr_num_; ++i) {
    if (shdr_table_[i].sh_type == SHT_DYNAMIC) {
      dynamic_shdr = &shdr_table_[i];
      break;
    }
  }

  if (dynamic_shdr == nullptr) {
    DL_ERR_AND_LOG("\"%s\" .dynamic section header was not found", name_.c_str());
    return false;
  }

  // Make sure dynamic_shdr offset and size match the PT_DYNAMIC phdr
  size_t pt_dynamic_offset = 0;
  size_t pt_dynamic_filesz = 0;
  for (size_t i = 0; i < phdr_num_; ++i) {
    const ElfW(Phdr)* phdr = &phdr_table_[i];
    if (phdr->p_type == PT_DYNAMIC) {
      pt_dynamic_offset = phdr->p_offset;
      pt_dynamic_filesz = phdr->p_filesz;
    }
  }

  if (pt_dynamic_offset != dynamic_shdr->sh_offset) {
    if (get_application_target_sdk_version() >= 26) {
      DL_ERR_AND_LOG("\"%s\" .dynamic section has invalid offset: 0x%zx, "
                     "expected to match PT_DYNAMIC offset: 0x%zx",
                     name_.c_str(),
                     static_cast<size_t>(dynamic_shdr->sh_offset),
                     pt_dynamic_offset);
      return false;
    }
    DL_WARN_documented_change(26,
                              "invalid-elf-header_section-headers-enforced-for-api-level-26",
                              "\"%s\" .dynamic section has invalid offset: 0x%zx "
                              "(expected to match PT_DYNAMIC offset 0x%zx)",
                              name_.c_str(),
                              static_cast<size_t>(dynamic_shdr->sh_offset),
                              pt_dynamic_offset);
    add_dlwarning(name_.c_str(), "invalid .dynamic section");
  }

  if (pt_dynamic_filesz != dynamic_shdr->sh_size) {
    if (get_application_target_sdk_version() >= 26) {
      DL_ERR_AND_LOG("\"%s\" .dynamic section has invalid size: 0x%zx, "
                     "expected to match PT_DYNAMIC filesz: 0x%zx",
                     name_.c_str(),
                     static_cast<size_t>(dynamic_shdr->sh_size),
                     pt_dynamic_filesz);
      return false;
    }
    DL_WARN_documented_change(26,
                              "invalid-elf-header_section-headers-enforced-for-api-level-26",
                              "\"%s\" .dynamic section has invalid size: 0x%zx "
                              "(expected to match PT_DYNAMIC filesz 0x%zx)",
                              name_.c_str(),
                              static_cast<size_t>(dynamic_shdr->sh_size),
                              pt_dynamic_filesz);
    add_dlwarning(name_.c_str(), "invalid .dynamic section");
  }

  if (dynamic_shdr->sh_link >= shdr_num_) {
    DL_ERR_AND_LOG("\"%s\" .dynamic section has invalid sh_link: %d",
                   name_.c_str(),
                   dynamic_shdr->sh_link);
    return false;
  }

  const ElfW(Shdr)* strtab_shdr = &shdr_table_[dynamic_shdr->sh_link];

  if (strtab_shdr->sh_type != SHT_STRTAB) {
    DL_ERR_AND_LOG("\"%s\" .dynamic section has invalid link(%d) sh_type: %d (expected SHT_STRTAB)",
                   name_.c_str(), dynamic_shdr->sh_link, strtab_shdr->sh_type);
    return false;
  }

  if (!CheckFileRange(dynamic_shdr->sh_offset, dynamic_shdr->sh_size, alignof(const ElfW(Dyn)))) {
    DL_ERR_AND_LOG("\"%s\" has invalid offset/size of .dynamic section", name_.c_str());
    return false;
  }

  if (!dynamic_fragment_.Map(fd_, file_offset_, dynamic_shdr->sh_offset, dynamic_shdr->sh_size)) {
    DL_ERR("\"%s\" dynamic section mmap failed: %m", name_.c_str());
    return false;
  }

  dynamic_ = static_cast<const ElfW(Dyn)*>(dynamic_fragment_.data());

  if (!CheckFileRange(strtab_shdr->sh_offset, strtab_shdr->sh_size, alignof(const char))) {
    DL_ERR_AND_LOG("\"%s\" has invalid offset/size of the .strtab section linked from .dynamic section",
                   name_.c_str());
    return false;
  }

  if (!strtab_fragment_.Map(fd_, file_offset_, strtab_shdr->sh_offset, strtab_shdr->sh_size)) {
    DL_ERR("\"%s\" strtab section mmap failed: %m", name_.c_str());
    return false;
  }

  strtab_ = static_cast<const char*>(strtab_fragment_.data());
  strtab_size_ = strtab_fragment_.size();
  return true;
}

/* Returns the size of the extent of all the possibly non-contiguous
 * loadable segments in an ELF program header table. This corresponds
 * to the page-aligned size in bytes that needs to be reserved in the
 * process' address space. If there are no loadable segments, 0 is
 * returned.
 *
 * If out_min_vaddr or out_max_vaddr are not null, they will be
 * set to the minimum and maximum addresses of pages to be reserved,
 * or 0 if there is nothing to load.
 */
size_t phdr_table_get_load_size(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                                ElfW(Addr)* out_min_vaddr,
                                ElfW(Addr)* out_max_vaddr) {
  ElfW(Addr) min_vaddr = UINTPTR_MAX;
  ElfW(Addr) max_vaddr = 0;

  bool found_pt_load = false;
  for (size_t i = 0; i < phdr_count; ++i) {
    const ElfW(Phdr)* phdr = &phdr_table[i];

    if (phdr->p_type != PT_LOAD) {
      continue;
    }
    found_pt_load = true;

    if (phdr->p_vaddr < min_vaddr) {
      min_vaddr = phdr->p_vaddr;
    }

    if (phdr->p_vaddr + phdr->p_memsz > max_vaddr) {
      max_vaddr = phdr->p_vaddr + phdr->p_memsz;
    }
  }
  if (!found_pt_load) {
    min_vaddr = 0;
  }

  min_vaddr = page_start(min_vaddr);
  max_vaddr = page_end(max_vaddr);

  if (out_min_vaddr != nullptr) {
    *out_min_vaddr = min_vaddr;
  }
  if (out_max_vaddr != nullptr) {
    *out_max_vaddr = max_vaddr;
  }
  return max_vaddr - min_vaddr;
}
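
/* Worked example, using the two segments from the technical note above with
 * 4KiB pages:
 *   min_vaddr = page_start(0x30000)        = 0x30000
 *   max_vaddr = page_end(0x40000 + 0x8000) = 0x48000
 *   load size = 0x48000 - 0x30000          = 0x18000 (96KiB)
 * This is the size of the PROT_NONE reservation that
 * ElfReader::ReserveAddressSpace() creates before any segment is mapped.
 */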

// Returns the maximum p_align associated with a loadable segment in the ELF
// program header table. Used to determine whether the file should be loaded at
// a specific virtual address alignment for use with huge pages.
size_t phdr_table_get_maximum_alignment(const ElfW(Phdr)* phdr_table, size_t phdr_count) {
  size_t maximum_alignment = page_size();

  for (size_t i = 0; i < phdr_count; ++i) {
    const ElfW(Phdr)* phdr = &phdr_table[i];

    // p_align must be 0, 1, or a positive, integral power of two.
    if (phdr->p_type != PT_LOAD || ((phdr->p_align & (phdr->p_align - 1)) != 0)) {
      continue;
    }

    maximum_alignment = std::max(maximum_alignment, static_cast<size_t>(phdr->p_align));
  }

#if defined(__LP64__)
  return maximum_alignment;
#else
  return page_size();
#endif
}

// Returns the minimum p_align associated with a loadable segment in the ELF
// program header table. Used to determine if the program alignment is compatible
// with the page size of this system.
size_t phdr_table_get_minimum_alignment(const ElfW(Phdr)* phdr_table, size_t phdr_count) {
  size_t minimum_alignment = page_size();

  for (size_t i = 0; i < phdr_count; ++i) {
    const ElfW(Phdr)* phdr = &phdr_table[i];

    // p_align must be 0, 1, or a positive, integral power of two.
    if (phdr->p_type != PT_LOAD || ((phdr->p_align & (phdr->p_align - 1)) != 0)) {
      continue;
    }

    if (phdr->p_align <= 1) {
      continue;
    }

    minimum_alignment = std::min(minimum_alignment, static_cast<size_t>(phdr->p_align));
  }

  return minimum_alignment;
}

// Reserve a virtual address range such that if its limits were extended to the next 2**align
// boundary, it would not overlap with any existing mappings.
static void* ReserveWithAlignmentPadding(size_t size, size_t mapping_align, size_t start_align,
                                         void** out_gap_start, size_t* out_gap_size) {
  int mmap_flags = MAP_PRIVATE | MAP_ANONYMOUS;
  // Reserve enough space to properly align the library's start address.
  mapping_align = std::max(mapping_align, start_align);
  if (mapping_align == page_size()) {
    void* mmap_ptr = mmap(nullptr, size, PROT_NONE, mmap_flags, -1, 0);
    if (mmap_ptr == MAP_FAILED) {
      return nullptr;
    }
    return mmap_ptr;
  }

  // Minimum alignment of shared library gap. For efficiency, this should match the second level
  // page size of the platform.
#if defined(__LP64__)
  constexpr size_t kGapAlignment = 1ul << 21;  // 2MB
#else
  constexpr size_t kGapAlignment = 0;
#endif
  // Maximum gap size, in the units of kGapAlignment.
  constexpr size_t kMaxGapUnits = 32;
  // Allocate enough space so that the end of the desired region aligned up is still inside the
  // mapping.
  size_t mmap_size = align_up(size, mapping_align) + mapping_align - page_size();
  uint8_t* mmap_ptr =
      reinterpret_cast<uint8_t*>(mmap(nullptr, mmap_size, PROT_NONE, mmap_flags, -1, 0));
  if (mmap_ptr == MAP_FAILED) {
    return nullptr;
  }
  size_t gap_size = 0;
  size_t first_byte = reinterpret_cast<size_t>(align_up(mmap_ptr, mapping_align));
  size_t last_byte = reinterpret_cast<size_t>(align_down(mmap_ptr + mmap_size, mapping_align) - 1);
  if (kGapAlignment && first_byte / kGapAlignment != last_byte / kGapAlignment) {
    // This library crosses a 2MB boundary and will fragment a new huge page.
    // Let's take advantage of that and insert a random number of inaccessible huge pages before it
    // to improve address randomization and make it harder to locate this library code by probing.
    munmap(mmap_ptr, mmap_size);
    mapping_align = std::max(mapping_align, kGapAlignment);
    gap_size =
        kGapAlignment * (is_first_stage_init() ? 1 : arc4random_uniform(kMaxGapUnits - 1) + 1);
    mmap_size = align_up(size + gap_size, mapping_align) + mapping_align - page_size();
    mmap_ptr = reinterpret_cast<uint8_t*>(mmap(nullptr, mmap_size, PROT_NONE, mmap_flags, -1, 0));
    if (mmap_ptr == MAP_FAILED) {
      return nullptr;
    }
  }

  uint8_t *gap_end, *gap_start;
  if (gap_size) {
    gap_end = align_down(mmap_ptr + mmap_size, kGapAlignment);
    gap_start = gap_end - gap_size;
  } else {
    gap_start = gap_end = mmap_ptr + mmap_size;
  }

  uint8_t* first = align_up(mmap_ptr, mapping_align);
  uint8_t* last = align_down(gap_start, mapping_align) - size;

  // arc4random* is not available in first stage init because /dev/urandom hasn't yet been
  // created. Don't randomize then.
  size_t n = is_first_stage_init() ? 0 : arc4random_uniform((last - first) / start_align + 1);
  uint8_t* start = first + n * start_align;
  // Unmap the extra space around the allocation.
  // Keep it mapped PROT_NONE on 64-bit targets where address space is plentiful to make it harder
  // to defeat ASLR by probing for readable memory mappings.
  munmap(mmap_ptr, start - mmap_ptr);
  munmap(start + size, gap_start - (start + size));
  if (gap_end != mmap_ptr + mmap_size) {
    munmap(gap_end, mmap_ptr + mmap_size - gap_end);
  }
  *out_gap_start = gap_start;
  *out_gap_size = gap_size;
  return start;
}
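
/* Illustrative sizing for the over-allocation above (numbers assumed, not
 * taken from a real library): size = 0x50000, mapping_align = 0x40000,
 * page_size() = 0x1000:
 *   mmap_size = align_up(0x50000, 0x40000) + 0x40000 - 0x1000
 *             = 0x80000 + 0x3f000 = 0xbf000
 * Any 0x40000-aligned start inside that reservation keeps the full 0x50000
 * bytes within the mapping, which is what makes the munmap() trimming at
 * the end safe.
 */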

// Reserve a virtual address range big enough to hold all loadable
// segments of a program header table. This is done by creating a
// private anonymous mmap() with PROT_NONE.
bool ElfReader::ReserveAddressSpace(address_space_params* address_space) {
  ElfW(Addr) min_vaddr;
  load_size_ = phdr_table_get_load_size(phdr_table_, phdr_num_, &min_vaddr);
  if (load_size_ == 0) {
    DL_ERR("\"%s\" has no loadable segments", name_.c_str());
    return false;
  }

  if (should_use_16kib_app_compat_) {
    // Reserve additional space for aligning the permission boundary in compat loading.
    // Up to kPageSize-kCompatPageSize additional space is needed, but reservation
    // is done with mmap which gives kPageSize multiple-sized reservations.
    load_size_ += kPageSize;
  }

  uint8_t* addr = reinterpret_cast<uint8_t*>(min_vaddr);
  void* start;

  if (load_size_ > address_space->reserved_size) {
    if (address_space->must_use_address) {
      DL_ERR("reserved address space %zd smaller than %zd bytes needed for \"%s\"",
             load_size_ - address_space->reserved_size, load_size_, name_.c_str());
      return false;
    }
    size_t start_alignment = page_size();
    if (get_transparent_hugepages_supported() && get_application_target_sdk_version() >= 31) {
      size_t maximum_alignment = phdr_table_get_maximum_alignment(phdr_table_, phdr_num_);
      // Limit alignment to PMD size as other alignments reduce the number of
      // bits available for ASLR for no benefit.
      start_alignment = maximum_alignment == kPmdSize ? kPmdSize : page_size();
    }
    start = ReserveWithAlignmentPadding(load_size_, kLibraryAlignment, start_alignment, &gap_start_,
                                        &gap_size_);
    if (start == nullptr) {
      DL_ERR("couldn't reserve %zd bytes of address space for \"%s\"", load_size_, name_.c_str());
      return false;
    }
  } else {
    start = address_space->start_addr;
    gap_start_ = nullptr;
    gap_size_ = 0;
    mapped_by_caller_ = true;

    // Update the reserved address space to subtract the space used by this library.
    address_space->start_addr = reinterpret_cast<uint8_t*>(address_space->start_addr) + load_size_;
    address_space->reserved_size -= load_size_;
  }

  load_start_ = start;
  load_bias_ = reinterpret_cast<uint8_t*>(start) - addr;

  if (should_use_16kib_app_compat_) {
    // In compat mode make the initial mapping RW since the ELF contents will be read
    // into it, instead of mapped over it.
    mprotect(reinterpret_cast<void*>(start), load_size_, PROT_READ | PROT_WRITE);
  }

  return true;
}

/*
 * Returns true if the kernel supports page size migration, else false.
 */
bool page_size_migration_supported() {
  static bool pgsize_migration_enabled = []() {
    std::string enabled;
    if (!android::base::ReadFileToString("/sys/kernel/mm/pgsize_migration/enabled", &enabled)) {
      return false;
    }
    return enabled.find("1") != std::string::npos;
  }();
  return pgsize_migration_enabled;
}

// Find the ELF note of type NT_ANDROID_TYPE_PAD_SEGMENT and check that the desc value is 1.
bool ElfReader::ReadPadSegmentNote() {
  if (!page_size_migration_supported()) {
    // Don't attempt to read the note, since segment extension isn't
    // supported; but return true so that loading can continue normally.
    return true;
  }

  // The ELF can have multiple PT_NOTE's, check them all
  for (size_t i = 0; i < phdr_num_; ++i) {
    const ElfW(Phdr)* phdr = &phdr_table_[i];

    if (phdr->p_type != PT_NOTE) {
      continue;
    }

    // Some obfuscated ELFs may contain "empty" PT_NOTE program headers that don't
    // point to any part of the ELF (p_memsz == 0). Skip these since there is
    // nothing to decode. See: b/324468126
    if (phdr->p_memsz == 0) {
      continue;
    }

    // If the PT_NOTE extends beyond the file, the ELF is doing something
    // strange -- obfuscation, embedding hidden loaders, ...
    //
    // It doesn't contain the pad_segment note. Skip it to avoid SIGBUS
    // by accesses beyond the file.
    off64_t note_end_off = file_offset_ + phdr->p_offset + phdr->p_filesz;
    if (note_end_off > file_size_) {
      continue;
    }

    // note_fragment is scoped to within the loop so that there is
    // at most 1 PT_NOTE mapped at any time during this search.
    MappedFileFragment note_fragment;
    if (!note_fragment.Map(fd_, file_offset_, phdr->p_offset, phdr->p_memsz)) {
      DL_ERR("\"%s\": PT_NOTE mmap(nullptr, %p, PROT_READ, MAP_PRIVATE, %d, %p) failed: %m",
             name_.c_str(), reinterpret_cast<void*>(phdr->p_memsz), fd_,
             reinterpret_cast<void*>(page_start(file_offset_ + phdr->p_offset)));
      return false;
    }

    const ElfW(Nhdr)* note_hdr = nullptr;
    const char* note_desc = nullptr;
    if (!__get_elf_note(NT_ANDROID_TYPE_PAD_SEGMENT, "Android",
                        reinterpret_cast<ElfW(Addr)>(note_fragment.data()),
                        phdr, &note_hdr, &note_desc)) {
      continue;
    }

    if (note_hdr->n_descsz != sizeof(ElfW(Word))) {
      DL_ERR("\"%s\" NT_ANDROID_TYPE_PAD_SEGMENT note has unexpected n_descsz: %u",
             name_.c_str(), static_cast<unsigned int>(note_hdr->n_descsz));
      return false;
    }

    // 1 == enabled, 0 == disabled
    should_pad_segments_ = *reinterpret_cast<const ElfW(Word)*>(note_desc) == 1;
    return true;
  }

  return true;
}
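
/* Rough shape of the note this loop searches for (a sketch; the canonical
 * layout comes from bionic_asm_note.h and the static linker, not from the
 * code above):
 *
 *   ElfW(Nhdr) { n_namesz = 8,    // "Android" plus NUL
 *                n_descsz = 4,    // one ElfW(Word)
 *                n_type   = NT_ANDROID_TYPE_PAD_SEGMENT }
 *   char name[8]    = "Android";
 *   ElfW(Word) desc = 1;          // 1 == pad segments, 0 == don't
 */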

static inline void _extend_load_segment_vma(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                                            size_t phdr_idx, ElfW(Addr)* p_memsz,
                                            ElfW(Addr)* p_filesz, bool should_pad_segments,
                                            bool should_use_16kib_app_compat) {
  // NOTE: Segment extension is only applicable where the ELF's max-page-size > runtime page size;
  // to save kernel VMA slab memory. 16KiB compat mode is the exact opposite scenario.
  if (should_use_16kib_app_compat) {
    return;
  }

  const ElfW(Phdr)* phdr = &phdr_table[phdr_idx];
  const ElfW(Phdr)* next = nullptr;
  size_t next_idx = phdr_idx + 1;

  // Don't do segment extension for p_align > 64KiB, such ELFs already existed in the
  // field e.g. 2MiB p_align for THPs and are relatively small in number.
  //
  // The kernel can only represent padding for p_align up to 64KiB. This is because
  // the kernel uses 4 available bits in the vm_area_struct to represent padding
  // extent; and so cannot enable mitigations to avoid breaking app compatibility for
  // p_aligns > 64KiB.
  //
  // Don't perform segment extension on these to avoid app compatibility issues.
  if (phdr->p_align <= kPageSize || phdr->p_align > 64*1024 || !should_pad_segments) {
    return;
  }

  if (next_idx < phdr_count && phdr_table[next_idx].p_type == PT_LOAD) {
    next = &phdr_table[next_idx];
  }

  // If this is the last LOAD segment, no extension is needed
  if (!next || *p_memsz != *p_filesz) {
    return;
  }

  ElfW(Addr) next_start = page_start(next->p_vaddr);
  ElfW(Addr) curr_end = page_end(phdr->p_vaddr + *p_memsz);

  // If adjacent segment mappings overlap, no extension is needed.
  if (curr_end >= next_start) {
    return;
  }

  // Extend the LOAD segment mapping to be contiguous with that of
  // the next LOAD segment.
  ElfW(Addr) extend = next_start - curr_end;
  *p_memsz += extend;
  *p_filesz += extend;
}
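
/* Worked example, assuming a 4KiB-page kernel loading a 16KiB-aligned ELF:
 * a LOAD segment with p_memsz == p_filesz ends at vaddr 0x5000 and the next
 * LOAD segment starts at vaddr 0x8000. Then:
 *   curr_end   = page_end(0x5000)   = 0x5000
 *   next_start = page_start(0x8000) = 0x8000
 *   extend     = 0x8000 - 0x5000    = 0x3000
 * p_memsz and p_filesz grow by 0x3000, so the two mappings become
 * contiguous and the gap doesn't cost the kernel a separate VMA.
 */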

bool ElfReader::MapSegment(size_t seg_idx, size_t len) {
  const ElfW(Phdr)* phdr = &phdr_table_[seg_idx];

  void* start = reinterpret_cast<void*>(page_start(phdr->p_vaddr + load_bias_));

  // The ELF could be loaded directly from a zipped APK;
  // the zip offset must be added to find the segment offset.
  const ElfW(Addr) offset = file_offset_ + page_start(phdr->p_offset);

  int prot = PFLAGS_TO_PROT(phdr->p_flags);

  void* seg_addr = mmap64(start, len, prot, MAP_FIXED | MAP_PRIVATE, fd_, offset);

  if (seg_addr == MAP_FAILED) {
    DL_ERR("couldn't map \"%s\" segment %zd: %m", name_.c_str(), seg_idx);
    return false;
  }

  // Mark segments as huge page eligible if they meet the requirements.
  if ((phdr->p_flags & PF_X) && phdr->p_align == kPmdSize &&
      get_transparent_hugepages_supported()) {
    madvise(seg_addr, len, MADV_HUGEPAGE);
  }

  return true;
}

void ElfReader::ZeroFillSegment(const ElfW(Phdr)* phdr) {
  // NOTE: In 16KiB app compat mode, the ELF mapping is anonymous, meaning that
  // RW segments are COW-ed from the kernel's zero page. So there is no need to
  // explicitly zero-fill until the last page's limit.
  if (should_use_16kib_app_compat_) {
    return;
  }

  ElfW(Addr) seg_start = phdr->p_vaddr + load_bias_;
  uint64_t unextended_seg_file_end = seg_start + phdr->p_filesz;

  // If the segment is writable, and does not end on a page boundary,
  // zero-fill it until the page limit.
  //
  // Do not attempt to zero the extended region past the first partial page,
  // since doing so may:
  //   1) Result in a SIGBUS, as the region is not backed by the underlying
  //      file.
  //   2) Break the COW backing, faulting in new anon pages for a region
  //      that will not be used.
  if ((phdr->p_flags & PF_W) != 0 && page_offset(unextended_seg_file_end) > 0) {
    memset(reinterpret_cast<void*>(unextended_seg_file_end), 0,
           kPageSize - page_offset(unextended_seg_file_end));
  }
}
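
/* Example, assuming 4KiB pages: a writable segment whose file content ends
 * at vaddr 0x4a80 has page_offset(0x4a80) == 0xa80, so the 0x580 bytes from
 * 0x4a80 up to the page limit at 0x5000 are zeroed here. Without this, the
 * tail of the last file-backed page would contain whatever bytes follow the
 * segment in the file, rather than the zeros the ELF rules above promise
 * for the [p_filesz, p_memsz) region.
 */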

void ElfReader::DropPaddingPages(const ElfW(Phdr)* phdr, uint64_t seg_file_end) {
  // NOTE: Padding pages are only applicable where the ELF's max-page-size > runtime page size;
  // 16KiB compat mode is the exact opposite scenario.
  if (should_use_16kib_app_compat_) {
    return;
  }

  ElfW(Addr) seg_start = phdr->p_vaddr + load_bias_;
  uint64_t unextended_seg_file_end = seg_start + phdr->p_filesz;

  uint64_t pad_start = page_end(unextended_seg_file_end);
  uint64_t pad_end = page_end(seg_file_end);
  CHECK(pad_start <= pad_end);

  uint64_t pad_len = pad_end - pad_start;
  if (pad_len == 0 || !page_size_migration_supported()) {
    return;
  }

  // Pages may be brought in due to readahead.
  // Drop the padding (zero) pages, to avoid reclaim work later.
  //
  // NOTE: The madvise() here is special, as it also serves to hint to the
  // kernel the portion of the LOAD segment that is padding.
  //
  // See: [1] https://android-review.googlesource.com/c/kernel/common/+/3032411
  //      [2] https://android-review.googlesource.com/c/kernel/common/+/3048835
  if (madvise(reinterpret_cast<void*>(pad_start), pad_len, MADV_DONTNEED)) {
    DL_WARN("\"%s\": madvise(0x%" PRIx64 ", 0x%" PRIx64 ", MADV_DONTNEED) failed: %m",
            name_.c_str(), pad_start, pad_len);
  }
}

bool ElfReader::MapBssSection(const ElfW(Phdr)* phdr, ElfW(Addr) seg_page_end,
                              ElfW(Addr) seg_file_end) {
  // NOTE: We do not need to handle .bss in 16KiB compat mode since the mapping
  // reservation is anonymous and RW to begin with.
  if (should_use_16kib_app_compat_) {
    return true;
  }

  // seg_file_end is now the first page address after the file content.
  seg_file_end = page_end(seg_file_end);

  if (seg_page_end <= seg_file_end) {
    return true;
  }

  // If seg_page_end is larger than seg_file_end, we need to zero
  // anything between them. This is done by using a private anonymous
  // map for all extra pages.
  size_t zeromap_size = seg_page_end - seg_file_end;
  void* zeromap =
      mmap(reinterpret_cast<void*>(seg_file_end), zeromap_size, PFLAGS_TO_PROT(phdr->p_flags),
           MAP_FIXED | MAP_ANONYMOUS | MAP_PRIVATE, -1, 0);
  if (zeromap == MAP_FAILED) {
    DL_ERR("couldn't map .bss section for \"%s\": %m", name_.c_str());
    return false;
  }

  // Set the VMA name using prctl
  prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, zeromap, zeromap_size, ".bss");

  return true;
}
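
/* Example, assuming 4KiB pages: if the file content ends at the (page
 * aligned) address 0x5000 but p_memsz extends the segment to seg_page_end
 * 0x8000, the 0x3000 bytes in [0x5000, 0x8000) have no file backing and are
 * mapped here as anonymous zero-filled pages carrying the segment's own
 * protection flags.
 */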
1001
Elliott Hughes650be4e2013-03-05 18:47:58 -08001002bool ElfReader::LoadSegments() {
Kalesh Singhce1c3cf2024-09-30 13:26:23 -07001003 // NOTE: The compat(legacy) page size (4096) must be used when aligning
1004 // the 4KiB segments for loading in compat mode. The larger 16KiB page size
1005 // will lead to overwriting adjacent segments since the ELF's segment(s)
1006 // are not 16KiB aligned.
1007 size_t seg_align = should_use_16kib_app_compat_ ? kCompatPageSize : kPageSize;
Kalesh Singhb23787f2024-09-05 08:22:06 +00001008
Steven Morelandfc89c8a2024-08-01 21:20:33 +00001009 size_t min_palign = phdr_table_get_minimum_alignment(phdr_table_, phdr_num_);
Kalesh Singhb23787f2024-09-05 08:22:06 +00001010 // Only enforce this on 16 KB systems with app compat disabled.
1011 // Apps may rely on undefined behavior here on 4 KB systems,
1012 // which is the norm before this change is introduced
1013 if (kPageSize >= 16384 && min_palign < kPageSize && !should_use_16kib_app_compat_) {
Steven Morelandfc89c8a2024-08-01 21:20:33 +00001014 DL_ERR("\"%s\" program alignment (%zu) cannot be smaller than system page size (%zu)",
1015 name_.c_str(), min_palign, kPageSize);
1016 return false;
1017 }
1018
Kalesh Singhce1c3cf2024-09-30 13:26:23 -07001019 if (!Setup16KiBAppCompat()) {
1020 DL_ERR("\"%s\" failed to setup 16KiB App Compat", name_.c_str());
1021 return false;
1022 }
1023
Elliott Hughes650be4e2013-03-05 18:47:58 -08001024 for (size_t i = 0; i < phdr_num_; ++i) {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001025 const ElfW(Phdr)* phdr = &phdr_table_[i];
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001026
Elliott Hughes650be4e2013-03-05 18:47:58 -08001027 if (phdr->p_type != PT_LOAD) {
1028 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001029 }
Elliott Hughes650be4e2013-03-05 18:47:58 -08001030
Kalesh Singh4084b552024-03-13 13:35:49 -07001031 ElfW(Addr) p_memsz = phdr->p_memsz;
1032 ElfW(Addr) p_filesz = phdr->p_filesz;
Kalesh Singhb23787f2024-09-05 08:22:06 +00001033 _extend_load_segment_vma(phdr_table_, phdr_num_, i, &p_memsz, &p_filesz, should_pad_segments_,
1034 should_use_16kib_app_compat_);
Kalesh Singh4084b552024-03-13 13:35:49 -07001035
Elliott Hughes650be4e2013-03-05 18:47:58 -08001036 // Segment addresses in memory.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001037 ElfW(Addr) seg_start = phdr->p_vaddr + load_bias_;
Kalesh Singh4084b552024-03-13 13:35:49 -07001038 ElfW(Addr) seg_end = seg_start + p_memsz;
Elliott Hughes650be4e2013-03-05 18:47:58 -08001039
Kalesh Singhb23787f2024-09-05 08:22:06 +00001040 ElfW(Addr) seg_page_end = align_up(seg_end, seg_align);
Elliott Hughes650be4e2013-03-05 18:47:58 -08001041
Kalesh Singh4084b552024-03-13 13:35:49 -07001042 ElfW(Addr) seg_file_end = seg_start + p_filesz;
Elliott Hughes650be4e2013-03-05 18:47:58 -08001043
1044 // File offsets.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001045 ElfW(Addr) file_start = phdr->p_offset;
Kalesh Singh4084b552024-03-13 13:35:49 -07001046 ElfW(Addr) file_end = file_start + p_filesz;
Elliott Hughes650be4e2013-03-05 18:47:58 -08001047
Kalesh Singhb23787f2024-09-05 08:22:06 +00001048 ElfW(Addr) file_page_start = align_down(file_start, seg_align);
Elliott Hughes0266ae52014-02-10 17:46:57 -08001049 ElfW(Addr) file_length = file_end - file_page_start;
Elliott Hughes650be4e2013-03-05 18:47:58 -08001050
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -07001051 if (file_size_ <= 0) {
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -07001052 DL_ERR("\"%s\" invalid file size: %" PRId64, name_.c_str(), file_size_);
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -07001053 return false;
1054 }
1055
Kalesh Singh4084b552024-03-13 13:35:49 -07001056 if (file_start + phdr->p_filesz > static_cast<size_t>(file_size_)) {
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -07001057 DL_ERR("invalid ELF file \"%s\" load segment[%zd]:"
1058 " p_offset (%p) + p_filesz (%p) ( = %p) past end of file (0x%" PRIx64 ")",
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -07001059 name_.c_str(), i, reinterpret_cast<void*>(phdr->p_offset),
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -07001060 reinterpret_cast<void*>(phdr->p_filesz),
Kalesh Singh4084b552024-03-13 13:35:49 -07001061 reinterpret_cast<void*>(file_start + phdr->p_filesz), file_size_);
Dmitriy Ivanov3f987f52015-06-25 15:51:41 -07001062 return false;
1063 }
1064
Brian Carlstrom82dcc792013-05-21 16:49:24 -07001065 if (file_length != 0) {
Dimitry Ivanov9700bab2016-08-10 18:54:06 -07001066 int prot = PFLAGS_TO_PROT(phdr->p_flags);
Dimitry Ivanov9700bab2016-08-10 18:54:06 -07001067 if ((prot & (PROT_EXEC | PROT_WRITE)) == (PROT_EXEC | PROT_WRITE)) {
Elliott Hughes4cc5a602016-11-15 16:54:16 -08001068 // W + E PT_LOAD segments are not allowed in O.
Elliott Hughes95c6cd72019-12-20 13:26:14 -08001069 if (get_application_target_sdk_version() >= 26) {
Elliott Hughes9076b0c2018-02-28 11:29:45 -08001070 DL_ERR_AND_LOG("\"%s\": W+E load segments are not allowed", name_.c_str());
Elliott Hughes4cc5a602016-11-15 16:54:16 -08001071 return false;
1072 }
Elliott Hughes95c6cd72019-12-20 13:26:14 -08001073 DL_WARN_documented_change(26,
Elliott Hughes9076b0c2018-02-28 11:29:45 -08001074 "writable-and-executable-segments-enforced-for-api-level-26",
1075 "\"%s\" has load segments that are both writable and executable",
1076 name_.c_str());
Elliott Hughes4cc5a602016-11-15 16:54:16 -08001077 add_dlwarning(name_.c_str(), "W+E load segments");
Dimitry Ivanov9700bab2016-08-10 18:54:06 -07001078 }
1079
Kalesh Singh86e04f62024-09-05 06:24:14 +00001080 // Pass the file_length, since it may have been extended by _extend_load_segment_vma().
Kalesh Singhce1c3cf2024-09-30 13:26:23 -07001081 if (should_use_16kib_app_compat_) {
1082 if (!CompatMapSegment(i, file_length)) {
1083 return false;
1084 }
1085 } else {
1086 if (!MapSegment(i, file_length)) {
1087 return false;
1088 }
Brian Carlstrom82dcc792013-05-21 16:49:24 -07001089 }
Elliott Hughes650be4e2013-03-05 18:47:58 -08001090 }
1091
Kalesh Singh37bcaea2024-09-05 06:32:07 +00001092 ZeroFillSegment(phdr);
Kalesh Singh1d3ba112024-03-06 17:33:36 -08001093
Kalesh Singhe0f4a372024-09-05 07:07:21 +00001094 DropPaddingPages(phdr, seg_file_end);
Elliott Hughes650be4e2013-03-05 18:47:58 -08001095
Kalesh Singh138a9552024-09-05 08:05:56 +00001096 if (!MapBssSection(phdr, seg_page_end, seg_file_end)) {
1097 return false;
Elliott Hughes650be4e2013-03-05 18:47:58 -08001098 }
1099 }
1100 return true;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001101}
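// Worked example of the file-offset arithmetic above, using hypothetical
// values and assuming seg_align == 0x1000: a segment with p_offset == 0x2f80
// and p_filesz == 0x100 gives
//   file_start      == 0x2f80
//   file_end        == 0x3080
//   file_page_start == align_down(0x2f80, 0x1000) == 0x2000
//   file_length     == 0x3080 - 0x2000 == 0x1080
// i.e. the mapped range is widened leftwards to the enclosing seg_align
// boundary, keeping the mmap file offset congruent with the segment's
// virtual address.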
1102
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001103/* Used internally to set the protection bits of all loaded segments,
1104 * with an optional set of extra flags (in practice, PROT_WRITE). Used by
1105 * phdr_table_protect_segments and phdr_table_unprotect_segments.
1106 */
1107static int _phdr_table_set_load_prot(const ElfW(Phdr)* phdr_table, size_t phdr_count,
Kalesh Singh4084b552024-03-13 13:35:49 -07001108 ElfW(Addr) load_bias, int extra_prot_flags,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001109 bool should_pad_segments, bool should_use_16kib_app_compat) {
Kalesh Singh4084b552024-03-13 13:35:49 -07001110 for (size_t i = 0; i < phdr_count; ++i) {
1111 const ElfW(Phdr)* phdr = &phdr_table[i];
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001112
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001113 if (phdr->p_type != PT_LOAD || (phdr->p_flags & PF_W) != 0) {
1114 continue;
1115 }
1116
Kalesh Singh4084b552024-03-13 13:35:49 -07001117 ElfW(Addr) p_memsz = phdr->p_memsz;
1118 ElfW(Addr) p_filesz = phdr->p_filesz;
Kalesh Singhb23787f2024-09-05 08:22:06 +00001119 _extend_load_segment_vma(phdr_table, phdr_count, i, &p_memsz, &p_filesz, should_pad_segments,
1120 should_use_16kib_app_compat);
Kalesh Singh4084b552024-03-13 13:35:49 -07001121
1122 ElfW(Addr) seg_page_start = page_start(phdr->p_vaddr + load_bias);
1123 ElfW(Addr) seg_page_end = page_end(phdr->p_vaddr + p_memsz + load_bias);
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001124
Tamas Petz8d55d182020-02-24 14:15:25 +01001125 int prot = PFLAGS_TO_PROT(phdr->p_flags) | extra_prot_flags;
1126 if ((prot & PROT_WRITE) != 0) {
Nick Kralevich8fdb3412015-04-01 16:57:50 -07001127 // make sure we're never simultaneously writable / executable
1128 prot &= ~PROT_EXEC;
1129 }
Tamas Petz8d55d182020-02-24 14:15:25 +01001130#if defined(__aarch64__)
1131 if ((prot & PROT_EXEC) == 0) {
1132 // Though it is not specified, don't add PROT_BTI if the segment is not
1133 // executable.
1134 prot &= ~PROT_BTI;
1135 }
1136#endif
Nick Kralevich8fdb3412015-04-01 16:57:50 -07001137
Tamas Petz8d55d182020-02-24 14:15:25 +01001138 int ret =
1139 mprotect(reinterpret_cast<void*>(seg_page_start), seg_page_end - seg_page_start, prot);
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001140 if (ret < 0) {
1141 return -1;
1142 }
1143 }
1144 return 0;
1145}
1146
1147/* Restore the original protection modes for all loadable segments.
1148 * Call this only after phdr_table_unprotect_segments and after
1149 * applying all relocations.
1150 *
Tamas Petz8d55d182020-02-24 14:15:25 +01001151 * AArch64: also called from linker_main and ElfReader::Load to apply
1152 * PROT_BTI to the main executable and other loaded shared objects.
1153 *
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001154 * Input:
1155 * phdr_table -> program header table
1156 * phdr_count -> number of entries in the table
1157 * load_bias -> load bias
Kalesh Singh4084b552024-03-13 13:35:49 -07001158 * should_pad_segments -> Are segments extended to avoid gaps in the memory map
Kalesh Singhb23787f2024-09-05 08:22:06 +00001159 * should_use_16kib_app_compat -> Is the ELF being loaded in 16KiB app compat mode.
Tamas Petz8d55d182020-02-24 14:15:25 +01001160 * prop -> GnuPropertySection or nullptr
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001161 * Return:
Mitch Phillips117e45e2023-10-20 13:32:33 +00001162 * 0 on success, -1 on failure (error code in errno).
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001163 */
Tamas Petz8d55d182020-02-24 14:15:25 +01001164int phdr_table_protect_segments(const ElfW(Phdr)* phdr_table, size_t phdr_count,
Kalesh Singh4084b552024-03-13 13:35:49 -07001165 ElfW(Addr) load_bias, bool should_pad_segments,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001166 bool should_use_16kib_app_compat,
Kalesh Singh4084b552024-03-13 13:35:49 -07001167 const GnuPropertySection* prop __unused) {
Tamas Petz8d55d182020-02-24 14:15:25 +01001168 int prot = 0;
1169#if defined(__aarch64__)
1170 if ((prop != nullptr) && prop->IsBTICompatible()) {
1171 prot |= PROT_BTI;
1172 }
1173#endif
Kalesh Singhb23787f2024-09-05 08:22:06 +00001174 return _phdr_table_set_load_prot(phdr_table, phdr_count, load_bias, prot, should_pad_segments,
1175 should_use_16kib_app_compat);
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001176}
1177
Florian Mayer4edc20d2024-10-30 14:24:26 -07001178static bool segment_needs_memtag_globals_remapping(const ElfW(Phdr) * phdr) {
1179 // For now, MTE globals are only supported on writable data segments.
1180 return phdr->p_type == PT_LOAD && !(phdr->p_flags & PF_X) && (phdr->p_flags & PF_W);
1181}
1182
1183/* When MTE globals are requested by the binary, and when the hardware supports
1184 * it, remap the executable's PT_LOAD data pages to have PROT_MTE.
1185 *
1186 * Returns 0 on success, -1 on failure (error code in errno).
1187 */
1188int remap_memtag_globals_segments(const ElfW(Phdr) * phdr_table __unused,
1189 size_t phdr_count __unused, ElfW(Addr) load_bias __unused) {
1190#if defined(__aarch64__)
1191 for (const ElfW(Phdr)* phdr = phdr_table; phdr < phdr_table + phdr_count; phdr++) {
1192 if (!segment_needs_memtag_globals_remapping(phdr)) {
1193 continue;
1194 }
1195
1196 uintptr_t seg_page_start = page_start(phdr->p_vaddr) + load_bias;
1197 uintptr_t seg_page_end = page_end(phdr->p_vaddr + phdr->p_memsz) + load_bias;
1198 size_t seg_page_aligned_size = seg_page_end - seg_page_start;
1199
1200 int prot = PFLAGS_TO_PROT(phdr->p_flags);
1201 // For anonymous private mappings, it may be possible to simply mprotect()
1202 // the PROT_MTE flag over the top. For file-based mappings, this will fail,
1203 // and we'll need to fall back. We also allow PROT_WRITE here to allow
1204 // writing memory tags (in `soinfo::tag_globals()`), and set these sections
1205 // back to read-only after tags are applied (similar to RELRO).
1206 prot |= PROT_MTE;
1207 if (mprotect(reinterpret_cast<void*>(seg_page_start), seg_page_aligned_size,
1208 prot | PROT_WRITE) == 0) {
1209 continue;
1210 }
1211
1212 void* mapping_copy = mmap(nullptr, seg_page_aligned_size, PROT_READ | PROT_WRITE,
1213 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
    if (mapping_copy == MAP_FAILED) return -1;  // Bail out before copying through a failed mapping.
1214 linker_memcpy(mapping_copy, reinterpret_cast<void*>(seg_page_start), seg_page_aligned_size);
1215
1216 void* seg_addr = mmap(reinterpret_cast<void*>(seg_page_start), seg_page_aligned_size,
1217 prot | PROT_WRITE, MAP_FIXED | MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
1218 if (seg_addr == MAP_FAILED) return -1;
1219
1220 linker_memcpy(seg_addr, mapping_copy, seg_page_aligned_size);
1221 munmap(mapping_copy, seg_page_aligned_size);
1222 }
1223#endif // defined(__aarch64__)
1224 return 0;
1225}
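// Illustrative call sequence, inferred from the comments above
// (soinfo::tag_globals() is the tagging step they reference):
//   1. remap_memtag_globals_segments()      - data segments gain PROT_MTE
//                                             (plus temporary PROT_WRITE);
//   2. soinfo::tag_globals()                - memory tags are written over
//                                             the tagged globals;
//   3. protect_memtag_globals_ro_segments() - read-only data returns to RO,
//                                             keeping PROT_MTE (like RELRO).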
1226
1227void protect_memtag_globals_ro_segments(const ElfW(Phdr) * phdr_table __unused,
1228 size_t phdr_count __unused, ElfW(Addr) load_bias __unused) {
1229#if defined(__aarch64__)
1230 for (const ElfW(Phdr)* phdr = phdr_table; phdr < phdr_table + phdr_count; phdr++) {
1231 int prot = PFLAGS_TO_PROT(phdr->p_flags);
1232 if (!segment_needs_memtag_globals_remapping(phdr) || (prot & PROT_WRITE)) {
1233 continue;
1234 }
1235
1236 prot |= PROT_MTE;
1237
1238 uintptr_t seg_page_start = page_start(phdr->p_vaddr) + load_bias;
1239 uintptr_t seg_page_end = page_end(phdr->p_vaddr + phdr->p_memsz) + load_bias;
1240 size_t seg_page_aligned_size = seg_page_end - seg_page_start;
1241 mprotect(reinterpret_cast<void*>(seg_page_start), seg_page_aligned_size, prot);
1242 }
1243#endif // defined(__aarch64__)
1244}
1245
1246void name_memtag_globals_segments(const ElfW(Phdr) * phdr_table, size_t phdr_count,
1247 ElfW(Addr) load_bias, const char* soname,
1248 std::list<std::string>* vma_names) {
1249 for (const ElfW(Phdr)* phdr = phdr_table; phdr < phdr_table + phdr_count; phdr++) {
1250 if (!segment_needs_memtag_globals_remapping(phdr)) {
1251 continue;
1252 }
1253
1254 uintptr_t seg_page_start = page_start(phdr->p_vaddr) + load_bias;
1255 uintptr_t seg_page_end = page_end(phdr->p_vaddr + phdr->p_memsz) + load_bias;
1256 size_t seg_page_aligned_size = seg_page_end - seg_page_start;
1257
1258 // For file-based mappings that we're now forcing to be anonymous mappings, set the VMA name to
1259 // make debugging easier.
1260 // Once we are targeting only devices that run kernel 5.10 or newer (and thus include
1261 // https://android-review.git.corp.google.com/c/kernel/common/+/1934723 which causes the
1262 // VMA_ANON_NAME to be copied into the kernel), we can get rid of the storage here.
1263 // For now, that is not the case:
1264 // https://source.android.com/docs/core/architecture/kernel/android-common#compatibility-matrix
1265 constexpr int kVmaNameLimit = 80;
1266 std::string& vma_name = vma_names->emplace_back(kVmaNameLimit, '\0');
1267 int full_vma_length =
1268 async_safe_format_buffer(vma_name.data(), kVmaNameLimit, "mt:%s+%" PRIxPTR, soname,
1269 page_start(phdr->p_vaddr)) +
1270 /* include the null terminator */ 1;
1271 // There's an upper limit of 80 characters, including the null terminator, in the anonymous VMA
1272 // name. If we run over that limit, we end up truncating the segment offset and parts of the
1273 // DSO's name, starting on the right hand side of the basename. Because the basename is the most
1274 // important thing, chop off the soname from the left hand side first.
1275 //
1276 // Example (with '#' as the null terminator):
1277 // - "mt:/data/nativetest64/bionic-unit-tests/bionic-loader-test-libs/libdlext_test.so+e000#"
1278 // has a `full_vma_length` of 86.
1279 //
1280 // We need to left-truncate (86 - 80) 6 characters from the soname, plus the
1281 // `vma_truncation_prefix`, so 9 characters total.
1282 if (full_vma_length > kVmaNameLimit) {
1283 const char vma_truncation_prefix[] = "...";
1284 int soname_truncated_bytes =
1285 full_vma_length - kVmaNameLimit + sizeof(vma_truncation_prefix) - 1;
1286 async_safe_format_buffer(vma_name.data(), kVmaNameLimit, "mt:%s%s+%" PRIxPTR,
1287 vma_truncation_prefix, soname + soname_truncated_bytes,
1288 page_start(phdr->p_vaddr));
1289 }
1290 if (prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, reinterpret_cast<void*>(seg_page_start),
1291 seg_page_aligned_size, vma_name.data()) != 0) {
1292 DL_WARN("Failed to rename memtag global segment: %m");
1293 }
1294 }
1295}
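// Names set with PR_SET_VMA_ANON_NAME appear in /proc/<pid>/maps as
// "[anon:<name>]" -- e.g. "[anon:mt:libfoo.so+1000]" for a hypothetical
// libfoo.so -- which is what makes these now-anonymous MTE-globals mappings
// recognizable when debugging.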
1296
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001297/* Change the protection of all loaded segments in memory to writable.
1298 * This is useful before performing relocations. Once completed, you
1299 * will have to call phdr_table_protect_segments to restore the original
1300 * protection flags on all segments.
1301 *
1302 * Note that some writable segments can also have their content turned
1303 * to read-only by calling phdr_table_protect_gnu_relro. This is not
1304 * performed here.
1305 *
1306 * Input:
1307 * phdr_table -> program header table
1308 * phdr_count -> number of entries in the table
1309 * load_bias -> load bias
Kalesh Singh4084b552024-03-13 13:35:49 -07001310 * should_pad_segments -> Are segments extended to avoid gaps in the memory map
Kalesh Singhb23787f2024-09-05 08:22:06 +00001311 * should_use_16kib_app_compat -> Is the ELF being loaded in 16KiB app compat mode.
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001312 * Return:
Mitch Phillips117e45e2023-10-20 13:32:33 +00001313 * 0 on success, -1 on failure (error code in errno).
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001314 */
Kalesh Singhb23787f2024-09-05 08:22:06 +00001315int phdr_table_unprotect_segments(const ElfW(Phdr)* phdr_table, size_t phdr_count,
1316 ElfW(Addr) load_bias, bool should_pad_segments,
1317 bool should_use_16kib_app_compat) {
Kalesh Singh4084b552024-03-13 13:35:49 -07001318 return _phdr_table_set_load_prot(phdr_table, phdr_count, load_bias, PROT_WRITE,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001319 should_pad_segments, should_use_16kib_app_compat);
Dimitry Ivanov56be6ed2015-04-01 21:18:48 +00001320}
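// Illustrative sketch (not part of the linker source): how the protect and
// unprotect entry points are meant to pair up around relocation.
// apply_relocations() is a hypothetical stand-in for the linker's real
// relocation pass; the #if 0 keeps this out of the build.
#if 0
static bool relocate_and_seal(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                              ElfW(Addr) load_bias, bool should_pad_segments,
                              bool should_use_16kib_app_compat,
                              const GnuPropertySection* prop,
                              bool (*apply_relocations)()) {
  // Temporarily add PROT_WRITE (dropping PROT_EXEC) on read-only segments...
  if (phdr_table_unprotect_segments(phdr_table, phdr_count, load_bias,
                                    should_pad_segments, should_use_16kib_app_compat) == -1) {
    return false;
  }
  if (!apply_relocations()) {
    return false;
  }
  // ...restore the p_flags-derived protections (plus PROT_BTI where supported)...
  if (phdr_table_protect_segments(phdr_table, phdr_count, load_bias, should_pad_segments,
                                  should_use_16kib_app_compat, prop) == -1) {
    return false;
  }
  // ...and only then seal the PT_GNU_RELRO region read-only.
  return phdr_table_protect_gnu_relro(phdr_table, phdr_count, load_bias, should_pad_segments,
                                      should_use_16kib_app_compat) == 0;
}
#endif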
1321
Kalesh Singh702d9b02024-03-13 13:38:04 -07001322static inline void _extend_gnu_relro_prot_end(const ElfW(Phdr)* relro_phdr,
1323 const ElfW(Phdr)* phdr_table, size_t phdr_count,
1324 ElfW(Addr) load_bias, ElfW(Addr)* seg_page_end,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001325 bool should_pad_segments,
1326 bool should_use_16kib_app_compat) {
Kalesh Singh702d9b02024-03-13 13:38:04 -07001327 // Find the index and phdr of the LOAD containing the GNU_RELRO segment
1328 for (size_t index = 0; index < phdr_count; ++index) {
1329 const ElfW(Phdr)* phdr = &phdr_table[index];
1330
1331 if (phdr->p_type == PT_LOAD && phdr->p_vaddr == relro_phdr->p_vaddr) {
1332 // If the PT_GNU_RELRO mem size is not at least as large as the corresponding
1333 // LOAD segment mem size, we need to protect only a partial region of the
1334 // LOAD segment and therefore cannot avoid a VMA split.
1335 //
1336 // Note: Don't check the page-aligned mem sizes since the extended protection
1337 // may incorrectly write protect non-relocation data.
1338 //
1339 // Example:
1340 //
1341 // |---- 3K ----|-- 1K --|---- 3K ---- |-- 1K --|
1342 // ----------------------------------------------------------------
1343 // | | | | |
1344 // SEG X | RO | RO | RW | | SEG Y
1345 // | | | | |
1346 // ----------------------------------------------------------------
1347 // | | |
1348 // | | |
1349 // | | |
1350 // relro_vaddr relro_vaddr relro_vaddr
1351 // (load_vaddr) + +
1352 // relro_memsz load_memsz
1353 //
1354 // ----------------------------------------------------------------
1355 // | PAGE | PAGE |
1356 // ----------------------------------------------------------------
1357 // | Potential |
1358 // |----- Extended RO ----|
1359 // | Protection |
1360 //
1361 // If the check below uses page aligned mem sizes it will cause incorrect write
1362 // protection of the 3K RW part of the LOAD segment containing the GNU_RELRO.
1363 if (relro_phdr->p_memsz < phdr->p_memsz) {
1364 return;
1365 }
1366
1367 ElfW(Addr) p_memsz = phdr->p_memsz;
1368 ElfW(Addr) p_filesz = phdr->p_filesz;
1369
1370 // Attempt to extend the VMA (the mprotect range). Without extending the
1371 // range, mprotect would make read-only only part of the extended RW LOAD
1372 // segment, leaving behind an extra split RW VMA (the gap).
1373 _extend_load_segment_vma(phdr_table, phdr_count, index, &p_memsz, &p_filesz,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001374 should_pad_segments, should_use_16kib_app_compat);
Kalesh Singh702d9b02024-03-13 13:38:04 -07001375
1376 *seg_page_end = page_end(phdr->p_vaddr + p_memsz + load_bias);
1377 return;
1378 }
1379 }
1380}
1381
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001382/* Used internally by phdr_table_protect_gnu_relro and
1383 * phdr_table_unprotect_gnu_relro.
1384 */
Elliott Hughes0266ae52014-02-10 17:46:57 -08001385static int _phdr_table_set_gnu_relro_prot(const ElfW(Phdr)* phdr_table, size_t phdr_count,
Kalesh Singh702d9b02024-03-13 13:38:04 -07001386 ElfW(Addr) load_bias, int prot_flags,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001387 bool should_pad_segments,
1388 bool should_use_16kib_app_compat) {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001389 const ElfW(Phdr)* phdr = phdr_table;
1390 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001391
Elliott Hughes0266ae52014-02-10 17:46:57 -08001392 for (phdr = phdr_table; phdr < phdr_limit; phdr++) {
1393 if (phdr->p_type != PT_GNU_RELRO) {
1394 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001395 }
Elliott Hughes0266ae52014-02-10 17:46:57 -08001396
1397 // Tricky: what happens when the relro segment does not start
1398 // or end at page boundaries? We're going to be over-protective
1399 // here and mark every page touched by the segment as read-only.
1400
1401 // This seems to match Ian Lance Taylor's description of the
1402 // feature at http://www.airs.com/blog/archives/189.
1403
1404 // Extract:
1405 // Note that the current dynamic linker code will only work
1406 // correctly if the PT_GNU_RELRO segment starts on a page
1407 // boundary. This is because the dynamic linker rounds the
1408 // p_vaddr field down to the previous page boundary. If
1409 // there is anything on the page which should not be read-only,
1410 // the program is likely to fail at runtime. So in effect the
1411 // linker must only emit a PT_GNU_RELRO segment if it ensures
1412 // that it starts on a page boundary.
Zheng Pan9535c322024-02-14 00:04:10 +00001413 ElfW(Addr) seg_page_start = page_start(phdr->p_vaddr) + load_bias;
1414 ElfW(Addr) seg_page_end = page_end(phdr->p_vaddr + phdr->p_memsz) + load_bias;
Kalesh Singh702d9b02024-03-13 13:38:04 -07001415 _extend_gnu_relro_prot_end(phdr, phdr_table, phdr_count, load_bias, &seg_page_end,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001416 should_pad_segments, should_use_16kib_app_compat);
Elliott Hughes0266ae52014-02-10 17:46:57 -08001417
Elliott Hughesfaf05ba2014-02-11 16:59:37 -08001418 int ret = mprotect(reinterpret_cast<void*>(seg_page_start),
Elliott Hughes0266ae52014-02-10 17:46:57 -08001419 seg_page_end - seg_page_start,
1420 prot_flags);
1421 if (ret < 0) {
1422 return -1;
1423 }
1424 }
1425 return 0;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001426}
1427
1428/* Apply GNU relro protection if specified by the program header. This will
1429 * turn some of the pages of a writable PT_LOAD segment to read-only, as
1430 * specified by one or more PT_GNU_RELRO segments. This must be always
1431 * performed after relocations.
1432 *
Ard Biesheuvel12c78bb2012-08-14 12:30:09 +02001433 * The areas typically covered are .got and .data.rel.ro; these are
1434 * read-only from the program's POV, but contain absolute addresses
1435 * that need to be relocated before use.
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001436 *
1437 * Input:
1438 * phdr_table -> program header table
Elliott Hughes105bc262012-08-15 16:56:00 -07001439 * phdr_count -> number of entries in the table
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001440 * load_bias -> load bias
Kalesh Singh702d9b02024-03-13 13:38:04 -07001441 * should_pad_segments -> Were segments extended to avoid gaps in the memory map
Kalesh Singhb23787f2024-09-05 08:22:06 +00001442 * should_use_16kib_app_compat -> Is the ELF being loaded in 16KiB app compat mode.
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001443 * Return:
Mitch Phillips117e45e2023-10-20 13:32:33 +00001444 * 0 on success, -1 on failure (error code in errno).
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001445 */
Kalesh Singh702d9b02024-03-13 13:38:04 -07001446int phdr_table_protect_gnu_relro(const ElfW(Phdr)* phdr_table, size_t phdr_count,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001447 ElfW(Addr) load_bias, bool should_pad_segments,
1448 bool should_use_16kib_app_compat) {
Kalesh Singh702d9b02024-03-13 13:38:04 -07001449 return _phdr_table_set_gnu_relro_prot(phdr_table, phdr_count, load_bias, PROT_READ,
Kalesh Singhb23787f2024-09-05 08:22:06 +00001450 should_pad_segments, should_use_16kib_app_compat);
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001451}
1452
Kalesh Singhce1c3cf2024-09-30 13:26:23 -07001453/*
1454 * Apply RX protection to the compat relro region of the ELF being loaded in
1455 * 16KiB compat mode.
1456 *
1457 * Input:
1458 * start -> start address of the compat relro region.
1459 * size -> size of the compat relro region in bytes.
1460 * Return:
1461 * 0 on success, -1 on failure (error code in errno).
1462 */
1463int phdr_table_protect_gnu_relro_16kib_compat(ElfW(Addr) start, ElfW(Addr) size) {
1464 return mprotect(reinterpret_cast<void*>(start), size, PROT_READ | PROT_EXEC);
1465}
1466
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001467/* Serialize the GNU relro segments to the given file descriptor. This can be
1468 * performed after relocations to allow another process to later share the
1469 * relocated segment, if it was loaded at the same address.
1470 *
1471 * Input:
1472 * phdr_table -> program header table
1473 * phdr_count -> number of entries in the table
1474 * load_bias -> load bias
1475 * fd -> writable file descriptor to use
Torne (Richard Coles)fa9f7f22019-04-02 17:04:42 -04001476 * file_offset -> pointer to offset into file descriptor to use/update
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001477 * Return:
Mitch Phillips117e45e2023-10-20 13:32:33 +00001478 * 0 on success, -1 on failure (error code in errno).
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001479 */
Dmitriy Ivanov20d89cb2015-03-30 18:43:38 -07001480int phdr_table_serialize_gnu_relro(const ElfW(Phdr)* phdr_table,
1481 size_t phdr_count,
1482 ElfW(Addr) load_bias,
Torne (Richard Coles)fa9f7f22019-04-02 17:04:42 -04001483 int fd,
1484 size_t* file_offset) {
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001485 const ElfW(Phdr)* phdr = phdr_table;
1486 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001487
1488 for (phdr = phdr_table; phdr < phdr_limit; phdr++) {
1489 if (phdr->p_type != PT_GNU_RELRO) {
1490 continue;
1491 }
1492
Peter Collingbournebb11ee62022-05-02 12:26:16 -07001493 ElfW(Addr) seg_page_start = page_start(phdr->p_vaddr) + load_bias;
1494 ElfW(Addr) seg_page_end = page_end(phdr->p_vaddr + phdr->p_memsz) + load_bias;
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001495 ssize_t size = seg_page_end - seg_page_start;
1496
1497 ssize_t written = TEMP_FAILURE_RETRY(write(fd, reinterpret_cast<void*>(seg_page_start), size));
1498 if (written != size) {
1499 return -1;
1500 }
1501 void* map = mmap(reinterpret_cast<void*>(seg_page_start), size, PROT_READ,
Torne (Richard Coles)fa9f7f22019-04-02 17:04:42 -04001502 MAP_PRIVATE|MAP_FIXED, fd, *file_offset);
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001503 if (map == MAP_FAILED) {
1504 return -1;
1505 }
Torne (Richard Coles)fa9f7f22019-04-02 17:04:42 -04001506 *file_offset += size;
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001507 }
1508 return 0;
1509}
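// Illustrative sketch of the producer side of RELRO sharing: hypothetical
// path, minimal error handling, and <fcntl.h> would be needed for open().
// Kept out of the build with #if 0.
#if 0
static bool write_relro_file(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                             ElfW(Addr) load_bias) {
  int fd = TEMP_FAILURE_RETRY(open("/data/local/tmp/libfoo.relro",
                                   O_RDWR | O_CREAT | O_TRUNC, 0600));
  if (fd == -1) return false;
  size_t file_offset = 0;
  // Writes each PT_GNU_RELRO region out, then remaps it read-only from the file.
  bool ok = phdr_table_serialize_gnu_relro(phdr_table, phdr_count, load_bias,
                                           fd, &file_offset) == 0;
  close(fd);
  return ok;
}
#endif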
1510
1511/* Where possible, replace the GNU relro segments with mappings of the given
1512 * file descriptor. This can be performed after relocations to allow a file
1513 * previously created by phdr_table_serialize_gnu_relro in another process to
1514 * replace the dirty relocated pages, saving memory, if it was loaded at the
1515 * same address. We have to compare the data before we map over it, since some
1516 * parts of the relro segment may not be identical due to other libraries in
1517 * the process being loaded at different addresses.
1518 *
1519 * Input:
1520 * phdr_table -> program header table
1521 * phdr_count -> number of entries in the table
1522 * load_bias -> load bias
1523 * fd -> readable file descriptor to use
Torne (Richard Coles)efbe9a52018-10-17 15:59:38 -04001524 * file_offset -> pointer to offset into file descriptor to use/update
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001525 * Return:
Mitch Phillips117e45e2023-10-20 13:32:33 +00001526 * 0 on success, -1 on failure (error code in errno).
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001527 */
Dmitriy Ivanov20d89cb2015-03-30 18:43:38 -07001528int phdr_table_map_gnu_relro(const ElfW(Phdr)* phdr_table,
1529 size_t phdr_count,
1530 ElfW(Addr) load_bias,
Torne (Richard Coles)efbe9a52018-10-17 15:59:38 -04001531 int fd,
1532 size_t* file_offset) {
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001533 // Map the file at a temporary location so we can compare its contents.
1534 struct stat file_stat;
1535 if (TEMP_FAILURE_RETRY(fstat(fd, &file_stat)) != 0) {
1536 return -1;
1537 }
1538 off_t file_size = file_stat.st_size;
Dmitriy Ivanov851135b2014-08-29 12:02:36 -07001539 void* temp_mapping = nullptr;
Torne (Richard Coles)26ec9672014-04-30 15:48:40 +01001540 if (file_size > 0) {
Dmitriy Ivanov851135b2014-08-29 12:02:36 -07001541 temp_mapping = mmap(nullptr, file_size, PROT_READ, MAP_PRIVATE, fd, 0);
Torne (Richard Coles)26ec9672014-04-30 15:48:40 +01001542 if (temp_mapping == MAP_FAILED) {
1543 return -1;
1544 }
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001545 }
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001546
1547 // Iterate over the relro segments and compare/remap the pages.
1548 const ElfW(Phdr)* phdr = phdr_table;
1549 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
1550
1551 for (phdr = phdr_table; phdr < phdr_limit; phdr++) {
1552 if (phdr->p_type != PT_GNU_RELRO) {
1553 continue;
1554 }
1555
Peter Collingbournebb11ee62022-05-02 12:26:16 -07001556 ElfW(Addr) seg_page_start = page_start(phdr->p_vaddr) + load_bias;
1557 ElfW(Addr) seg_page_end = page_end(phdr->p_vaddr + phdr->p_memsz) + load_bias;
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001558
Torne (Richard Coles)efbe9a52018-10-17 15:59:38 -04001559 char* file_base = static_cast<char*>(temp_mapping) + *file_offset;
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001560 char* mem_base = reinterpret_cast<char*>(seg_page_start);
1561 size_t match_offset = 0;
1562 size_t size = seg_page_end - seg_page_start;
1563
Torne (Richard Coles)efbe9a52018-10-17 15:59:38 -04001564 if (file_size - *file_offset < size) {
Torne (Richard Coles)26ec9672014-04-30 15:48:40 +01001565 // File is too short to compare to this segment. The contents are likely
1566 // different as well (it's probably for a different library version) so
1567 // just don't bother checking.
1568 break;
1569 }
1570
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001571 while (match_offset < size) {
1572 // Skip over dissimilar pages.
1573 while (match_offset < size &&
Peter Collingbournebb11ee62022-05-02 12:26:16 -07001574 memcmp(mem_base + match_offset, file_base + match_offset, page_size()) != 0) {
1575 match_offset += page_size();
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001576 }
1577
1578 // Count similar pages.
1579 size_t mismatch_offset = match_offset;
1580 while (mismatch_offset < size &&
Peter Collingbournebb11ee62022-05-02 12:26:16 -07001581 memcmp(mem_base + mismatch_offset, file_base + mismatch_offset, page_size()) == 0) {
1582 mismatch_offset += page_size();
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001583 }
1584
1585 // Map over similar pages.
1586 if (mismatch_offset > match_offset) {
1587 void* map = mmap(mem_base + match_offset, mismatch_offset - match_offset,
Torne (Richard Coles)efbe9a52018-10-17 15:59:38 -04001588 PROT_READ, MAP_PRIVATE|MAP_FIXED, fd, *file_offset + match_offset);
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001589 if (map == MAP_FAILED) {
1590 munmap(temp_mapping, file_size);
1591 return -1;
1592 }
1593 }
1594
1595 match_offset = mismatch_offset;
1596 }
1597
1598 // Add to the base file offset in case there are multiple relro segments.
Torne (Richard Coles)efbe9a52018-10-17 15:59:38 -04001599 *file_offset += size;
Torne (Richard Coles)183ad9d2014-02-27 13:18:00 +00001600 }
1601 munmap(temp_mapping, file_size);
1602 return 0;
1603}
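// Illustrative sketch of the consumer side: a process that loaded the same
// library at the same address replaces its dirty RELRO pages with clean,
// file-backed ones. Same caveats as the producer sketch above.
#if 0
static bool adopt_relro_file(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                             ElfW(Addr) load_bias) {
  int fd = TEMP_FAILURE_RETRY(open("/data/local/tmp/libfoo.relro", O_RDONLY));
  if (fd == -1) return false;
  size_t file_offset = 0;
  bool ok = phdr_table_map_gnu_relro(phdr_table, phdr_count, load_bias,
                                     fd, &file_offset) == 0;
  close(fd);
  return ok;
}
#endif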
1604
1605
Elliott Hughes4eeb1f12013-10-25 17:38:02 -07001606#if defined(__arm__)
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001607/* Return the address and size of the .ARM.exidx section in memory,
1608 * if present.
1609 *
1610 * Input:
1611 * phdr_table -> program header table
Elliott Hughes105bc262012-08-15 16:56:00 -07001612 * phdr_count -> number of entries in the table
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001613 * load_bias -> load bias
1614 * Output:
Dmitriy Ivanov851135b2014-08-29 12:02:36 -07001615 * arm_exidx -> address of table in memory (null on failure).
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001616 * arm_exidx_count -> number of items in table (0 on failure).
1617 * Return:
Mitch Phillips117e45e2023-10-20 13:32:33 +00001618 * 0 on success, -1 on failure (_no_ error code in errno)
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001619 */
Elliott Hughes0266ae52014-02-10 17:46:57 -08001620int phdr_table_get_arm_exidx(const ElfW(Phdr)* phdr_table, size_t phdr_count,
1621 ElfW(Addr) load_bias,
Dmitriy Ivanov1649e7e2015-01-22 16:04:25 -08001622 ElfW(Addr)** arm_exidx, size_t* arm_exidx_count) {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001623 const ElfW(Phdr)* phdr = phdr_table;
1624 const ElfW(Phdr)* phdr_limit = phdr + phdr_count;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001625
Elliott Hughes0266ae52014-02-10 17:46:57 -08001626 for (phdr = phdr_table; phdr < phdr_limit; phdr++) {
1627 if (phdr->p_type != PT_ARM_EXIDX) {
1628 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001629 }
Elliott Hughes0266ae52014-02-10 17:46:57 -08001630
1631 *arm_exidx = reinterpret_cast<ElfW(Addr)*>(load_bias + phdr->p_vaddr);
Dmitriy Ivanov1649e7e2015-01-22 16:04:25 -08001632 *arm_exidx_count = phdr->p_memsz / 8;
Elliott Hughes0266ae52014-02-10 17:46:57 -08001633 return 0;
1634 }
Dmitriy Ivanov851135b2014-08-29 12:02:36 -07001635 *arm_exidx = nullptr;
Elliott Hughes0266ae52014-02-10 17:46:57 -08001636 *arm_exidx_count = 0;
1637 return -1;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001638}
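// Illustrative sketch: how a caller might wrap this lookup for the 32-bit
// ARM unwinder; `si` stands in for a soinfo with the usual phdr/phnum/
// load_bias fields. Kept out of the build with #if 0.
#if 0
static ElfW(Addr)* exidx_for_soinfo(soinfo* si, size_t* count) {
  ElfW(Addr)* exidx = nullptr;
  // On failure the callee already nulls the table pointer and zeroes the count.
  phdr_table_get_arm_exidx(si->phdr, si->phnum, si->load_bias, &exidx, count);
  return exidx;
}
#endif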
Elliott Hughes4eeb1f12013-10-25 17:38:02 -07001639#endif
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001640
Ard Biesheuvel12c78bb2012-08-14 12:30:09 +02001641/* Return the address and size of the ELF file's .dynamic section in memory,
Dmitriy Ivanov851135b2014-08-29 12:02:36 -07001642 * or null if missing.
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001643 *
1644 * Input:
1645 * phdr_table -> program header table
Elliott Hughes105bc262012-08-15 16:56:00 -07001646 * phdr_count -> number of entries in the table
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001647 * load_bias -> load bias
Ard Biesheuvel12c78bb2012-08-14 12:30:09 +02001648 * Output:
Dmitriy Ivanov851135b2014-08-29 12:02:36 -07001649 * dynamic -> address of table in memory (null on failure).
Ningsheng Jiane93be992014-09-16 15:22:10 +08001650 * dynamic_flags -> protection flags for section (unset on failure)
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001651 * Return:
Ard Biesheuvel12c78bb2012-08-14 12:30:09 +02001652 * void
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001653 */
Elliott Hughes0266ae52014-02-10 17:46:57 -08001654void phdr_table_get_dynamic_section(const ElfW(Phdr)* phdr_table, size_t phdr_count,
Ningsheng Jiane93be992014-09-16 15:22:10 +08001655 ElfW(Addr) load_bias, ElfW(Dyn)** dynamic,
1656 ElfW(Word)* dynamic_flags) {
Dmitriy Ivanov498eb182014-09-05 14:57:59 -07001657 *dynamic = nullptr;
Dmitriy Ivanov20d89cb2015-03-30 18:43:38 -07001658 for (size_t i = 0; i<phdr_count; ++i) {
1659 const ElfW(Phdr)& phdr = phdr_table[i];
1660 if (phdr.p_type == PT_DYNAMIC) {
1661 *dynamic = reinterpret_cast<ElfW(Dyn)*>(load_bias + phdr.p_vaddr);
Ningsheng Jiane93be992014-09-16 15:22:10 +08001662 if (dynamic_flags) {
Dmitriy Ivanov20d89cb2015-03-30 18:43:38 -07001663 *dynamic_flags = phdr.p_flags;
Ningsheng Jiane93be992014-09-16 15:22:10 +08001664 }
Dmitriy Ivanov14669a92014-09-05 16:42:53 -07001665 return;
1666 }
Elliott Hughes0266ae52014-02-10 17:46:57 -08001667 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001668}
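// Illustrative sketch: walking the table returned above until DT_NULL, the
// standard terminator for PT_DYNAMIC. DT_SONAME is an offset into the string
// table located via DT_STRTAB; adding load_bias mirrors what the linker does
// with unrelocated d_ptr values. Kept out of the build with #if 0.
#if 0
static const char* soname_from_dynamic(const ElfW(Phdr)* phdr_table, size_t phdr_count,
                                       ElfW(Addr) load_bias) {
  ElfW(Dyn)* dynamic = nullptr;
  phdr_table_get_dynamic_section(phdr_table, phdr_count, load_bias, &dynamic, nullptr);
  if (dynamic == nullptr) return nullptr;
  const char* strtab = nullptr;
  const ElfW(Dyn)* soname = nullptr;
  for (const ElfW(Dyn)* d = dynamic; d->d_tag != DT_NULL; ++d) {
    if (d->d_tag == DT_STRTAB) strtab = reinterpret_cast<const char*>(load_bias + d->d_un.d_ptr);
    if (d->d_tag == DT_SONAME) soname = d;
  }
  return (strtab != nullptr && soname != nullptr) ? strtab + soname->d_un.d_val : nullptr;
}
#endif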
1669
Evgenii Stepanovd640b222015-07-10 17:54:01 -07001670/* Return the program interpreter string, or nullptr if missing.
1671 *
1672 * Input:
1673 * phdr_table -> program header table
1674 * phdr_count -> number of entries in the table
1675 * load_bias -> load bias
1676 * Return:
1677 * pointer to the program interpreter string.
1678 */
Tamas Petz8d55d182020-02-24 14:15:25 +01001679const char* phdr_table_get_interpreter_name(const ElfW(Phdr)* phdr_table, size_t phdr_count,
Evgenii Stepanovd640b222015-07-10 17:54:01 -07001680 ElfW(Addr) load_bias) {
1681 for (size_t i = 0; i<phdr_count; ++i) {
1682 const ElfW(Phdr)& phdr = phdr_table[i];
1683 if (phdr.p_type == PT_INTERP) {
1684 return reinterpret_cast<const char*>(load_bias + phdr.p_vaddr);
1685 }
1686 }
1687 return nullptr;
1688}
1689
Robert Grosse4544d9f2014-10-15 14:32:19 -07001690// Sets loaded_phdr_ to the address of the program header table as it appears
1691// in the loaded segments in memory. This is in contrast with phdr_table_,
1692// which is temporary and will be released before the library is relocated.
Elliott Hughes650be4e2013-03-05 18:47:58 -08001693bool ElfReader::FindPhdr() {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001694 const ElfW(Phdr)* phdr_limit = phdr_table_ + phdr_num_;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001695
Elliott Hughes650be4e2013-03-05 18:47:58 -08001696 // If there is a PT_PHDR, use it directly.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001697 for (const ElfW(Phdr)* phdr = phdr_table_; phdr < phdr_limit; ++phdr) {
Elliott Hughes650be4e2013-03-05 18:47:58 -08001698 if (phdr->p_type == PT_PHDR) {
1699 return CheckPhdr(load_bias_ + phdr->p_vaddr);
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001700 }
Elliott Hughes650be4e2013-03-05 18:47:58 -08001701 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001702
Elliott Hughes650be4e2013-03-05 18:47:58 -08001703 // Otherwise, check the first loadable segment. If its file offset
1704 // is 0, it starts with the ELF header, and we can trivially find the
1705 // loaded program header from it.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001706 for (const ElfW(Phdr)* phdr = phdr_table_; phdr < phdr_limit; ++phdr) {
Elliott Hughes650be4e2013-03-05 18:47:58 -08001707 if (phdr->p_type == PT_LOAD) {
1708 if (phdr->p_offset == 0) {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001709 ElfW(Addr) elf_addr = load_bias_ + phdr->p_vaddr;
Elliott Hughesfaf05ba2014-02-11 16:59:37 -08001710 const ElfW(Ehdr)* ehdr = reinterpret_cast<const ElfW(Ehdr)*>(elf_addr);
Elliott Hughes0266ae52014-02-10 17:46:57 -08001711 ElfW(Addr) offset = ehdr->e_phoff;
Dmitriy Ivanov1649e7e2015-01-22 16:04:25 -08001712 return CheckPhdr(reinterpret_cast<ElfW(Addr)>(ehdr) + offset);
Elliott Hughes650be4e2013-03-05 18:47:58 -08001713 }
1714 break;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001715 }
Elliott Hughes650be4e2013-03-05 18:47:58 -08001716 }
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001717
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -07001718 DL_ERR("can't find loaded phdr for \"%s\"", name_.c_str());
Elliott Hughes650be4e2013-03-05 18:47:58 -08001719 return false;
1720}
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001721
Tamas Petz8d55d182020-02-24 14:15:25 +01001722// Tries to find the .note.gnu.property section.
1723// It is not considered an error if the section is missing.
1724bool ElfReader::FindGnuPropertySection() {
1725#if defined(__aarch64__)
1726 note_gnu_property_ = GnuPropertySection(phdr_table_, phdr_num_, load_start(), name_.c_str());
1727#endif
1728 return true;
1729}
1730
Elliott Hughes650be4e2013-03-05 18:47:58 -08001731// Ensures that our program header is actually within a loadable
1732// segment. This should help catch badly-formed ELF files that
1733// would cause the linker to crash later when trying to access it.
Elliott Hughes0266ae52014-02-10 17:46:57 -08001734bool ElfReader::CheckPhdr(ElfW(Addr) loaded) {
1735 const ElfW(Phdr)* phdr_limit = phdr_table_ + phdr_num_;
1736 ElfW(Addr) loaded_end = loaded + (phdr_num_ * sizeof(ElfW(Phdr)));
Dmitriy Ivanovcf1cbbe2015-10-19 16:57:46 -07001737 for (const ElfW(Phdr)* phdr = phdr_table_; phdr < phdr_limit; ++phdr) {
Elliott Hughes650be4e2013-03-05 18:47:58 -08001738 if (phdr->p_type != PT_LOAD) {
1739 continue;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001740 }
Elliott Hughes0266ae52014-02-10 17:46:57 -08001741 ElfW(Addr) seg_start = phdr->p_vaddr + load_bias_;
1742 ElfW(Addr) seg_end = phdr->p_filesz + seg_start;
Elliott Hughes650be4e2013-03-05 18:47:58 -08001743 if (seg_start <= loaded && loaded_end <= seg_end) {
Elliott Hughes0266ae52014-02-10 17:46:57 -08001744 loaded_phdr_ = reinterpret_cast<const ElfW(Phdr)*>(loaded);
Elliott Hughes650be4e2013-03-05 18:47:58 -08001745 return true;
1746 }
1747 }
Dmitriy Ivanov4f7a7ad2015-10-15 12:07:25 -07001748 DL_ERR("\"%s\" loaded phdr %p not in loadable segment",
1749 name_.c_str(), reinterpret_cast<void*>(loaded));
Elliott Hughes650be4e2013-03-05 18:47:58 -08001750 return false;
David 'Digit' Turnerc1bd5592012-06-19 11:21:29 +02001751}