]>
Commit | Line | Data |
---|---|---|
d696c285 A |
1 | /* -*- mode: C++; c-basic-offset: 4; tab-width: 4 -*- |
2 | * | |
a645023d | 3 | * Copyright (c) 2006-2010 Apple Inc. All rights reserved. |
d696c285 A |
4 | * |
5 | * @APPLE_LICENSE_HEADER_START@ | |
6 | * | |
7 | * This file contains Original Code and/or Modifications of Original Code | |
8 | * as defined in and that are subject to the Apple Public Source License | |
9 | * Version 2.0 (the 'License'). You may not use this file except in | |
10 | * compliance with the License. Please obtain a copy of the License at | |
11 | * http://www.opensource.apple.com/apsl/ and read it before using this | |
12 | * file. | |
13 | * | |
14 | * The Original Code and all software distributed under the License are | |
15 | * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER | |
16 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, | |
17 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, | |
18 | * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. | |
19 | * Please see the License for the specific language governing rights and | |
20 | * limitations under the License. | |
21 | * | |
22 | * @APPLE_LICENSE_HEADER_END@ | |
23 | */ | |
24 | ||
25 | #include <sys/types.h> | |
26 | #include <sys/stat.h> | |
27 | #include <sys/mman.h> | |
28 | #include <stdarg.h> | |
29 | #include <stdio.h> | |
30 | #include <fcntl.h> | |
31 | #include <unistd.h> | |
55e3d2f6 | 32 | #include <errno.h> |
d696c285 A |
33 | |
34 | #include <vector> | |
a61fdf0a A |
35 | #include <set> |
36 | #include <ext/hash_set> | |
d696c285 A |
37 | |
38 | #include "MachOFileAbstraction.hpp" | |
39 | #include "Architectures.hpp" | |
40 | ||
41 | ||
//
// Formats a printf-style message into a heap allocated buffer and throws it
// as a 'const char*'.  Never returns.  The buffer is intentionally not freed
// here; ownership passes to whoever catches the exception.
//
// If the message cannot be formatted (vasprintf() reports failure), a fixed
// string literal is thrown instead, so the catcher never sees an
// indeterminate pointer.
//
__attribute__((noreturn))
void throwf(const char* format, ...)
{
	va_list	list;
	char*	p = NULL;
	va_start(list, format);
	const int length = vasprintf(&p, format, list);
	va_end(list);

	// on failure the contents of 'p' are not defined, so do not throw it
	if ( (length < 0) || (p == NULL) )
		throw "throwf: could not format error message";

	const char*	t = p;
	throw t;
}
54 | ||
a645023d A |
55 | static uint64_t read_uleb128(const uint8_t*& p, const uint8_t* end) |
56 | { | |
57 | uint64_t result = 0; | |
58 | int bit = 0; | |
59 | do { | |
60 | if (p == end) | |
61 | throwf("malformed uleb128"); | |
62 | ||
63 | uint64_t slice = *p & 0x7f; | |
64 | ||
65 | if (bit >= 64 || slice << bit >> bit != slice) | |
66 | throwf("uleb128 too big"); | |
67 | else { | |
68 | result |= (slice << bit); | |
69 | bit += 7; | |
70 | } | |
71 | } | |
72 | while (*p++ & 0x80); | |
73 | return result; | |
74 | } | |
d696c285 | 75 | |
afe874b1 A |
76 | |
77 | static int64_t read_sleb128(const uint8_t*& p, const uint8_t* end) | |
78 | { | |
79 | int64_t result = 0; | |
80 | int bit = 0; | |
81 | uint8_t byte; | |
82 | do { | |
83 | if (p == end) | |
84 | throwf("malformed sleb128"); | |
85 | byte = *p++; | |
86 | result |= ((byte & 0x7f) << bit); | |
87 | bit += 7; | |
88 | } while (byte & 0x80); | |
89 | // sign extend negative numbers | |
90 | if ( (byte & 0x40) != 0 ) | |
91 | result |= (-1LL) << bit; | |
92 | return result; | |
93 | } | |
94 | ||
95 | ||
d696c285 A |
96 | template <typename A> |
97 | class MachOChecker | |
98 | { | |
99 | public: | |
100 | static bool validFile(const uint8_t* fileContent); | |
101 | static MachOChecker<A>* make(const uint8_t* fileContent, uint32_t fileLength, const char* path) | |
102 | { return new MachOChecker<A>(fileContent, fileLength, path); } | |
103 | virtual ~MachOChecker() {} | |
104 | ||
105 | ||
106 | private: | |
107 | typedef typename A::P P; | |
108 | typedef typename A::P::E E; | |
109 | typedef typename A::P::uint_t pint_t; | |
110 | ||
a61fdf0a A |
111 | class CStringEquals |
112 | { | |
113 | public: | |
114 | bool operator()(const char* left, const char* right) const { return (strcmp(left, right) == 0); } | |
115 | }; | |
116 | ||
117 | typedef __gnu_cxx::hash_set<const char*, __gnu_cxx::hash<const char*>, CStringEquals> StringSet; | |
118 | ||
d696c285 A |
119 | MachOChecker(const uint8_t* fileContent, uint32_t fileLength, const char* path); |
120 | void checkMachHeader(); | |
121 | void checkLoadCommands(); | |
122 | void checkSection(const macho_segment_command<P>* segCmd, const macho_section<P>* sect); | |
123 | uint8_t loadCommandSizeMask(); | |
a61fdf0a | 124 | void checkSymbolTable(); |
afe874b1 | 125 | void checkInitTerms(); |
d696c285 | 126 | void checkIndirectSymbolTable(); |
69a49097 A |
127 | void checkRelocations(); |
128 | void checkExternalReloation(const macho_relocation_info<P>* reloc); | |
129 | void checkLocalReloation(const macho_relocation_info<P>* reloc); | |
130 | pint_t relocBase(); | |
131 | bool addressInWritableSegment(pint_t address); | |
a645023d A |
132 | bool hasTextRelocInRange(pint_t start, pint_t end); |
133 | pint_t segStartAddress(uint8_t segIndex); | |
afe874b1 A |
134 | bool addressIsRebaseSite(pint_t addr); |
135 | bool addressIsBindingSite(pint_t addr); | |
136 | pint_t getInitialStackPointer(const macho_thread_command<P>*); | |
137 | pint_t getEntryPoint(const macho_thread_command<P>*); | |
138 | ||
139 | ||
140 | ||
d696c285 A |
141 | const char* fPath; |
142 | const macho_header<P>* fHeader; | |
143 | uint32_t fLength; | |
144 | const char* fStrings; | |
145 | const char* fStringsEnd; | |
146 | const macho_nlist<P>* fSymbols; | |
147 | uint32_t fSymbolCount; | |
a61fdf0a | 148 | const macho_dysymtab_command<P>* fDynamicSymbolTable; |
d696c285 A |
149 | const uint32_t* fIndirectTable; |
150 | uint32_t fIndirectTableCount; | |
69a49097 A |
151 | const macho_relocation_info<P>* fLocalRelocations; |
152 | uint32_t fLocalRelocationsCount; | |
153 | const macho_relocation_info<P>* fExternalRelocations; | |
154 | uint32_t fExternalRelocationsCount; | |
69a49097 | 155 | bool fWriteableSegmentWithAddrOver4G; |
afe874b1 | 156 | bool fSlidableImage; |
69a49097 A |
157 | const macho_segment_command<P>* fFirstSegment; |
158 | const macho_segment_command<P>* fFirstWritableSegment; | |
afe874b1 | 159 | const macho_segment_command<P>* fTEXTSegment; |
a645023d | 160 | const macho_dyld_info_command<P>* fDyldInfo; |
c211e7c9 | 161 | uint32_t fSectionCount; |
a645023d | 162 | std::vector<const macho_segment_command<P>*>fSegments; |
d696c285 A |
163 | }; |
164 | ||
165 | ||
166 | ||
167 | template <> | |
168 | bool MachOChecker<ppc>::validFile(const uint8_t* fileContent) | |
169 | { | |
170 | const macho_header<P>* header = (const macho_header<P>*)fileContent; | |
171 | if ( header->magic() != MH_MAGIC ) | |
172 | return false; | |
173 | if ( header->cputype() != CPU_TYPE_POWERPC ) | |
174 | return false; | |
175 | switch (header->filetype()) { | |
176 | case MH_EXECUTE: | |
177 | case MH_DYLIB: | |
178 | case MH_BUNDLE: | |
179 | case MH_DYLINKER: | |
180 | return true; | |
181 | } | |
182 | return false; | |
183 | } | |
184 | ||
185 | template <> | |
186 | bool MachOChecker<ppc64>::validFile(const uint8_t* fileContent) | |
187 | { | |
188 | const macho_header<P>* header = (const macho_header<P>*)fileContent; | |
189 | if ( header->magic() != MH_MAGIC_64 ) | |
190 | return false; | |
191 | if ( header->cputype() != CPU_TYPE_POWERPC64 ) | |
192 | return false; | |
193 | switch (header->filetype()) { | |
194 | case MH_EXECUTE: | |
195 | case MH_DYLIB: | |
196 | case MH_BUNDLE: | |
197 | case MH_DYLINKER: | |
198 | return true; | |
199 | } | |
200 | return false; | |
201 | } | |
202 | ||
203 | template <> | |
204 | bool MachOChecker<x86>::validFile(const uint8_t* fileContent) | |
205 | { | |
206 | const macho_header<P>* header = (const macho_header<P>*)fileContent; | |
207 | if ( header->magic() != MH_MAGIC ) | |
208 | return false; | |
209 | if ( header->cputype() != CPU_TYPE_I386 ) | |
210 | return false; | |
211 | switch (header->filetype()) { | |
212 | case MH_EXECUTE: | |
213 | case MH_DYLIB: | |
214 | case MH_BUNDLE: | |
215 | case MH_DYLINKER: | |
216 | return true; | |
217 | } | |
218 | return false; | |
219 | } | |
220 | ||
69a49097 A |
221 | template <> |
222 | bool MachOChecker<x86_64>::validFile(const uint8_t* fileContent) | |
223 | { | |
224 | const macho_header<P>* header = (const macho_header<P>*)fileContent; | |
225 | if ( header->magic() != MH_MAGIC_64 ) | |
226 | return false; | |
227 | if ( header->cputype() != CPU_TYPE_X86_64 ) | |
228 | return false; | |
229 | switch (header->filetype()) { | |
230 | case MH_EXECUTE: | |
231 | case MH_DYLIB: | |
232 | case MH_BUNDLE: | |
233 | case MH_DYLINKER: | |
234 | return true; | |
235 | } | |
236 | return false; | |
237 | } | |
d696c285 | 238 | |
2f2f92e4 A |
239 | template <> |
240 | bool MachOChecker<arm>::validFile(const uint8_t* fileContent) | |
241 | { | |
242 | const macho_header<P>* header = (const macho_header<P>*)fileContent; | |
243 | if ( header->magic() != MH_MAGIC ) | |
244 | return false; | |
245 | if ( header->cputype() != CPU_TYPE_ARM ) | |
246 | return false; | |
247 | switch (header->filetype()) { | |
248 | case MH_EXECUTE: | |
249 | case MH_DYLIB: | |
250 | case MH_BUNDLE: | |
251 | case MH_DYLINKER: | |
252 | return true; | |
253 | } | |
254 | return false; | |
255 | } | |
d696c285 A |
256 | |
257 | template <> uint8_t MachOChecker<ppc>::loadCommandSizeMask() { return 0x03; } | |
258 | template <> uint8_t MachOChecker<ppc64>::loadCommandSizeMask() { return 0x07; } | |
259 | template <> uint8_t MachOChecker<x86>::loadCommandSizeMask() { return 0x03; } | |
69a49097 | 260 | template <> uint8_t MachOChecker<x86_64>::loadCommandSizeMask() { return 0x07; } |
2f2f92e4 | 261 | template <> uint8_t MachOChecker<arm>::loadCommandSizeMask() { return 0x03; } |
d696c285 | 262 | |
afe874b1 A |
263 | |
264 | template <> | |
265 | ppc::P::uint_t MachOChecker<ppc>::getInitialStackPointer(const macho_thread_command<ppc::P>* threadInfo) | |
266 | { | |
267 | return threadInfo->thread_register(3); | |
268 | } | |
269 | ||
270 | template <> | |
271 | ppc64::P::uint_t MachOChecker<ppc64>::getInitialStackPointer(const macho_thread_command<ppc64::P>* threadInfo) | |
272 | { | |
273 | return threadInfo->thread_register(3); | |
274 | } | |
275 | ||
276 | template <> | |
277 | x86::P::uint_t MachOChecker<x86>::getInitialStackPointer(const macho_thread_command<x86::P>* threadInfo) | |
278 | { | |
279 | return threadInfo->thread_register(7); | |
280 | } | |
281 | ||
282 | template <> | |
283 | x86_64::P::uint_t MachOChecker<x86_64>::getInitialStackPointer(const macho_thread_command<x86_64::P>* threadInfo) | |
284 | { | |
285 | return threadInfo->thread_register(7); | |
286 | } | |
287 | ||
288 | template <> | |
289 | arm::P::uint_t MachOChecker<arm>::getInitialStackPointer(const macho_thread_command<arm::P>* threadInfo) | |
290 | { | |
291 | return threadInfo->thread_register(13); | |
292 | } | |
293 | ||
294 | ||
295 | ||
296 | ||
297 | ||
298 | template <> | |
299 | ppc::P::uint_t MachOChecker<ppc>::getEntryPoint(const macho_thread_command<ppc::P>* threadInfo) | |
300 | { | |
301 | return threadInfo->thread_register(0); | |
302 | } | |
303 | ||
304 | template <> | |
305 | ppc64::P::uint_t MachOChecker<ppc64>::getEntryPoint(const macho_thread_command<ppc64::P>* threadInfo) | |
306 | { | |
307 | return threadInfo->thread_register(0); | |
308 | } | |
309 | ||
310 | template <> | |
311 | x86::P::uint_t MachOChecker<x86>::getEntryPoint(const macho_thread_command<x86::P>* threadInfo) | |
312 | { | |
313 | return threadInfo->thread_register(10); | |
314 | } | |
315 | ||
316 | template <> | |
317 | x86_64::P::uint_t MachOChecker<x86_64>::getEntryPoint(const macho_thread_command<x86_64::P>* threadInfo) | |
318 | { | |
319 | return threadInfo->thread_register(16); | |
320 | } | |
321 | ||
322 | template <> | |
323 | arm::P::uint_t MachOChecker<arm>::getEntryPoint(const macho_thread_command<arm::P>* threadInfo) | |
324 | { | |
325 | return threadInfo->thread_register(15); | |
326 | } | |
327 | ||
328 | ||
d696c285 A |
329 | template <typename A> |
330 | MachOChecker<A>::MachOChecker(const uint8_t* fileContent, uint32_t fileLength, const char* path) | |
a61fdf0a | 331 | : fHeader(NULL), fLength(fileLength), fStrings(NULL), fSymbols(NULL), fSymbolCount(0), fDynamicSymbolTable(NULL), fIndirectTableCount(0), |
69a49097 | 332 | fLocalRelocations(NULL), fLocalRelocationsCount(0), fExternalRelocations(NULL), fExternalRelocationsCount(0), |
afe874b1 A |
333 | fWriteableSegmentWithAddrOver4G(false), fSlidableImage(false), fFirstSegment(NULL), fFirstWritableSegment(NULL), |
334 | fTEXTSegment(NULL), fDyldInfo(NULL), fSectionCount(0) | |
d696c285 A |
335 | { |
336 | // sanity check | |
337 | if ( ! validFile(fileContent) ) | |
338 | throw "not a mach-o file that can be checked"; | |
339 | ||
340 | fPath = strdup(path); | |
341 | fHeader = (const macho_header<P>*)fileContent; | |
342 | ||
343 | // sanity check header | |
344 | checkMachHeader(); | |
345 | ||
346 | // check load commands | |
347 | checkLoadCommands(); | |
348 | ||
349 | checkIndirectSymbolTable(); | |
350 | ||
69a49097 | 351 | checkRelocations(); |
a61fdf0a A |
352 | |
353 | checkSymbolTable(); | |
afe874b1 A |
354 | |
355 | checkInitTerms(); | |
d696c285 A |
356 | } |
357 | ||
358 | ||
359 | template <typename A> | |
360 | void MachOChecker<A>::checkMachHeader() | |
361 | { | |
362 | if ( (fHeader->sizeofcmds() + sizeof(macho_header<P>)) > fLength ) | |
363 | throw "sizeofcmds in mach_header is larger than file"; | |
364 | ||
365 | uint32_t flags = fHeader->flags(); | |
a645023d | 366 | const uint32_t invalidBits = MH_INCRLINK | MH_LAZY_INIT | 0xFE000000; |
d696c285 A |
367 | if ( flags & invalidBits ) |
368 | throw "invalid bits in mach_header flags"; | |
a61fdf0a A |
369 | if ( (flags & MH_NO_REEXPORTED_DYLIBS) && (fHeader->filetype() != MH_DYLIB) ) |
370 | throw "MH_NO_REEXPORTED_DYLIBS bit of mach_header flags only valid for dylibs"; | |
afe874b1 A |
371 | |
372 | switch ( fHeader->filetype() ) { | |
373 | case MH_EXECUTE: | |
374 | fSlidableImage = ( flags & MH_PIE ); | |
375 | break; | |
376 | case MH_DYLIB: | |
377 | case MH_BUNDLE: | |
378 | fSlidableImage = true; | |
379 | break; | |
380 | default: | |
381 | throw "not a mach-o file type supported by this tool"; | |
382 | } | |
d696c285 A |
383 | } |
384 | ||
385 | template <typename A> | |
386 | void MachOChecker<A>::checkLoadCommands() | |
387 | { | |
388 | // check that all load commands fit within the load command space file | |
2f2f92e4 | 389 | const macho_encryption_info_command<P>* encryption_info = NULL; |
afe874b1 | 390 | const macho_thread_command<P>* threadInfo = NULL; |
d696c285 A |
391 | const uint8_t* const endOfFile = (uint8_t*)fHeader + fLength; |
392 | const uint8_t* const endOfLoadCommands = (uint8_t*)fHeader + sizeof(macho_header<P>) + fHeader->sizeofcmds(); | |
393 | const uint32_t cmd_count = fHeader->ncmds(); | |
394 | const macho_load_command<P>* const cmds = (macho_load_command<P>*)((uint8_t*)fHeader + sizeof(macho_header<P>)); | |
395 | const macho_load_command<P>* cmd = cmds; | |
396 | for (uint32_t i = 0; i < cmd_count; ++i) { | |
397 | uint32_t size = cmd->cmdsize(); | |
398 | if ( (size & this->loadCommandSizeMask()) != 0 ) | |
399 | throwf("load command #%d has a unaligned size", i); | |
400 | const uint8_t* endOfCmd = ((uint8_t*)cmd)+cmd->cmdsize(); | |
401 | if ( endOfCmd > endOfLoadCommands ) | |
402 | throwf("load command #%d extends beyond the end of the load commands", i); | |
403 | if ( endOfCmd > endOfFile ) | |
404 | throwf("load command #%d extends beyond the end of the file", i); | |
405 | switch ( cmd->cmd() ) { | |
406 | case macho_segment_command<P>::CMD: | |
407 | case LC_SYMTAB: | |
d696c285 A |
408 | case LC_DYSYMTAB: |
409 | case LC_LOAD_DYLIB: | |
410 | case LC_ID_DYLIB: | |
411 | case LC_LOAD_DYLINKER: | |
412 | case LC_ID_DYLINKER: | |
413 | case macho_routines_command<P>::CMD: | |
414 | case LC_SUB_FRAMEWORK: | |
d696c285 A |
415 | case LC_SUB_CLIENT: |
416 | case LC_TWOLEVEL_HINTS: | |
417 | case LC_PREBIND_CKSUM: | |
418 | case LC_LOAD_WEAK_DYLIB: | |
2f2f92e4 | 419 | case LC_LAZY_LOAD_DYLIB: |
d696c285 | 420 | case LC_UUID: |
a61fdf0a A |
421 | case LC_REEXPORT_DYLIB: |
422 | case LC_SEGMENT_SPLIT_INFO: | |
2f2f92e4 | 423 | case LC_CODE_SIGNATURE: |
a645023d A |
424 | case LC_LOAD_UPWARD_DYLIB: |
425 | case LC_VERSION_MIN_MACOSX: | |
426 | case LC_VERSION_MIN_IPHONEOS: | |
427 | case LC_FUNCTION_STARTS: | |
afe874b1 | 428 | case LC_RPATH: |
a645023d | 429 | break; |
55e3d2f6 A |
430 | case LC_DYLD_INFO: |
431 | case LC_DYLD_INFO_ONLY: | |
a645023d | 432 | fDyldInfo = (macho_dyld_info_command<P>*)cmd; |
2f2f92e4 A |
433 | break; |
434 | case LC_ENCRYPTION_INFO: | |
435 | encryption_info = (macho_encryption_info_command<P>*)cmd; | |
a61fdf0a A |
436 | break; |
437 | case LC_SUB_UMBRELLA: | |
438 | case LC_SUB_LIBRARY: | |
439 | if ( fHeader->flags() & MH_NO_REEXPORTED_DYLIBS ) | |
440 | throw "MH_NO_REEXPORTED_DYLIBS bit of mach_header flags should not be set in an image with LC_SUB_LIBRARY or LC_SUB_UMBRELLA"; | |
d696c285 | 441 | break; |
afe874b1 A |
442 | case LC_UNIXTHREAD: |
443 | if ( fHeader->filetype() != MH_EXECUTE ) | |
444 | throw "LC_UNIXTHREAD can only be used in MH_EXECUTE file types"; | |
445 | threadInfo = (macho_thread_command<P>*)cmd; | |
446 | break; | |
d696c285 A |
447 | default: |
448 | throwf("load command #%d is an unknown kind 0x%X", i, cmd->cmd()); | |
449 | } | |
450 | cmd = (const macho_load_command<P>*)endOfCmd; | |
451 | } | |
452 | ||
453 | // check segments | |
454 | cmd = cmds; | |
455 | std::vector<std::pair<pint_t, pint_t> > segmentAddressRanges; | |
456 | std::vector<std::pair<pint_t, pint_t> > segmentFileOffsetRanges; | |
457 | const macho_segment_command<P>* linkEditSegment = NULL; | |
afe874b1 | 458 | const macho_segment_command<P>* stackSegment = NULL; |
d696c285 A |
459 | for (uint32_t i = 0; i < cmd_count; ++i) { |
460 | if ( cmd->cmd() == macho_segment_command<P>::CMD ) { | |
461 | const macho_segment_command<P>* segCmd = (const macho_segment_command<P>*)cmd; | |
a645023d | 462 | fSegments.push_back(segCmd); |
d696c285 A |
463 | if ( segCmd->cmdsize() != (sizeof(macho_segment_command<P>) + segCmd->nsects() * sizeof(macho_section_content<P>)) ) |
464 | throw "invalid segment load command size"; | |
465 | ||
466 | // see if this overlaps another segment address range | |
467 | uint64_t startAddr = segCmd->vmaddr(); | |
468 | uint64_t endAddr = startAddr + segCmd->vmsize(); | |
469 | for (typename std::vector<std::pair<pint_t, pint_t> >::iterator it = segmentAddressRanges.begin(); it != segmentAddressRanges.end(); ++it) { | |
470 | if ( it->first < startAddr ) { | |
471 | if ( it->second > startAddr ) | |
472 | throw "overlapping segment vm addresses"; | |
473 | } | |
474 | else if ( it->first > startAddr ) { | |
475 | if ( it->first < endAddr ) | |
476 | throw "overlapping segment vm addresses"; | |
477 | } | |
478 | else { | |
479 | throw "overlapping segment vm addresses"; | |
480 | } | |
481 | segmentAddressRanges.push_back(std::make_pair<pint_t, pint_t>(startAddr, endAddr)); | |
482 | } | |
483 | // see if this overlaps another segment file offset range | |
484 | uint64_t startOffset = segCmd->fileoff(); | |
485 | uint64_t endOffset = startOffset + segCmd->filesize(); | |
486 | for (typename std::vector<std::pair<pint_t, pint_t> >::iterator it = segmentFileOffsetRanges.begin(); it != segmentFileOffsetRanges.end(); ++it) { | |
487 | if ( it->first < startOffset ) { | |
488 | if ( it->second > startOffset ) | |
489 | throw "overlapping segment file data"; | |
490 | } | |
491 | else if ( it->first > startOffset ) { | |
492 | if ( it->first < endOffset ) | |
493 | throw "overlapping segment file data"; | |
494 | } | |
495 | else { | |
496 | throw "overlapping segment file data"; | |
497 | } | |
498 | segmentFileOffsetRanges.push_back(std::make_pair<pint_t, pint_t>(startOffset, endOffset)); | |
499 | // check is within file bounds | |
500 | if ( (startOffset > fLength) || (endOffset > fLength) ) | |
501 | throw "segment file data is past end of file"; | |
502 | } | |
503 | // verify it fits in file | |
504 | if ( startOffset > fLength ) | |
505 | throw "segment fileoff does not fit in file"; | |
506 | if ( endOffset > fLength ) | |
507 | throw "segment fileoff+filesize does not fit in file"; | |
508 | ||
afe874b1 | 509 | // record special segments |
d696c285 A |
510 | if ( strcmp(segCmd->segname(), "__LINKEDIT") == 0 ) |
511 | linkEditSegment = segCmd; | |
afe874b1 A |
512 | else if ( strcmp(segCmd->segname(), "__UNIXSTACK") == 0 ) |
513 | stackSegment = segCmd; | |
69a49097 A |
514 | |
515 | // cache interesting segments | |
516 | if ( fFirstSegment == NULL ) | |
517 | fFirstSegment = segCmd; | |
afe874b1 A |
518 | if ( (fTEXTSegment == NULL) && (strcmp(segCmd->segname(), "__TEXT") == 0) ) |
519 | fTEXTSegment = segCmd; | |
a61fdf0a A |
520 | if ( (segCmd->initprot() & VM_PROT_WRITE) != 0 ) { |
521 | if ( fFirstWritableSegment == NULL ) | |
522 | fFirstWritableSegment = segCmd; | |
523 | if ( segCmd->vmaddr() > 0x100000000ULL ) | |
524 | fWriteableSegmentWithAddrOver4G = true; | |
525 | } | |
afe874b1 | 526 | |
d696c285 A |
527 | // check section ranges |
528 | const macho_section<P>* const sectionsStart = (macho_section<P>*)((char*)segCmd + sizeof(macho_segment_command<P>)); | |
529 | const macho_section<P>* const sectionsEnd = §ionsStart[segCmd->nsects()]; | |
530 | for(const macho_section<P>* sect = sectionsStart; sect < sectionsEnd; ++sect) { | |
afe874b1 | 531 | // check all non-zero sized sections are within segment |
d696c285 A |
532 | if ( sect->addr() < startAddr ) |
533 | throwf("section %s vm address not within segment", sect->sectname()); | |
534 | if ( (sect->addr()+sect->size()) > endAddr ) | |
535 | throwf("section %s vm address not within segment", sect->sectname()); | |
a645023d A |
536 | if ( ((sect->flags() & SECTION_TYPE) != S_ZEROFILL) |
537 | && ((sect->flags() & SECTION_TYPE) != S_THREAD_LOCAL_ZEROFILL) | |
afe874b1 A |
538 | && (segCmd->filesize() != 0) |
539 | && (sect->size() != 0) ) { | |
d696c285 A |
540 | if ( sect->offset() < startOffset ) |
541 | throwf("section %s file offset not within segment", sect->sectname()); | |
542 | if ( (sect->offset()+sect->size()) > endOffset ) | |
543 | throwf("section %s file offset not within segment", sect->sectname()); | |
544 | } | |
545 | checkSection(segCmd, sect); | |
c211e7c9 | 546 | ++fSectionCount; |
d696c285 A |
547 | } |
548 | } | |
549 | cmd = (const macho_load_command<P>*)(((uint8_t*)cmd)+cmd->cmdsize()); | |
550 | } | |
551 | ||
552 | // verify there was a LINKEDIT segment | |
553 | if ( linkEditSegment == NULL ) | |
554 | throw "no __LINKEDIT segment"; | |
555 | ||
afe874b1 A |
556 | // verify there was an executable __TEXT segment and load commands are in it |
557 | if ( fTEXTSegment == NULL ) | |
558 | throw "no __TEXT segment"; | |
559 | if ( fTEXTSegment->initprot() != (VM_PROT_READ|VM_PROT_EXECUTE) ) | |
560 | throw "__TEXT segment does not have r-x init permissions"; | |
561 | //if ( fTEXTSegment->maxprot() != (VM_PROT_READ|VM_PROT_EXECUTE|VM_PROT_WRITE) ) | |
562 | // throw "__TEXT segment does not have rwx max permissions"; | |
563 | if ( fTEXTSegment->fileoff() != 0 ) | |
564 | throw "__TEXT segment does not start at mach_header"; | |
565 | if ( fTEXTSegment->filesize() < (sizeof(macho_header<P>)+fHeader->sizeofcmds()) ) | |
566 | throw "__TEXT segment smaller than load commands"; | |
567 | ||
568 | // verify if custom stack used, that stack is in __UNIXSTACK segment | |
569 | if ( threadInfo != NULL ) { | |
570 | pint_t initialSP = getInitialStackPointer(threadInfo); | |
571 | if ( initialSP != 0 ) { | |
572 | if ( stackSegment == NULL ) | |
573 | throw "LC_UNIXTHREAD specifics custom initial stack pointer, but no __UNIXSTACK segment"; | |
574 | if ( (initialSP < stackSegment->vmaddr()) || (initialSP > (stackSegment->vmaddr()+stackSegment->vmsize())) ) | |
575 | throw "LC_UNIXTHREAD specifics custom initial stack pointer which does not point into __UNIXSTACK segment"; | |
576 | } | |
577 | } | |
578 | ||
579 | // verify __UNIXSTACK is zero fill | |
580 | if ( stackSegment != NULL ) { | |
581 | if ( (stackSegment->filesize() != 0) || (stackSegment->fileoff() != 0) ) | |
582 | throw "__UNIXSTACK is not a zero-fill segment"; | |
583 | if ( stackSegment->vmsize() < 4096 ) | |
584 | throw "__UNIXSTACK segment is too small"; | |
585 | } | |
586 | ||
587 | // verify entry point is in __TEXT segment | |
588 | if ( threadInfo != NULL ) { | |
589 | pint_t initialPC = getEntryPoint(threadInfo); | |
590 | if ( (initialPC < fTEXTSegment->vmaddr()) || (initialPC >= (fTEXTSegment->vmaddr()+fTEXTSegment->vmsize())) ) | |
591 | throwf("entry point 0x%0llX is outside __TEXT segment", (long long)initialPC); | |
592 | } | |
593 | ||
594 | ||
d696c285 A |
595 | // checks for executables |
596 | bool isStaticExecutable = false; | |
597 | if ( fHeader->filetype() == MH_EXECUTE ) { | |
598 | isStaticExecutable = true; | |
599 | cmd = cmds; | |
600 | for (uint32_t i = 0; i < cmd_count; ++i) { | |
601 | switch ( cmd->cmd() ) { | |
602 | case LC_LOAD_DYLINKER: | |
603 | // the existence of a dyld load command makes a executable dynamic | |
604 | isStaticExecutable = false; | |
605 | break; | |
606 | } | |
607 | cmd = (const macho_load_command<P>*)(((uint8_t*)cmd)+cmd->cmdsize()); | |
608 | } | |
609 | if ( isStaticExecutable ) { | |
610 | if ( fHeader->flags() != MH_NOUNDEFS ) | |
611 | throw "invalid bits in mach_header flags for static executable"; | |
612 | } | |
613 | } | |
614 | ||
2f2f92e4 A |
615 | // verify encryption info |
616 | if ( encryption_info != NULL ) { | |
617 | if ( fHeader->filetype() != MH_EXECUTE ) | |
618 | throw "LC_ENCRYPTION_INFO load command is only legal in main executables"; | |
619 | if ( encryption_info->cryptoff() < (sizeof(macho_header<P>) + fHeader->sizeofcmds()) ) | |
620 | throw "LC_ENCRYPTION_INFO load command has cryptoff covers some load commands"; | |
621 | if ( (encryption_info->cryptoff() % 4096) != 0 ) | |
622 | throw "LC_ENCRYPTION_INFO load command has cryptoff which is not page aligned"; | |
623 | if ( (encryption_info->cryptsize() % 4096) != 0 ) | |
624 | throw "LC_ENCRYPTION_INFO load command has cryptsize which is not page sized"; | |
625 | for (typename std::vector<std::pair<pint_t, pint_t> >::iterator it = segmentFileOffsetRanges.begin(); | |
626 | it != segmentFileOffsetRanges.end(); ++it) { | |
627 | if ( (it->first <= encryption_info->cryptoff()) && (encryption_info->cryptoff() < it->second) ) { | |
628 | if ( (encryption_info->cryptoff() + encryption_info->cryptsize()) > it->second ) | |
629 | throw "LC_ENCRYPTION_INFO load command is not contained within one segment"; | |
630 | } | |
631 | } | |
632 | } | |
633 | ||
a61fdf0a | 634 | // check LC_SYMTAB, LC_DYSYMTAB, and LC_SEGMENT_SPLIT_INFO |
d696c285 A |
635 | cmd = cmds; |
636 | bool foundDynamicSymTab = false; | |
637 | for (uint32_t i = 0; i < cmd_count; ++i) { | |
638 | switch ( cmd->cmd() ) { | |
639 | case LC_SYMTAB: | |
640 | { | |
641 | const macho_symtab_command<P>* symtab = (macho_symtab_command<P>*)cmd; | |
642 | fSymbolCount = symtab->nsyms(); | |
643 | fSymbols = (const macho_nlist<P>*)((char*)fHeader + symtab->symoff()); | |
644 | if ( symtab->symoff() < linkEditSegment->fileoff() ) | |
645 | throw "symbol table not in __LINKEDIT"; | |
646 | if ( (symtab->symoff() + fSymbolCount*sizeof(macho_nlist<P>*)) > (linkEditSegment->fileoff()+linkEditSegment->filesize()) ) | |
647 | throw "symbol table end not in __LINKEDIT"; | |
a61fdf0a A |
648 | if ( (symtab->symoff() % sizeof(pint_t)) != 0 ) |
649 | throw "symbol table start not pointer aligned"; | |
d696c285 A |
650 | fStrings = (char*)fHeader + symtab->stroff(); |
651 | fStringsEnd = fStrings + symtab->strsize(); | |
652 | if ( symtab->stroff() < linkEditSegment->fileoff() ) | |
653 | throw "string pool not in __LINKEDIT"; | |
654 | if ( (symtab->stroff()+symtab->strsize()) > (linkEditSegment->fileoff()+linkEditSegment->filesize()) ) | |
655 | throw "string pool extends beyond __LINKEDIT"; | |
a61fdf0a A |
656 | if ( (symtab->stroff() % 4) != 0 ) // work around until rdar://problem/4737991 is fixed |
657 | throw "string pool start not pointer aligned"; | |
658 | if ( (symtab->strsize() % sizeof(pint_t)) != 0 ) | |
659 | throw "string pool size not a multiple of pointer size"; | |
d696c285 A |
660 | } |
661 | break; | |
662 | case LC_DYSYMTAB: | |
663 | { | |
664 | if ( isStaticExecutable ) | |
665 | throw "LC_DYSYMTAB should not be used in static executable"; | |
666 | foundDynamicSymTab = true; | |
a645023d | 667 | fDynamicSymbolTable = (macho_dysymtab_command<P>*)cmd; |
a61fdf0a A |
668 | fIndirectTable = (uint32_t*)((char*)fHeader + fDynamicSymbolTable->indirectsymoff()); |
669 | fIndirectTableCount = fDynamicSymbolTable->nindirectsyms(); | |
74cfe461 | 670 | if ( fIndirectTableCount != 0 ) { |
a61fdf0a | 671 | if ( fDynamicSymbolTable->indirectsymoff() < linkEditSegment->fileoff() ) |
74cfe461 | 672 | throw "indirect symbol table not in __LINKEDIT"; |
a61fdf0a | 673 | if ( (fDynamicSymbolTable->indirectsymoff()+fIndirectTableCount*8) > (linkEditSegment->fileoff()+linkEditSegment->filesize()) ) |
74cfe461 | 674 | throw "indirect symbol table not in __LINKEDIT"; |
a61fdf0a A |
675 | if ( (fDynamicSymbolTable->indirectsymoff() % sizeof(pint_t)) != 0 ) |
676 | throw "indirect symbol table not pointer aligned"; | |
74cfe461 | 677 | } |
a61fdf0a | 678 | fLocalRelocationsCount = fDynamicSymbolTable->nlocrel(); |
69a49097 | 679 | if ( fLocalRelocationsCount != 0 ) { |
a61fdf0a A |
680 | fLocalRelocations = (const macho_relocation_info<P>*)((char*)fHeader + fDynamicSymbolTable->locreloff()); |
681 | if ( fDynamicSymbolTable->locreloff() < linkEditSegment->fileoff() ) | |
69a49097 | 682 | throw "local relocations not in __LINKEDIT"; |
a61fdf0a | 683 | if ( (fDynamicSymbolTable->locreloff()+fLocalRelocationsCount*sizeof(macho_relocation_info<P>)) > (linkEditSegment->fileoff()+linkEditSegment->filesize()) ) |
69a49097 | 684 | throw "local relocations not in __LINKEDIT"; |
a61fdf0a A |
685 | if ( (fDynamicSymbolTable->locreloff() % sizeof(pint_t)) != 0 ) |
686 | throw "local relocations table not pointer aligned"; | |
69a49097 | 687 | } |
a61fdf0a | 688 | fExternalRelocationsCount = fDynamicSymbolTable->nextrel(); |
69a49097 | 689 | if ( fExternalRelocationsCount != 0 ) { |
a61fdf0a A |
690 | fExternalRelocations = (const macho_relocation_info<P>*)((char*)fHeader + fDynamicSymbolTable->extreloff()); |
691 | if ( fDynamicSymbolTable->extreloff() < linkEditSegment->fileoff() ) | |
692 | throw "external relocations not in __LINKEDIT"; | |
693 | if ( (fDynamicSymbolTable->extreloff()+fExternalRelocationsCount*sizeof(macho_relocation_info<P>)) > (linkEditSegment->fileoff()+linkEditSegment->filesize()) ) | |
694 | throw "external relocations not in __LINKEDIT"; | |
695 | if ( (fDynamicSymbolTable->extreloff() % sizeof(pint_t)) != 0 ) | |
696 | throw "external relocations table not pointer aligned"; | |
69a49097 | 697 | } |
d696c285 A |
698 | } |
699 | break; | |
a61fdf0a A |
700 | case LC_SEGMENT_SPLIT_INFO: |
701 | { | |
702 | if ( isStaticExecutable ) | |
703 | throw "LC_SEGMENT_SPLIT_INFO should not be used in static executable"; | |
a645023d | 704 | const macho_linkedit_data_command<P>* info = (macho_linkedit_data_command<P>*)cmd; |
a61fdf0a A |
705 | if ( info->dataoff() < linkEditSegment->fileoff() ) |
706 | throw "split seg info not in __LINKEDIT"; | |
707 | if ( (info->dataoff()+info->datasize()) > (linkEditSegment->fileoff()+linkEditSegment->filesize()) ) | |
708 | throw "split seg info not in __LINKEDIT"; | |
709 | if ( (info->dataoff() % sizeof(pint_t)) != 0 ) | |
710 | throw "split seg info table not pointer aligned"; | |
711 | if ( (info->datasize() % sizeof(pint_t)) != 0 ) | |
712 | throw "split seg info size not a multiple of pointer size"; | |
713 | } | |
714 | break; | |
a645023d A |
715 | case LC_FUNCTION_STARTS: |
716 | { | |
717 | const macho_linkedit_data_command<P>* info = (macho_linkedit_data_command<P>*)cmd; | |
718 | if ( info->dataoff() < linkEditSegment->fileoff() ) | |
719 | throw "function starts data not in __LINKEDIT"; | |
720 | if ( (info->dataoff()+info->datasize()) > (linkEditSegment->fileoff()+linkEditSegment->filesize()) ) | |
721 | throw "function starts data not in __LINKEDIT"; | |
722 | if ( (info->dataoff() % sizeof(pint_t)) != 0 ) | |
723 | throw "function starts data table not pointer aligned"; | |
724 | if ( (info->datasize() % sizeof(pint_t)) != 0 ) | |
725 | throw "function starts data size not a multiple of pointer size"; | |
726 | } | |
727 | break; | |
d696c285 A |
728 | } |
729 | cmd = (const macho_load_command<P>*)(((uint8_t*)cmd)+cmd->cmdsize()); | |
730 | } | |
731 | if ( !isStaticExecutable && !foundDynamicSymTab ) | |
732 | throw "missing dynamic symbol table"; | |
733 | if ( fStrings == NULL ) | |
734 | throw "missing symbol table"; | |
a61fdf0a | 735 | |
d696c285 A |
736 | } |
737 | ||
738 | template <typename A> | |
739 | void MachOChecker<A>::checkSection(const macho_segment_command<P>* segCmd, const macho_section<P>* sect) | |
740 | { | |
741 | uint8_t sectionType = (sect->flags() & SECTION_TYPE); | |
742 | if ( sectionType == S_ZEROFILL ) { | |
743 | if ( sect->offset() != 0 ) | |
744 | throwf("section offset should be zero for zero-fill section %s", sect->sectname()); | |
745 | } | |
746 | ||
afe874b1 A |
747 | // check section's segment name matches segment |
748 | // if ( strncmp(sect->segname(), segCmd->segname(), 16) != 0 ) | |
749 | // throwf("section %s in segment %s has wrong segment name", sect->sectname(), segCmd->segname()); | |
750 | ||
d696c285 A |
751 | // more section tests here |
752 | } | |
753 | ||
afe874b1 A |
754 | |
755 | ||
756 | ||
d696c285 A |
757 | template <typename A> |
758 | void MachOChecker<A>::checkIndirectSymbolTable() | |
759 | { | |
a645023d A |
760 | // static executables don't have indirect symbol table |
761 | if ( fDynamicSymbolTable == NULL ) | |
762 | return; | |
d696c285 A |
763 | const macho_load_command<P>* const cmds = (macho_load_command<P>*)((uint8_t*)fHeader + sizeof(macho_header<P>)); |
764 | const uint32_t cmd_count = fHeader->ncmds(); | |
765 | const macho_load_command<P>* cmd = cmds; | |
766 | for (uint32_t i = 0; i < cmd_count; ++i) { | |
767 | if ( cmd->cmd() == macho_segment_command<P>::CMD ) { | |
768 | const macho_segment_command<P>* segCmd = (const macho_segment_command<P>*)cmd; | |
769 | const macho_section<P>* const sectionsStart = (macho_section<P>*)((char*)segCmd + sizeof(macho_segment_command<P>)); | |
770 | const macho_section<P>* const sectionsEnd = §ionsStart[segCmd->nsects()]; | |
771 | for(const macho_section<P>* sect = sectionsStart; sect < sectionsEnd; ++sect) { | |
772 | // make sure all magic sections that use indirect symbol table fit within it | |
773 | uint32_t start = 0; | |
774 | uint32_t elementSize = 0; | |
775 | switch ( sect->flags() & SECTION_TYPE ) { | |
776 | case S_SYMBOL_STUBS: | |
777 | elementSize = sect->reserved2(); | |
778 | start = sect->reserved1(); | |
779 | break; | |
780 | case S_LAZY_SYMBOL_POINTERS: | |
781 | case S_NON_LAZY_SYMBOL_POINTERS: | |
782 | elementSize = sizeof(pint_t); | |
783 | start = sect->reserved1(); | |
784 | break; | |
785 | } | |
786 | if ( elementSize != 0 ) { | |
787 | uint32_t count = sect->size() / elementSize; | |
788 | if ( (count*elementSize) != sect->size() ) | |
789 | throwf("%s section size is not an even multiple of element size", sect->sectname()); | |
790 | if ( (start+count) > fIndirectTableCount ) | |
791 | throwf("%s section references beyond end of indirect symbol table (%d > %d)", sect->sectname(), start+count, fIndirectTableCount ); | |
792 | } | |
793 | } | |
794 | } | |
795 | cmd = (const macho_load_command<P>*)(((uint8_t*)cmd)+cmd->cmdsize()); | |
796 | } | |
797 | } | |
798 | ||
799 | ||
afe874b1 A |
800 | |
801 | ||
a61fdf0a A |
802 | template <typename A> |
803 | void MachOChecker<A>::checkSymbolTable() | |
804 | { | |
805 | // verify no duplicate external symbol names | |
806 | if ( fDynamicSymbolTable != NULL ) { | |
807 | StringSet externalNames; | |
808 | const macho_nlist<P>* const exportedStart = &fSymbols[fDynamicSymbolTable->iextdefsym()]; | |
809 | const macho_nlist<P>* const exportedEnd = &exportedStart[fDynamicSymbolTable->nextdefsym()]; | |
55e3d2f6 A |
810 | int i = fDynamicSymbolTable->iextdefsym(); |
811 | for(const macho_nlist<P>* p = exportedStart; p < exportedEnd; ++p, ++i) { | |
a61fdf0a | 812 | const char* symName = &fStrings[p->n_strx()]; |
55e3d2f6 A |
813 | if ( symName > fStringsEnd ) |
814 | throw "string index out of range"; | |
815 | //fprintf(stderr, "sym[%d] = %s\n", i, symName); | |
a61fdf0a A |
816 | if ( externalNames.find(symName) != externalNames.end() ) |
817 | throwf("duplicate external symbol: %s", symName); | |
a645023d A |
818 | if ( (p->n_type() & N_EXT) == 0 ) |
819 | throwf("non-external symbol in external symbol range: %s", symName); | |
820 | // don't add N_INDR to externalNames because there is likely an undefine with same name | |
821 | if ( (p->n_type() & N_INDR) == 0 ) | |
822 | externalNames.insert(symName); | |
a61fdf0a | 823 | } |
55e3d2f6 A |
824 | // verify no undefines with same name as an external symbol |
825 | const macho_nlist<P>* const undefinesStart = &fSymbols[fDynamicSymbolTable->iundefsym()]; | |
826 | const macho_nlist<P>* const undefinesEnd = &undefinesStart[fDynamicSymbolTable->nundefsym()]; | |
827 | for(const macho_nlist<P>* p = undefinesStart; p < undefinesEnd; ++p) { | |
828 | const char* symName = &fStrings[p->n_strx()]; | |
829 | if ( symName > fStringsEnd ) | |
830 | throw "string index out of range"; | |
831 | if ( externalNames.find(symName) != externalNames.end() ) | |
832 | throwf("undefine with same name as external symbol: %s", symName); | |
833 | } | |
c211e7c9 A |
834 | // verify all N_SECT values are valid |
835 | for(const macho_nlist<P>* p = fSymbols; p < &fSymbols[fSymbolCount]; ++p) { | |
836 | uint8_t type = p->n_type(); | |
837 | if ( ((type & N_STAB) == 0) && ((type & N_TYPE) == N_SECT) ) { | |
838 | if ( p->n_sect() > fSectionCount ) { | |
839 | throwf("symbol '%s' has n_sect=%d which is too large", &fStrings[p->n_strx()], p->n_sect()); | |
840 | } | |
841 | } | |
842 | } | |
a61fdf0a A |
843 | } |
844 | } | |
845 | ||
69a49097 | 846 | |
afe874b1 A |
847 | template <typename A> |
848 | void MachOChecker<A>::checkInitTerms() | |
849 | { | |
850 | const macho_load_command<P>* const cmds = (macho_load_command<P>*)((uint8_t*)fHeader + sizeof(macho_header<P>)); | |
851 | const uint32_t cmd_count = fHeader->ncmds(); | |
852 | const macho_load_command<P>* cmd = cmds; | |
853 | for (uint32_t i = 0; i < cmd_count; ++i) { | |
854 | if ( cmd->cmd() == macho_segment_command<P>::CMD ) { | |
855 | const macho_segment_command<P>* segCmd = (const macho_segment_command<P>*)cmd; | |
856 | const macho_section<P>* const sectionsStart = (macho_section<P>*)((char*)segCmd + sizeof(macho_segment_command<P>)); | |
857 | const macho_section<P>* const sectionsEnd = §ionsStart[segCmd->nsects()]; | |
858 | for(const macho_section<P>* sect = sectionsStart; sect < sectionsEnd; ++sect) { | |
859 | // make sure all magic sections that use indirect symbol table fit within it | |
860 | uint32_t count; | |
861 | pint_t* arrayStart; | |
862 | pint_t* arrayEnd; | |
863 | const char* kind = "initializer"; | |
864 | switch ( sect->flags() & SECTION_TYPE ) { | |
865 | case S_MOD_TERM_FUNC_POINTERS: | |
866 | kind = "terminator"; | |
867 | // fall through | |
868 | case S_MOD_INIT_FUNC_POINTERS: | |
869 | count = sect->size() / sizeof(pint_t); | |
870 | if ( (count*sizeof(pint_t)) != sect->size() ) | |
871 | throwf("%s section size is not an even multiple of element size", sect->sectname()); | |
872 | if ( (sect->addr() % sizeof(pint_t)) != 0 ) | |
873 | throwf("%s section size is not pointer size aligned", sect->sectname()); | |
874 | // check each pointer in array points within TEXT | |
875 | arrayStart = (pint_t*)((char*)fHeader + sect->offset()); | |
876 | arrayEnd = (pint_t*)((char*)fHeader + sect->offset() + sect->size()); | |
877 | for (pint_t* p=arrayStart; p < arrayEnd; ++p) { | |
878 | pint_t pointer = P::getP(*p); | |
879 | if ( (pointer < fTEXTSegment->vmaddr()) || (pointer >= (fTEXTSegment->vmaddr()+fTEXTSegment->vmsize())) ) | |
880 | throwf("%s 0x%08llX points outside __TEXT segment", kind, (long long)pointer); | |
881 | } | |
882 | // check each pointer in array will be rebased and not bound | |
883 | if ( fSlidableImage ) { | |
884 | pint_t sectionBeginAddr = sect->addr(); | |
885 | pint_t sectionEndddr = sect->addr() + sect->size(); | |
886 | for(pint_t addr = sectionBeginAddr; addr < sectionEndddr; addr += sizeof(pint_t)) { | |
887 | if ( addressIsBindingSite(addr) ) | |
888 | throwf("%s at 0x%0llX has binding to external symbol", kind, (long long)addr); | |
889 | if ( ! addressIsRebaseSite(addr) ) | |
890 | throwf("%s at 0x%0llX is not rebased", kind, (long long)addr); | |
891 | } | |
892 | } | |
893 | break; | |
894 | } | |
895 | } | |
896 | } | |
897 | cmd = (const macho_load_command<P>*)(((uint8_t*)cmd)+cmd->cmdsize()); | |
898 | } | |
899 | ||
900 | } | |
901 | ||
902 | ||
69a49097 A |
903 | template <> |
904 | ppc::P::uint_t MachOChecker<ppc>::relocBase() | |
905 | { | |
906 | if ( fHeader->flags() & MH_SPLIT_SEGS ) | |
907 | return fFirstWritableSegment->vmaddr(); | |
908 | else | |
909 | return fFirstSegment->vmaddr(); | |
910 | } | |
911 | ||
912 | template <> | |
913 | ppc64::P::uint_t MachOChecker<ppc64>::relocBase() | |
914 | { | |
915 | if ( fWriteableSegmentWithAddrOver4G ) | |
916 | return fFirstWritableSegment->vmaddr(); | |
917 | else | |
918 | return fFirstSegment->vmaddr(); | |
919 | } | |
920 | ||
921 | template <> | |
922 | x86::P::uint_t MachOChecker<x86>::relocBase() | |
923 | { | |
924 | if ( fHeader->flags() & MH_SPLIT_SEGS ) | |
925 | return fFirstWritableSegment->vmaddr(); | |
926 | else | |
927 | return fFirstSegment->vmaddr(); | |
928 | } | |
929 | ||
930 | template <> | |
931 | x86_64::P::uint_t MachOChecker<x86_64>::relocBase() | |
932 | { | |
933 | // check for split-seg | |
934 | return fFirstWritableSegment->vmaddr(); | |
935 | } | |
936 | ||
2f2f92e4 A |
937 | template <> |
938 | arm::P::uint_t MachOChecker<arm>::relocBase() | |
939 | { | |
940 | if ( fHeader->flags() & MH_SPLIT_SEGS ) | |
941 | return fFirstWritableSegment->vmaddr(); | |
942 | else | |
943 | return fFirstSegment->vmaddr(); | |
944 | } | |
945 | ||
69a49097 A |
946 | |
947 | template <typename A> | |
948 | bool MachOChecker<A>::addressInWritableSegment(pint_t address) | |
949 | { | |
950 | const macho_load_command<P>* const cmds = (macho_load_command<P>*)((uint8_t*)fHeader + sizeof(macho_header<P>)); | |
951 | const uint32_t cmd_count = fHeader->ncmds(); | |
952 | const macho_load_command<P>* cmd = cmds; | |
953 | for (uint32_t i = 0; i < cmd_count; ++i) { | |
954 | if ( cmd->cmd() == macho_segment_command<P>::CMD ) { | |
955 | const macho_segment_command<P>* segCmd = (const macho_segment_command<P>*)cmd; | |
2f2f92e4 A |
956 | if ( (address >= segCmd->vmaddr()) && (address < segCmd->vmaddr()+segCmd->vmsize()) ) { |
957 | // if segment is writable, we are fine | |
958 | if ( (segCmd->initprot() & VM_PROT_WRITE) != 0 ) | |
69a49097 | 959 | return true; |
2f2f92e4 A |
960 | // could be a text reloc, make sure section bit is set |
961 | const macho_section<P>* const sectionsStart = (macho_section<P>*)((char*)segCmd + sizeof(macho_segment_command<P>)); | |
962 | const macho_section<P>* const sectionsEnd = §ionsStart[segCmd->nsects()]; | |
963 | for(const macho_section<P>* sect = sectionsStart; sect < sectionsEnd; ++sect) { | |
964 | if ( (sect->addr() <= address) && (address < (sect->addr()+sect->size())) ) { | |
965 | // found section for this address, if has relocs we are fine | |
966 | return ( (sect->flags() & (S_ATTR_EXT_RELOC|S_ATTR_LOC_RELOC)) != 0 ); | |
967 | } | |
968 | } | |
69a49097 A |
969 | } |
970 | } | |
971 | cmd = (const macho_load_command<P>*)(((uint8_t*)cmd)+cmd->cmdsize()); | |
972 | } | |
973 | return false; | |
974 | } | |
975 | ||
976 | ||
977 | template <> | |
978 | void MachOChecker<ppc>::checkExternalReloation(const macho_relocation_info<P>* reloc) | |
979 | { | |
a61fdf0a A |
980 | if ( reloc->r_length() != 2 ) |
981 | throw "bad external relocation length"; | |
982 | if ( reloc->r_type() != GENERIC_RELOC_VANILLA ) | |
983 | throw "unknown external relocation type"; | |
984 | if ( reloc->r_pcrel() != 0 ) | |
985 | throw "bad external relocation pc_rel"; | |
986 | if ( reloc->r_extern() == 0 ) | |
987 | throw "local relocation found with external relocations"; | |
988 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
989 | throw "external relocation address not in writable segment"; | |
990 | // FIX: check r_symbol | |
69a49097 A |
991 | } |
992 | ||
993 | template <> | |
994 | void MachOChecker<ppc64>::checkExternalReloation(const macho_relocation_info<P>* reloc) | |
995 | { | |
996 | if ( reloc->r_length() != 3 ) | |
997 | throw "bad external relocation length"; | |
998 | if ( reloc->r_type() != GENERIC_RELOC_VANILLA ) | |
999 | throw "unknown external relocation type"; | |
1000 | if ( reloc->r_pcrel() != 0 ) | |
1001 | throw "bad external relocation pc_rel"; | |
1002 | if ( reloc->r_extern() == 0 ) | |
1003 | throw "local relocation found with external relocations"; | |
1004 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
a61fdf0a | 1005 | throw "external relocation address not in writable segment"; |
69a49097 A |
1006 | // FIX: check r_symbol |
1007 | } | |
1008 | ||
1009 | template <> | |
1010 | void MachOChecker<x86>::checkExternalReloation(const macho_relocation_info<P>* reloc) | |
1011 | { | |
a61fdf0a A |
1012 | if ( reloc->r_length() != 2 ) |
1013 | throw "bad external relocation length"; | |
1014 | if ( reloc->r_type() != GENERIC_RELOC_VANILLA ) | |
1015 | throw "unknown external relocation type"; | |
1016 | if ( reloc->r_pcrel() != 0 ) | |
1017 | throw "bad external relocation pc_rel"; | |
1018 | if ( reloc->r_extern() == 0 ) | |
1019 | throw "local relocation found with external relocations"; | |
1020 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
1021 | throw "external relocation address not in writable segment"; | |
1022 | // FIX: check r_symbol | |
69a49097 A |
1023 | } |
1024 | ||
1025 | ||
1026 | template <> | |
1027 | void MachOChecker<x86_64>::checkExternalReloation(const macho_relocation_info<P>* reloc) | |
1028 | { | |
1029 | if ( reloc->r_length() != 3 ) | |
1030 | throw "bad external relocation length"; | |
1031 | if ( reloc->r_type() != X86_64_RELOC_UNSIGNED ) | |
1032 | throw "unknown external relocation type"; | |
1033 | if ( reloc->r_pcrel() != 0 ) | |
1034 | throw "bad external relocation pc_rel"; | |
1035 | if ( reloc->r_extern() == 0 ) | |
1036 | throw "local relocation found with external relocations"; | |
1037 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
1038 | throw "exernal relocation address not in writable segment"; | |
1039 | // FIX: check r_symbol | |
1040 | } | |
1041 | ||
2f2f92e4 A |
1042 | template <> |
1043 | void MachOChecker<arm>::checkExternalReloation(const macho_relocation_info<P>* reloc) | |
1044 | { | |
1045 | if ( reloc->r_length() != 2 ) | |
1046 | throw "bad external relocation length"; | |
1047 | if ( reloc->r_type() != ARM_RELOC_VANILLA ) | |
1048 | throw "unknown external relocation type"; | |
1049 | if ( reloc->r_pcrel() != 0 ) | |
1050 | throw "bad external relocation pc_rel"; | |
1051 | if ( reloc->r_extern() == 0 ) | |
1052 | throw "local relocation found with external relocations"; | |
1053 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
1054 | throw "external relocation address not in writable segment"; | |
1055 | // FIX: check r_symbol | |
1056 | } | |
1057 | ||
1058 | ||
69a49097 A |
1059 | template <> |
1060 | void MachOChecker<ppc>::checkLocalReloation(const macho_relocation_info<P>* reloc) | |
1061 | { | |
1062 | if ( reloc->r_address() & R_SCATTERED ) { | |
1063 | // scattered | |
1064 | const macho_scattered_relocation_info<P>* sreloc = (const macho_scattered_relocation_info<P>*)reloc; | |
1065 | // FIX | |
1066 | ||
1067 | } | |
1068 | else { | |
1069 | // FIX | |
1070 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
2f2f92e4 | 1071 | throwf("local relocation address 0x%08X not in writable segment", reloc->r_address()); |
69a49097 A |
1072 | } |
1073 | } | |
1074 | ||
1075 | ||
1076 | template <> | |
1077 | void MachOChecker<ppc64>::checkLocalReloation(const macho_relocation_info<P>* reloc) | |
1078 | { | |
1079 | if ( reloc->r_length() != 3 ) | |
1080 | throw "bad local relocation length"; | |
1081 | if ( reloc->r_type() != GENERIC_RELOC_VANILLA ) | |
1082 | throw "unknown local relocation type"; | |
1083 | if ( reloc->r_pcrel() != 0 ) | |
1084 | throw "bad local relocation pc_rel"; | |
1085 | if ( reloc->r_extern() != 0 ) | |
1086 | throw "external relocation found with local relocations"; | |
1087 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
1088 | throw "local relocation address not in writable segment"; | |
1089 | } | |
1090 | ||
1091 | template <> | |
1092 | void MachOChecker<x86>::checkLocalReloation(const macho_relocation_info<P>* reloc) | |
1093 | { | |
1094 | // FIX | |
1095 | } | |
1096 | ||
1097 | template <> | |
1098 | void MachOChecker<x86_64>::checkLocalReloation(const macho_relocation_info<P>* reloc) | |
1099 | { | |
1100 | if ( reloc->r_length() != 3 ) | |
1101 | throw "bad local relocation length"; | |
1102 | if ( reloc->r_type() != X86_64_RELOC_UNSIGNED ) | |
1103 | throw "unknown local relocation type"; | |
1104 | if ( reloc->r_pcrel() != 0 ) | |
1105 | throw "bad local relocation pc_rel"; | |
1106 | if ( reloc->r_extern() != 0 ) | |
1107 | throw "external relocation found with local relocations"; | |
1108 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
1109 | throw "local relocation address not in writable segment"; | |
1110 | } | |
1111 | ||
2f2f92e4 A |
1112 | template <> |
1113 | void MachOChecker<arm>::checkLocalReloation(const macho_relocation_info<P>* reloc) | |
1114 | { | |
1115 | if ( reloc->r_address() & R_SCATTERED ) { | |
1116 | // scattered | |
1117 | const macho_scattered_relocation_info<P>* sreloc = (const macho_scattered_relocation_info<P>*)reloc; | |
1118 | if ( sreloc->r_length() != 2 ) | |
1119 | throw "bad local scattered relocation length"; | |
1120 | if ( sreloc->r_type() != ARM_RELOC_PB_LA_PTR ) | |
1121 | throw "bad local scattered relocation type"; | |
1122 | } | |
1123 | else { | |
1124 | if ( reloc->r_length() != 2 ) | |
1125 | throw "bad local relocation length"; | |
1126 | if ( reloc->r_extern() != 0 ) | |
1127 | throw "external relocation found with local relocations"; | |
1128 | if ( ! this->addressInWritableSegment(reloc->r_address() + this->relocBase()) ) | |
1129 | throw "local relocation address not in writable segment"; | |
1130 | } | |
1131 | } | |
69a49097 A |
1132 | |
1133 | template <typename A> | |
1134 | void MachOChecker<A>::checkRelocations() | |
1135 | { | |
a61fdf0a A |
1136 | // external relocations should be sorted to minimize dyld symbol lookups |
1137 | // therefore every reloc with the same r_symbolnum value should be contiguous | |
1138 | std::set<uint32_t> previouslySeenSymbolIndexes; | |
1139 | uint32_t lastSymbolIndex = 0xFFFFFFFF; | |
69a49097 A |
1140 | const macho_relocation_info<P>* const externRelocsEnd = &fExternalRelocations[fExternalRelocationsCount]; |
1141 | for (const macho_relocation_info<P>* reloc = fExternalRelocations; reloc < externRelocsEnd; ++reloc) { | |
1142 | this->checkExternalReloation(reloc); | |
a61fdf0a A |
1143 | if ( reloc->r_symbolnum() != lastSymbolIndex ) { |
1144 | if ( previouslySeenSymbolIndexes.count(reloc->r_symbolnum()) != 0 ) | |
1145 | throw "external relocations not sorted"; | |
1146 | previouslySeenSymbolIndexes.insert(lastSymbolIndex); | |
1147 | lastSymbolIndex = reloc->r_symbolnum(); | |
1148 | } | |
69a49097 A |
1149 | } |
1150 | ||
1151 | const macho_relocation_info<P>* const localRelocsEnd = &fLocalRelocations[fLocalRelocationsCount]; | |
1152 | for (const macho_relocation_info<P>* reloc = fLocalRelocations; reloc < localRelocsEnd; ++reloc) { | |
1153 | this->checkLocalReloation(reloc); | |
1154 | } | |
a645023d A |
1155 | |
1156 | // verify any section with S_ATTR_LOC_RELOC bits set actually has text relocs | |
1157 | const macho_load_command<P>* const cmds = (macho_load_command<P>*)((uint8_t*)fHeader + sizeof(macho_header<P>)); | |
1158 | const uint32_t cmd_count = fHeader->ncmds(); | |
1159 | const macho_load_command<P>* cmd = cmds; | |
1160 | for (uint32_t i = 0; i < cmd_count; ++i) { | |
1161 | if ( cmd->cmd() == macho_segment_command<P>::CMD ) { | |
1162 | const macho_segment_command<P>* segCmd = (const macho_segment_command<P>*)cmd; | |
1163 | // if segment is writable, we are fine | |
1164 | if ( (segCmd->initprot() & VM_PROT_WRITE) != 0 ) | |
1165 | continue; | |
1166 | // look at sections that have text reloc bit set | |
1167 | const macho_section<P>* const sectionsStart = (macho_section<P>*)((char*)segCmd + sizeof(macho_segment_command<P>)); | |
1168 | const macho_section<P>* const sectionsEnd = §ionsStart[segCmd->nsects()]; | |
1169 | for(const macho_section<P>* sect = sectionsStart; sect < sectionsEnd; ++sect) { | |
1170 | if ( (sect->flags() & S_ATTR_LOC_RELOC) != 0 ) { | |
1171 | if ( ! hasTextRelocInRange(sect->addr(), sect->addr()+sect->size()) ) { | |
1172 | throwf("section %s has attribute set that it has relocs, but it has none", sect->sectname()); | |
1173 | } | |
1174 | } | |
1175 | } | |
1176 | } | |
1177 | cmd = (const macho_load_command<P>*)(((uint8_t*)cmd)+cmd->cmdsize()); | |
1178 | } | |
69a49097 A |
1179 | } |
1180 | ||
a645023d A |
1181 | template <typename A> |
1182 | typename A::P::uint_t MachOChecker<A>::segStartAddress(uint8_t segIndex) | |
1183 | { | |
1184 | if ( segIndex > fSegments.size() ) | |
1185 | throw "segment index out of range"; | |
1186 | return fSegments[segIndex]->vmaddr(); | |
1187 | } | |
1188 | ||
1189 | template <typename A> | |
1190 | bool MachOChecker<A>::hasTextRelocInRange(pint_t rangeStart, pint_t rangeEnd) | |
1191 | { | |
1192 | // look at local relocs | |
1193 | const macho_relocation_info<P>* const localRelocsEnd = &fLocalRelocations[fLocalRelocationsCount]; | |
1194 | for (const macho_relocation_info<P>* reloc = fLocalRelocations; reloc < localRelocsEnd; ++reloc) { | |
1195 | pint_t relocAddress = reloc->r_address() + this->relocBase(); | |
1196 | if ( (rangeStart <= relocAddress) && (relocAddress < rangeEnd) ) | |
1197 | return true; | |
1198 | } | |
1199 | // look rebase info | |
1200 | if ( fDyldInfo != NULL ) { | |
1201 | const uint8_t* p = (uint8_t*)fHeader + fDyldInfo->rebase_off(); | |
1202 | const uint8_t* end = &p[fDyldInfo->rebase_size()]; | |
1203 | ||
1204 | uint8_t type = 0; | |
1205 | uint64_t segOffset = 0; | |
1206 | uint32_t count; | |
1207 | uint32_t skip; | |
1208 | int segIndex; | |
1209 | pint_t segStartAddr = 0; | |
1210 | pint_t addr; | |
1211 | bool done = false; | |
1212 | while ( !done && (p < end) ) { | |
1213 | uint8_t immediate = *p & REBASE_IMMEDIATE_MASK; | |
1214 | uint8_t opcode = *p & REBASE_OPCODE_MASK; | |
1215 | ++p; | |
1216 | switch (opcode) { | |
1217 | case REBASE_OPCODE_DONE: | |
1218 | done = true; | |
1219 | break; | |
1220 | case REBASE_OPCODE_SET_TYPE_IMM: | |
1221 | type = immediate; | |
1222 | break; | |
1223 | case REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB: | |
1224 | segIndex = immediate; | |
1225 | segStartAddr = segStartAddress(segIndex); | |
1226 | segOffset = read_uleb128(p, end); | |
1227 | break; | |
1228 | case REBASE_OPCODE_ADD_ADDR_ULEB: | |
1229 | segOffset += read_uleb128(p, end); | |
1230 | break; | |
1231 | case REBASE_OPCODE_ADD_ADDR_IMM_SCALED: | |
1232 | segOffset += immediate*sizeof(pint_t); | |
1233 | break; | |
1234 | case REBASE_OPCODE_DO_REBASE_IMM_TIMES: | |
1235 | for (int i=0; i < immediate; ++i) { | |
1236 | addr = segStartAddr+segOffset; | |
1237 | if ( (rangeStart <= addr) && (addr < rangeEnd) ) | |
1238 | return true; | |
1239 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1240 | segOffset += sizeof(pint_t); | |
1241 | } | |
1242 | break; | |
1243 | case REBASE_OPCODE_DO_REBASE_ULEB_TIMES: | |
1244 | count = read_uleb128(p, end); | |
1245 | for (uint32_t i=0; i < count; ++i) { | |
1246 | addr = segStartAddr+segOffset; | |
1247 | if ( (rangeStart <= addr) && (addr < rangeEnd) ) | |
1248 | return true; | |
1249 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1250 | segOffset += sizeof(pint_t); | |
1251 | } | |
1252 | break; | |
1253 | case REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB: | |
1254 | addr = segStartAddr+segOffset; | |
1255 | if ( (rangeStart <= addr) && (addr < rangeEnd) ) | |
1256 | return true; | |
1257 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1258 | segOffset += read_uleb128(p, end) + sizeof(pint_t); | |
1259 | break; | |
1260 | case REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_ULEB: | |
1261 | count = read_uleb128(p, end); | |
1262 | skip = read_uleb128(p, end); | |
1263 | for (uint32_t i=0; i < count; ++i) { | |
1264 | addr = segStartAddr+segOffset; | |
1265 | if ( (rangeStart <= addr) && (addr < rangeEnd) ) | |
1266 | return true; | |
1267 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1268 | segOffset += skip + sizeof(pint_t); | |
1269 | } | |
1270 | break; | |
1271 | default: | |
1272 | throwf("bad rebase opcode %d", *p); | |
1273 | } | |
1274 | } | |
1275 | } | |
1276 | } | |
69a49097 | 1277 | |
afe874b1 A |
1278 | template <typename A> |
1279 | bool MachOChecker<A>::addressIsRebaseSite(pint_t targetAddr) | |
1280 | { | |
1281 | // look at local relocs | |
1282 | const macho_relocation_info<P>* const localRelocsEnd = &fLocalRelocations[fLocalRelocationsCount]; | |
1283 | for (const macho_relocation_info<P>* reloc = fLocalRelocations; reloc < localRelocsEnd; ++reloc) { | |
1284 | pint_t relocAddress = reloc->r_address() + this->relocBase(); | |
1285 | if ( relocAddress == targetAddr ) | |
1286 | return true; | |
1287 | } | |
1288 | // look rebase info | |
1289 | if ( fDyldInfo != NULL ) { | |
1290 | const uint8_t* p = (uint8_t*)fHeader + fDyldInfo->rebase_off(); | |
1291 | const uint8_t* end = &p[fDyldInfo->rebase_size()]; | |
1292 | ||
1293 | uint8_t type = 0; | |
1294 | uint64_t segOffset = 0; | |
1295 | uint32_t count; | |
1296 | uint32_t skip; | |
1297 | int segIndex; | |
1298 | pint_t segStartAddr = 0; | |
1299 | pint_t addr; | |
1300 | bool done = false; | |
1301 | while ( !done && (p < end) ) { | |
1302 | uint8_t immediate = *p & REBASE_IMMEDIATE_MASK; | |
1303 | uint8_t opcode = *p & REBASE_OPCODE_MASK; | |
1304 | ++p; | |
1305 | switch (opcode) { | |
1306 | case REBASE_OPCODE_DONE: | |
1307 | done = true; | |
1308 | break; | |
1309 | case REBASE_OPCODE_SET_TYPE_IMM: | |
1310 | type = immediate; | |
1311 | break; | |
1312 | case REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB: | |
1313 | segIndex = immediate; | |
1314 | segStartAddr = segStartAddress(segIndex); | |
1315 | segOffset = read_uleb128(p, end); | |
1316 | break; | |
1317 | case REBASE_OPCODE_ADD_ADDR_ULEB: | |
1318 | segOffset += read_uleb128(p, end); | |
1319 | break; | |
1320 | case REBASE_OPCODE_ADD_ADDR_IMM_SCALED: | |
1321 | segOffset += immediate*sizeof(pint_t); | |
1322 | break; | |
1323 | case REBASE_OPCODE_DO_REBASE_IMM_TIMES: | |
1324 | for (int i=0; i < immediate; ++i) { | |
1325 | addr = segStartAddr+segOffset; | |
1326 | if ( addr == targetAddr ) | |
1327 | return true; | |
1328 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1329 | segOffset += sizeof(pint_t); | |
1330 | } | |
1331 | break; | |
1332 | case REBASE_OPCODE_DO_REBASE_ULEB_TIMES: | |
1333 | count = read_uleb128(p, end); | |
1334 | for (uint32_t i=0; i < count; ++i) { | |
1335 | addr = segStartAddr+segOffset; | |
1336 | if ( addr == targetAddr ) | |
1337 | return true; | |
1338 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1339 | segOffset += sizeof(pint_t); | |
1340 | } | |
1341 | break; | |
1342 | case REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB: | |
1343 | addr = segStartAddr+segOffset; | |
1344 | if ( addr == targetAddr ) | |
1345 | return true; | |
1346 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1347 | segOffset += read_uleb128(p, end) + sizeof(pint_t); | |
1348 | break; | |
1349 | case REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_ULEB: | |
1350 | count = read_uleb128(p, end); | |
1351 | skip = read_uleb128(p, end); | |
1352 | for (uint32_t i=0; i < count; ++i) { | |
1353 | addr = segStartAddr+segOffset; | |
1354 | if ( addr == targetAddr ) | |
1355 | return true; | |
1356 | //printf("%-7s %-16s 0x%08llX %s\n", segName, sectionName(segIndex, segStartAddr+segOffset), segStartAddr+segOffset, typeName); | |
1357 | segOffset += skip + sizeof(pint_t); | |
1358 | } | |
1359 | break; | |
1360 | default: | |
1361 | throwf("bad rebase opcode %d", *p); | |
1362 | } | |
1363 | } | |
1364 | } | |
1365 | return false; | |
1366 | } | |
1367 | ||
1368 | ||
1369 | template <typename A> | |
1370 | bool MachOChecker<A>::addressIsBindingSite(pint_t targetAddr) | |
1371 | { | |
1372 | // look at external relocs | |
1373 | const macho_relocation_info<P>* const externRelocsEnd = &fExternalRelocations[fExternalRelocationsCount]; | |
1374 | for (const macho_relocation_info<P>* reloc = fExternalRelocations; reloc < externRelocsEnd; ++reloc) { | |
1375 | pint_t relocAddress = reloc->r_address() + this->relocBase(); | |
1376 | if ( relocAddress == targetAddr ) | |
1377 | return true; | |
1378 | } | |
1379 | // look bind info | |
1380 | if ( fDyldInfo != NULL ) { | |
1381 | const uint8_t* p = (uint8_t*)fHeader + fDyldInfo->bind_off(); | |
1382 | const uint8_t* end = &p[fDyldInfo->bind_size()]; | |
1383 | ||
1384 | uint8_t type = 0; | |
1385 | uint64_t segOffset = 0; | |
1386 | uint32_t count; | |
1387 | uint32_t skip; | |
1388 | uint8_t flags; | |
1389 | const char* symbolName = NULL; | |
1390 | int libraryOrdinal = 0; | |
1391 | int segIndex; | |
1392 | int64_t addend = 0; | |
1393 | pint_t segStartAddr = 0; | |
1394 | pint_t addr; | |
1395 | bool done = false; | |
1396 | while ( !done && (p < end) ) { | |
1397 | uint8_t immediate = *p & BIND_IMMEDIATE_MASK; | |
1398 | uint8_t opcode = *p & BIND_OPCODE_MASK; | |
1399 | ++p; | |
1400 | switch (opcode) { | |
1401 | case BIND_OPCODE_DONE: | |
1402 | done = true; | |
1403 | break; | |
1404 | case BIND_OPCODE_SET_DYLIB_ORDINAL_IMM: | |
1405 | libraryOrdinal = immediate; | |
1406 | break; | |
1407 | case BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB: | |
1408 | libraryOrdinal = read_uleb128(p, end); | |
1409 | break; | |
1410 | case BIND_OPCODE_SET_DYLIB_SPECIAL_IMM: | |
1411 | // the special ordinals are negative numbers | |
1412 | if ( immediate == 0 ) | |
1413 | libraryOrdinal = 0; | |
1414 | else { | |
1415 | int8_t signExtended = BIND_OPCODE_MASK | immediate; | |
1416 | libraryOrdinal = signExtended; | |
1417 | } | |
1418 | break; | |
1419 | case BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM: | |
1420 | symbolName = (char*)p; | |
1421 | while (*p != '\0') | |
1422 | ++p; | |
1423 | ++p; | |
1424 | break; | |
1425 | case BIND_OPCODE_SET_TYPE_IMM: | |
1426 | type = immediate; | |
1427 | break; | |
1428 | case BIND_OPCODE_SET_ADDEND_SLEB: | |
1429 | addend = read_sleb128(p, end); | |
1430 | break; | |
1431 | case BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB: | |
1432 | segIndex = immediate; | |
1433 | segStartAddr = segStartAddress(segIndex); | |
1434 | segOffset = read_uleb128(p, end); | |
1435 | break; | |
1436 | case BIND_OPCODE_ADD_ADDR_ULEB: | |
1437 | segOffset += read_uleb128(p, end); | |
1438 | break; | |
1439 | case BIND_OPCODE_DO_BIND: | |
1440 | if ( (segStartAddr+segOffset) == targetAddr ) | |
1441 | return true; | |
1442 | segOffset += sizeof(pint_t); | |
1443 | break; | |
1444 | case BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB: | |
1445 | if ( (segStartAddr+segOffset) == targetAddr ) | |
1446 | return true; | |
1447 | segOffset += read_uleb128(p, end) + sizeof(pint_t); | |
1448 | break; | |
1449 | case BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED: | |
1450 | if ( (segStartAddr+segOffset) == targetAddr ) | |
1451 | return true; | |
1452 | segOffset += immediate*sizeof(pint_t) + sizeof(pint_t); | |
1453 | break; | |
1454 | case BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB: | |
1455 | count = read_uleb128(p, end); | |
1456 | skip = read_uleb128(p, end); | |
1457 | for (uint32_t i=0; i < count; ++i) { | |
1458 | if ( (segStartAddr+segOffset) == targetAddr ) | |
1459 | return true; | |
1460 | segOffset += skip + sizeof(pint_t); | |
1461 | } | |
1462 | break; | |
1463 | default: | |
1464 | throwf("bad bind opcode %d", *p); | |
1465 | } | |
1466 | } | |
1467 | } | |
1468 | return false; | |
1469 | } | |
1470 | ||
1471 | ||
d696c285 A |
1472 | static void check(const char* path) |
1473 | { | |
1474 | struct stat stat_buf; | |
1475 | ||
1476 | try { | |
1477 | int fd = ::open(path, O_RDONLY, 0); | |
1478 | if ( fd == -1 ) | |
1479 | throw "cannot open file"; | |
55e3d2f6 A |
1480 | if ( ::fstat(fd, &stat_buf) != 0 ) |
1481 | throwf("fstat(%s) failed, errno=%d\n", path, errno); | |
d696c285 | 1482 | uint32_t length = stat_buf.st_size; |
69a49097 A |
1483 | uint8_t* p = (uint8_t*)::mmap(NULL, stat_buf.st_size, PROT_READ, MAP_FILE | MAP_PRIVATE, fd, 0); |
1484 | if ( p == ((uint8_t*)(-1)) ) | |
1485 | throw "cannot map file"; | |
d696c285 A |
1486 | ::close(fd); |
1487 | const mach_header* mh = (mach_header*)p; | |
1488 | if ( mh->magic == OSSwapBigToHostInt32(FAT_MAGIC) ) { | |
1489 | const struct fat_header* fh = (struct fat_header*)p; | |
1490 | const struct fat_arch* archs = (struct fat_arch*)(p + sizeof(struct fat_header)); | |
a61fdf0a A |
1491 | for (unsigned long i=0; i < OSSwapBigToHostInt32(fh->nfat_arch); ++i) { |
1492 | size_t offset = OSSwapBigToHostInt32(archs[i].offset); | |
1493 | size_t size = OSSwapBigToHostInt32(archs[i].size); | |
1494 | unsigned int cputype = OSSwapBigToHostInt32(archs[i].cputype); | |
1495 | ||
1496 | switch(cputype) { | |
1497 | case CPU_TYPE_POWERPC: | |
1498 | if ( MachOChecker<ppc>::validFile(p + offset) ) | |
1499 | MachOChecker<ppc>::make(p + offset, size, path); | |
d696c285 A |
1500 | else |
1501 | throw "in universal file, ppc slice does not contain ppc mach-o"; | |
a61fdf0a A |
1502 | break; |
1503 | case CPU_TYPE_I386: | |
1504 | if ( MachOChecker<x86>::validFile(p + offset) ) | |
1505 | MachOChecker<x86>::make(p + offset, size, path); | |
d696c285 A |
1506 | else |
1507 | throw "in universal file, i386 slice does not contain i386 mach-o"; | |
a61fdf0a A |
1508 | break; |
1509 | case CPU_TYPE_POWERPC64: | |
1510 | if ( MachOChecker<ppc64>::validFile(p + offset) ) | |
1511 | MachOChecker<ppc64>::make(p + offset, size, path); | |
d696c285 A |
1512 | else |
1513 | throw "in universal file, ppc64 slice does not contain ppc64 mach-o"; | |
a61fdf0a A |
1514 | break; |
1515 | case CPU_TYPE_X86_64: | |
1516 | if ( MachOChecker<x86_64>::validFile(p + offset) ) | |
1517 | MachOChecker<x86_64>::make(p + offset, size, path); | |
69a49097 A |
1518 | else |
1519 | throw "in universal file, x86_64 slice does not contain x86_64 mach-o"; | |
a61fdf0a | 1520 | break; |
2f2f92e4 A |
1521 | case CPU_TYPE_ARM: |
1522 | if ( MachOChecker<arm>::validFile(p + offset) ) | |
1523 | MachOChecker<arm>::make(p + offset, size, path); | |
1524 | else | |
1525 | throw "in universal file, arm slice does not contain arm mach-o"; | |
1526 | break; | |
a61fdf0a A |
1527 | default: |
1528 | throwf("in universal file, unknown architecture slice 0x%x\n", cputype); | |
d696c285 A |
1529 | } |
1530 | } | |
1531 | } | |
1532 | else if ( MachOChecker<x86>::validFile(p) ) { | |
1533 | MachOChecker<x86>::make(p, length, path); | |
1534 | } | |
1535 | else if ( MachOChecker<ppc>::validFile(p) ) { | |
1536 | MachOChecker<ppc>::make(p, length, path); | |
1537 | } | |
1538 | else if ( MachOChecker<ppc64>::validFile(p) ) { | |
1539 | MachOChecker<ppc64>::make(p, length, path); | |
1540 | } | |
69a49097 A |
1541 | else if ( MachOChecker<x86_64>::validFile(p) ) { |
1542 | MachOChecker<x86_64>::make(p, length, path); | |
1543 | } | |
2f2f92e4 A |
1544 | else if ( MachOChecker<arm>::validFile(p) ) { |
1545 | MachOChecker<arm>::make(p, length, path); | |
1546 | } | |
d696c285 A |
1547 | else { |
1548 | throw "not a known file type"; | |
1549 | } | |
1550 | } | |
1551 | catch (const char* msg) { | |
1552 | throwf("%s in %s", msg, path); | |
1553 | } | |
1554 | } | |
1555 | ||
1556 | ||
1557 | int main(int argc, const char* argv[]) | |
1558 | { | |
afe874b1 A |
1559 | bool progress = false; |
1560 | int result = 0; | |
1561 | for(int i=1; i < argc; ++i) { | |
1562 | const char* arg = argv[i]; | |
1563 | if ( arg[0] == '-' ) { | |
1564 | if ( strcmp(arg, "-progress") == 0 ) { | |
1565 | progress = true; | |
d696c285 A |
1566 | } |
1567 | else { | |
afe874b1 A |
1568 | throwf("unknown option: %s\n", arg); |
1569 | } | |
1570 | } | |
1571 | else { | |
1572 | bool success = true; | |
1573 | try { | |
d696c285 A |
1574 | check(arg); |
1575 | } | |
afe874b1 A |
1576 | catch (const char* msg) { |
1577 | fprintf(stderr, "machocheck failed: %s %s\n", arg, msg); | |
1578 | result = 1; | |
1579 | success = false; | |
1580 | } | |
1581 | if ( success && progress ) | |
1582 | printf("ok: %s\n", arg); | |
d696c285 A |
1583 | } |
1584 | } | |
d696c285 | 1585 | |
afe874b1 | 1586 | return result; |
d696c285 A |
1587 | } |
1588 | ||
1589 | ||
1590 |