1 /* -*- mode: C++; c-basic-offset: 4; tab-width: 4 -*-
3 * Copyright (c) 2004-2010 Apple Inc. All rights reserved.
5 * @APPLE_LICENSE_HEADER_START@
7 * This file contains Original Code and/or Modifications of Original Code
8 * as defined in and that are subject to the Apple Public Source License
9 * Version 2.0 (the 'License'). You may not use this file except in
10 * compliance with the License. Please obtain a copy of the License at
11 * http://www.opensource.apple.com/apsl/ and read it before using this
14 * The Original Code and all software distributed under the License are
15 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
16 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
17 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
19 * Please see the License for the specific language governing rights and
20 * limitations under the License.
22 * @APPLE_LICENSE_HEADER_END@
25 // work around until conformance work is complete rdar://problem/4508801
34 #include <sys/types.h>
35 #include <sys/fcntl.h>
38 #include <mach/mach.h>
39 #include <mach/thread_status.h>
40 #include <mach-o/loader.h>
41 #include <mach-o/reloc.h>
42 #include <mach-o/nlist.h>
43 #include <sys/sysctl.h>
44 #include <libkern/OSAtomic.h>
45 #include <libkern/OSCacheControl.h>
48 #include <mach-o/x86_64/reloc.h>
51 #include <mach-o/arm/reloc.h>
54 #include "ImageLoaderMachOClassic.h"
55 #include "mach-o/dyld_images.h"
58 extern "C" void stub_binding_helper_i386_old();
// Relocation type used for plain pointer fixups.
// NOTE(review): two alternative definitions follow; the preprocessor
// conditional that selects between them is not visible in this view - confirm.
62 #define POINTER_RELOC X86_64_RELOC_UNSIGNED
64 #define POINTER_RELOC GENERIC_RELOC_VANILLA
68 // relocation_info.r_length field has value 3 for 64-bit executables and value 2 for 32-bit executables
// Variant that maps the generic macho_* names onto the *_64 load commands and structures.
71 #define LC_SEGMENT_COMMAND LC_SEGMENT_64
72 #define LC_ROUTINES_COMMAND LC_ROUTINES_64
73 struct macho_segment_command
: public segment_command_64
{};
74 struct macho_section
: public section_64
{};
75 struct macho_routines_command
: public routines_command_64
{};
// Variant that maps the same generic names onto the non-_64 load commands and structures.
// NOTE(review): this re-defines the names above, so the two groups must be
// mutually exclusive; the selecting conditional is not visible here.
78 #define LC_SEGMENT_COMMAND LC_SEGMENT
79 #define LC_ROUTINES_COMMAND LC_ROUTINES
80 struct macho_segment_command
: public segment_command
{};
81 struct macho_section
: public section
{};
82 struct macho_routines_command
: public routines_command
{};
88 // create image for main executable
89 ImageLoaderMachOClassic
* ImageLoaderMachOClassic::instantiateMainExecutable(const macho_header
* mh
, uintptr_t slide
, const char* path
,
90 unsigned int segCount
, unsigned int libCount
, const LinkContext
& context
)
92 ImageLoaderMachOClassic
* image
= ImageLoaderMachOClassic::instantiateStart(mh
, path
, segCount
, libCount
);
94 // set slide for PIE programs
95 image
->setSlide(slide
);
97 // for PIE record end of program, to know where to start loading dylibs
99 fgNextPIEDylibAddress
= (uintptr_t)image
->getEnd();
101 image
->disableCoverageCheck();
102 image
->instantiateFinish(context
);
103 image
->setMapped(context
);
106 // kernel may have mapped in __IMPORT segment read-only, we need it read/write to do binding
107 if ( image
->fReadOnlyImportSegment
) {
108 for(unsigned int i
=0; i
< image
->fSegmentsCount
; ++i
) {
109 if ( image
->segIsReadOnlyImport(i
) )
110 image
->segMakeWritable(i
, context
);
115 if ( context
.verboseMapping
) {
116 dyld::log("dyld: Main executable mapped %s\n", path
);
117 for(unsigned int i
=0, e
=image
->segmentCount(); i
< e
; ++i
) {
118 const char* name
= image
->segName(i
);
119 if ( (strcmp(name
, "__PAGEZERO") == 0) || (strcmp(name
, "__UNIXSTACK") == 0) )
120 dyld::log("%18s at 0x%08lX->0x%08lX\n", name
, image
->segPreferredLoadAddress(i
), image
->segPreferredLoadAddress(i
)+image
->segSize(i
));
122 dyld::log("%18s at 0x%08lX->0x%08lX\n", name
, image
->segActualLoadAddress(i
), image
->segActualEndAddress(i
));
129 // create image by mapping in a mach-o file
130 ImageLoaderMachOClassic
* ImageLoaderMachOClassic::instantiateFromFile(const char* path
, int fd
, const uint8_t* fileData
, size_t lenFileData
,
131 uint64_t offsetInFat
, uint64_t lenInFat
, const struct stat
& info
,
132 unsigned int segCount
, unsigned int libCount
,
133 const struct linkedit_data_command
* codeSigCmd
, const LinkContext
& context
)
135 ImageLoaderMachOClassic
* image
= ImageLoaderMachOClassic::instantiateStart((macho_header
*)fileData
, path
, segCount
, libCount
);
137 // record info about file
138 image
->setFileInfo(info
.st_dev
, info
.st_ino
, info
.st_mtime
);
140 // if this image is code signed, let kernel validate signature before mapping any pages from image
141 image
->loadCodeSignature(codeSigCmd
, fd
, offsetInFat
, context
);
143 // Validate that first data we read with pread actually matches with code signature
144 image
->validateFirstPages(codeSigCmd
, fd
, fileData
, lenFileData
, offsetInFat
, context
);
147 image
->mapSegmentsClassic(fd
, offsetInFat
, lenInFat
, info
.st_size
, context
);
150 image
->instantiateFinish(context
);
152 // if path happens to be same as in LC_DYLIB_ID load command use that, otherwise malloc a copy of the path
153 const char* installName
= image
->getInstallPath();
154 if ( (installName
!= NULL
) && (strcmp(installName
, path
) == 0) && (path
[0] == '/') )
155 image
->setPathUnowned(installName
);
156 else if ( (path
[0] != '/') || (strstr(path
, "../") != NULL
) ) {
157 // rdar://problem/10733082 Fix up @path based paths during introspection
158 // rdar://problem/5135363 turn relative paths into absolute paths so gdb, Symbolication can later find them
159 char realPath
[MAXPATHLEN
];
160 if ( fcntl(fd
, F_GETPATH
, realPath
) == 0 )
161 image
->setPaths(path
, realPath
);
163 image
->setPath(path
);
166 image
->setPath(path
);
168 // make sure path is stable before recording in dyld_all_image_infos
169 image
->setMapped(context
);
171 // pre-fetch content of __DATA segment for faster launches
172 // don't do this on prebound images or if prefetching is disabled
173 if ( !context
.preFetchDisabled
&& !image
->isPrebindable())
174 image
->preFetchDATA(fd
, offsetInFat
, context
);
178 // ImageLoader::setMapped() can throw an exception to block loading of image
179 // <rdar://problem/6169686> Leaked fSegmentsArray and image segments during failed dlopen_preflight
187 // create image by using cached mach-o file
188 ImageLoaderMachOClassic
* ImageLoaderMachOClassic::instantiateFromCache(const macho_header
* mh
, const char* path
, long slide
, const struct stat
& info
,
189 unsigned int segCount
, unsigned int libCount
, const LinkContext
& context
)
191 ImageLoaderMachOClassic
* image
= ImageLoaderMachOClassic::instantiateStart(mh
, path
, segCount
, libCount
);
193 // record info about file
194 image
->setFileInfo(info
.st_dev
, info
.st_ino
, info
.st_mtime
);
196 // remember this is from shared cache and cannot be unloaded
197 image
->fInSharedCache
= true;
198 image
->setNeverUnload();
199 image
->disableCoverageCheck();
201 // segments already mapped in cache
202 if ( context
.verboseMapping
) {
203 dyld::log("dyld: Using shared cached for %s\n", path
);
204 for(unsigned int i
=0, e
=image
->segmentCount(); i
< e
; ++i
) {
205 dyld::log("%18s at 0x%08lX->0x%08lX\n", image
->segName(i
), image
->segActualLoadAddress(i
), image
->segActualEndAddress(i
));
209 image
->instantiateFinish(context
);
210 image
->setMapped(context
);
213 // ImageLoader::setMapped() can throw an exception to block loading of image
214 // <rdar://problem/6169686> Leaked fSegmentsArray and image segments during failed dlopen_preflight
222 // create image by copying an in-memory mach-o file
223 ImageLoaderMachOClassic
* ImageLoaderMachOClassic::instantiateFromMemory(const char* moduleName
, const macho_header
* mh
, uint64_t len
,
224 unsigned int segCount
, unsigned int libCount
, const LinkContext
& context
)
226 ImageLoaderMachOClassic
* image
= ImageLoaderMachOClassic::instantiateStart(mh
, moduleName
, segCount
, libCount
);
229 if ( mh
->filetype
== MH_EXECUTE
)
230 throw "can't load another MH_EXECUTE";
233 image
->ImageLoaderMachO::mapSegments((const void*)mh
, len
, context
);
235 // for compatibility, never unload dylibs loaded from memory
236 image
->setNeverUnload();
238 image
->disableCoverageCheck();
240 // bundle loads need path copied
241 if ( moduleName
!= NULL
)
242 image
->setPath(moduleName
);
244 image
->instantiateFinish(context
);
245 image
->setMapped(context
);
248 // ImageLoader::setMapped() can throw an exception to block loading of image
249 // <rdar://problem/6169686> Leaked fSegmentsArray and image segments during failed dlopen_preflight
258 ImageLoaderMachOClassic::ImageLoaderMachOClassic(const macho_header
* mh
, const char* path
,
259 unsigned int segCount
, uint32_t segOffsets
[], unsigned int libCount
)
260 : ImageLoaderMachO(mh
, path
, segCount
, segOffsets
, libCount
), fStrings(NULL
), fSymbolTable(NULL
), fDynamicInfo(NULL
)
264 // construct ImageLoaderMachOClassic using "placement new" with SegmentMachO objects array at end
265 ImageLoaderMachOClassic
* ImageLoaderMachOClassic::instantiateStart(const macho_header
* mh
, const char* path
,
266 unsigned int segCount
, unsigned int libCount
)
268 size_t size
= sizeof(ImageLoaderMachOClassic
) + segCount
* sizeof(uint32_t) + libCount
* sizeof(ImageLoader
*);
269 ImageLoaderMachOClassic
* allocatedSpace
= static_cast<ImageLoaderMachOClassic
*>(malloc(size
));
270 if ( allocatedSpace
== NULL
)
271 throw "malloc failed";
272 uint32_t* segOffsets
= ((uint32_t*)(((uint8_t*)allocatedSpace
) + sizeof(ImageLoaderMachOClassic
)));
273 bzero(&segOffsets
[segCount
], libCount
*sizeof(void*)); // zero out lib array
274 return new (allocatedSpace
) ImageLoaderMachOClassic(mh
, path
, segCount
, segOffsets
, libCount
);
279 // common code to finish initializing object
280 void ImageLoaderMachOClassic::instantiateFinish(const LinkContext
& context
)
282 // now that segments are mapped in, get real fMachOData, fLinkEditBase, and fSlide
283 this->parseLoadCmds(context
);
// Destructor.
// NOTE(review): the body is not visible in this view. Per the comment below,
// cleanup that needs segmentCommandOffsets() is expected to happen here rather
// than in the base-class destructor - confirm against the original file.
286 ImageLoaderMachOClassic::~ImageLoaderMachOClassic()
288 // don't do clean up in ~ImageLoaderMachO() because virtual call to segmentCommandOffsets() won't work
292 uint32_t* ImageLoaderMachOClassic::segmentCommandOffsets() const
294 return ((uint32_t*)(((uint8_t*)this) + sizeof(ImageLoaderMachOClassic
)));
298 ImageLoader
* ImageLoaderMachOClassic::libImage(unsigned int libIndex
) const
300 const uintptr_t* images
= ((uintptr_t*)(((uint8_t*)this) + sizeof(ImageLoaderMachOClassic
) + fSegmentsCount
*sizeof(uint32_t)));
302 return (ImageLoader
*)(images
[libIndex
] & (-4));
305 bool ImageLoaderMachOClassic::libReExported(unsigned int libIndex
) const
307 const uintptr_t* images
= ((uintptr_t*)(((uint8_t*)this) + sizeof(ImageLoaderMachOClassic
) + fSegmentsCount
*sizeof(uint32_t)));
308 // re-export flag is low bit
309 return ((images
[libIndex
] & 1) != 0);
312 bool ImageLoaderMachOClassic::libIsUpward(unsigned int libIndex
) const
314 const uintptr_t* images
= ((uintptr_t*)(((uint8_t*)this) + sizeof(ImageLoaderMachOClassic
) + fSegmentsCount
*sizeof(uint32_t)));
315 // upward flag is second bit
316 return ((images
[libIndex
] & 2) != 0);
320 void ImageLoaderMachOClassic::setLibImage(unsigned int libIndex
, ImageLoader
* image
, bool reExported
, bool upward
)
322 uintptr_t* images
= ((uintptr_t*)(((uint8_t*)this) + sizeof(ImageLoaderMachOClassic
) + fSegmentsCount
*sizeof(uint32_t)));
323 uintptr_t value
= (uintptr_t)image
;
328 images
[libIndex
] = value
;
332 void ImageLoaderMachOClassic::setSymbolTableInfo(const macho_nlist
* symbols
, const char* strings
, const dysymtab_command
* dynSym
)
334 fSymbolTable
= symbols
;
336 fDynamicInfo
= dynSym
;
339 void ImageLoaderMachOClassic::prefetchLINKEDIT(const LinkContext
& context
)
341 // always prefetch a subrange of __LINKEDIT pages
342 uintptr_t symbolTableStart
= (uintptr_t)fSymbolTable
;
343 uintptr_t stringTableStart
= (uintptr_t)fStrings
;
345 // if image did not load at preferred address
346 if ( segPreferredLoadAddress(0) != (uintptr_t)fMachOData
) {
347 // local relocations will be processed, so start pre-fetch at local symbols
348 start
= (uintptr_t)fMachOData
+ fDynamicInfo
->locreloff
;
351 // otherwise start pre-fetch at global symbols section of symbol table
352 start
= symbolTableStart
+ fDynamicInfo
->iextdefsym
* sizeof(macho_nlist
);
354 // prefetch ends at end of last undefined string in string pool
355 uintptr_t end
= stringTableStart
;
356 if ( fDynamicInfo
->nundefsym
!= 0 )
357 end
+= fSymbolTable
[fDynamicInfo
->iundefsym
+fDynamicInfo
->nundefsym
-1].n_un
.n_strx
;
358 else if ( fDynamicInfo
->nextdefsym
!= 0 )
359 end
+= fSymbolTable
[fDynamicInfo
->iextdefsym
+fDynamicInfo
->nextdefsym
-1].n_un
.n_strx
;
361 // round to whole pages
362 start
= dyld_page_trunc(start
);
363 end
= dyld_page_round(end
);
365 // skip if there is only one page
366 if ( (end
-start
) > dyld_page_size
) {
367 madvise((void*)start
, end
-start
, MADV_WILLNEED
);
368 fgTotalBytesPreFetched
+= (end
-start
);
369 if ( context
.verboseMapping
) {
370 dyld::log("%18s prefetching 0x%0lX -> 0x%0lX\n", "__LINKEDIT", start
, end
-1);
376 #if SPLIT_SEG_DYLIB_SUPPORT
378 ImageLoaderMachOClassic::getExtraZeroFillEntriesCount()
380 // calculate mapping entries
381 unsigned int extraZeroFillEntries
= 0;
382 for(unsigned int i
=0; i
< fSegmentsCount
; ++i
) {
383 if ( segHasTrailingZeroFill(i
) )
384 ++extraZeroFillEntries
;
387 return extraZeroFillEntries
;
391 ImageLoaderMachOClassic::initMappingTable(uint64_t offsetInFat
,
392 shared_file_mapping_np
*mappingTable
)
394 for(unsigned int i
=0,entryIndex
=0; i
< fSegmentsCount
; ++i
, ++entryIndex
) {
395 shared_file_mapping_np
* entry
= &mappingTable
[entryIndex
];
396 entry
->sfm_address
= segActualLoadAddress(i
);
397 entry
->sfm_size
= segFileSize(i
);
398 entry
->sfm_file_offset
= segFileOffset(i
) + offsetInFat
;
399 entry
->sfm_init_prot
= VM_PROT_NONE
;
400 if ( !segUnaccessible(i
) ) {
401 if ( segExecutable(i
) )
402 entry
->sfm_init_prot
|= VM_PROT_EXECUTE
;
403 if ( segReadable(i
) )
404 entry
->sfm_init_prot
|= VM_PROT_READ
;
405 if ( segWriteable(i
) )
406 entry
->sfm_init_prot
|= VM_PROT_WRITE
| VM_PROT_COW
;
408 entry
->sfm_max_prot
= entry
->sfm_init_prot
;
409 if ( segHasTrailingZeroFill(i
) ) {
410 shared_file_mapping_np
* zfentry
= &mappingTable
[++entryIndex
];
411 zfentry
->sfm_address
= entry
->sfm_address
+ segFileSize(i
);
412 zfentry
->sfm_size
= segSize(i
) - segFileSize(i
);
413 zfentry
->sfm_file_offset
= 0;
414 zfentry
->sfm_init_prot
= entry
->sfm_init_prot
| VM_PROT_COW
| VM_PROT_ZF
;
415 zfentry
->sfm_max_prot
= zfentry
->sfm_init_prot
;
// Maps a split-seg dylib at an address outside the shared region.
//
// Visible steps:
//   1. Build a mapping table (one entry per segment plus the extra zero-fill
//      entries) with initMappingTable().
//   2. Probe candidate base addresses with vm_allocate(), keeping the regions
//      at the same distance from regions[0]. Partial allocations are released,
//      the candidate advances 1MB at a time and steps over
//      [SHARED_REGION_BASE, SHARED_REGION_BASE+SHARED_REGION_SIZE); past
//      0xFF000000 it throws "can't map split seg anywhere".
//   3. Record the slide with setSlide() and mmap() each entry that is not
//      zero-fill and not empty, using MAP_FIXED | MAP_PRIVATE.
//   4. Log the layout when context.verboseMapping is set.
//
// NOTE(review): the return type, some parameters, the declarations of `r` and
// `protection`, and the failure checks are not visible in this view.
// NOTE(review): `®ions` below looks like a mis-encoded `&regions` - confirm
// against the original file.
421 ImageLoaderMachOClassic::mapSplitSegDylibOutsideSharedRegion(int fd
,
422 uint64_t offsetInFat
,
425 const LinkContext
& context
)
427 uintptr_t nextAltLoadAddress
= 0;
428 const unsigned int segmentCount
= fSegmentsCount
;
429 const unsigned int extraZeroFillEntries
= getExtraZeroFillEntriesCount();
430 const unsigned int regionCount
= segmentCount
+extraZeroFillEntries
;
431 shared_file_mapping_np regions
[regionCount
];
432 initMappingTable(offsetInFat
, regions
);
434 // find space somewhere to allocate split seg
435 bool foundRoom
= false;
436 while ( ! foundRoom
) {
438 for(unsigned int i
=0; i
< regionCount
; ++i
) {
439 vm_address_t addr
= (vm_address_t
)(nextAltLoadAddress
+ regions
[i
].sfm_address
- regions
[0].sfm_address
);
440 vm_size_t size
= (vm_size_t
)regions
[i
].sfm_size
;
441 r
= vm_allocate(mach_task_self(), &addr
, size
, false /*only this range*/);
443 // no room here, deallocate what has succeeded so far
444 for(unsigned int j
=0; j
< i
; ++j
) {
445 addr
= (vm_address_t
)(nextAltLoadAddress
+ regions
[j
].sfm_address
- regions
[0].sfm_address
);
446 size
= (vm_size_t
)(regions
[j
].sfm_size
);
447 (void)vm_deallocate(mach_task_self(), addr
, size
);
449 nextAltLoadAddress
+= 0x00100000; // skip ahead 1MB and try again
450 // skip over shared region
451 if ( (SHARED_REGION_BASE
<= nextAltLoadAddress
) && (nextAltLoadAddress
< (SHARED_REGION_BASE
+ SHARED_REGION_SIZE
)) )
452 nextAltLoadAddress
= (SHARED_REGION_BASE
+ SHARED_REGION_SIZE
);
453 if ( nextAltLoadAddress
> 0xFF000000 )
454 throw "can't map split seg anywhere";
461 // map in each region
462 uintptr_t slide
= (uintptr_t)(nextAltLoadAddress
- regions
[0].sfm_address
);
463 this->setSlide(slide
);
464 for(unsigned int i
=0; i
< regionCount
; ++i
) {
465 if ( ((regions
[i
].sfm_init_prot
& VM_PROT_ZF
) != 0) || (regions
[i
].sfm_size
== 0) ) {
466 // nothing to mmap for zero-fills areas, they are just vm_allocated
469 void* mmapAddress
= (void*)(uintptr_t)(regions
[i
].sfm_address
+ slide
);
470 size_t size
= (size_t)regions
[i
].sfm_size
;
// translate the VM_PROT_* bits of the entry into PROT_* bits for mmap()
472 if ( regions
[i
].sfm_init_prot
& VM_PROT_EXECUTE
)
473 protection
|= PROT_EXEC
;
474 if ( regions
[i
].sfm_init_prot
& VM_PROT_READ
)
475 protection
|= PROT_READ
;
476 if ( regions
[i
].sfm_init_prot
& VM_PROT_WRITE
)
477 protection
|= PROT_WRITE
;
478 off_t offset
= regions
[i
].sfm_file_offset
;
479 //dyld::log("mmap(%p, 0x%08lX, %s\n", mmapAddress, size, fPath);
480 mmapAddress
= mmap(mmapAddress
, size
, protection
, MAP_FIXED
| MAP_PRIVATE
, fd
, offset
);
481 if ( mmapAddress
== ((void*)(-1)) )
487 if ( context
.verboseMapping
) {
488 dyld::log("dyld: Mapping split-seg outside shared region, slid by 0x%08lX %s\n", this->fSlide
, this->getPath());
489 for(unsigned int segIndex
=0,entryIndex
=0; segIndex
< segmentCount
; ++segIndex
, ++entryIndex
){
490 const shared_file_mapping_np
* entry
= ®ions
[entryIndex
];
491 if ( (entry
->sfm_init_prot
& VM_PROT_ZF
) == 0 )
492 dyld::log("%18s at 0x%08lX->0x%08lX\n",
493 segName(segIndex
), segActualLoadAddress(segIndex
), segActualEndAddress(segIndex
)-1);
494 if ( entryIndex
< (regionCount
-1) ) {
495 const shared_file_mapping_np
* nextEntry
= ®ions
[entryIndex
+1];
496 if ( (nextEntry
->sfm_init_prot
& VM_PROT_ZF
) != 0 ) {
497 uint64_t segOffset
= nextEntry
->sfm_address
- entry
->sfm_address
;
498 dyld::log("%18s at 0x%08lX->0x%08lX (zerofill)\n",
499 segName(segIndex
), (uintptr_t)(segActualLoadAddress(segIndex
) + segOffset
), (uintptr_t)(segActualLoadAddress(segIndex
) + segOffset
+ nextEntry
->sfm_size
- 1));
508 #endif // SPLIT_SEG_DYLIB_SUPPORT
// Maps this image's segments from the open file `fd`.
//
// Visible paths:
//   - delegate to ImageLoaderMachO::mapSegments() (non-split segment libraries)
//   - under SPLIT_SEG_SHARED_REGION_SUPPORT, try mapSplitSegDylibInfoSharedRegion()
//     unless context.dyldLoadedAtSameAddressNeededBySharedCache is set
//   - under SPLIT_SEG_DYLIB_SUPPORT, fall back to mapSplitSegDylibOutsideSharedRegion()
//     and throw "mapping error" when it reports a non-zero result
//
// NOTE(review): the condition that selects the non-split path and the closing
// #endif lines are not visible in this view.
511 void ImageLoaderMachOClassic::mapSegmentsClassic(int fd
, uint64_t offsetInFat
, uint64_t lenInFat
, uint64_t fileLen
, const LinkContext
& context
)
513 // non-split segment libraries handled by super class
515 return ImageLoaderMachO::mapSegments(fd
, offsetInFat
, lenInFat
, fileLen
, context
);
517 #if SPLIT_SEG_SHARED_REGION_SUPPORT
518 // don't map split-seg dylibs into shared region if shared cache is in use
519 if ( ! context
.dyldLoadedAtSameAddressNeededBySharedCache
) {
520 // try to map into shared region at preferred address
521 if ( mapSplitSegDylibInfoSharedRegion(fd
, offsetInFat
, lenInFat
, fileLen
, context
) == 0)
524 // if there is a problem, fall into case where we map file somewhere outside the shared region
527 #if SPLIT_SEG_DYLIB_SUPPORT
528 // support old split-seg dylibs by mapping them where ever we find space
529 if ( mapSplitSegDylibOutsideSharedRegion(fd
, offsetInFat
, lenInFat
, fileLen
, context
) != 0 )
531 throw "mapping error";
535 #if SPLIT_SEG_SHARED_REGION_SUPPORT
536 static int _shared_region_map_np(int fd
, uint32_t count
, const shared_file_mapping_np mappings
[])
538 return syscall(295, fd
, count
, mappings
);
// Tries to map a split-seg dylib into the shared region.
//
// Builds the mapping table with initMappingTable(), hands it to
// _shared_region_map_np(), marks the image never-unload, and logs the layout
// when context.verboseMapping is set.
//
// NOTE(review): the return type, some parameters, the check on `r` and the
// return statement are not visible in this view. The caller compares the
// result with 0 - presumably 0 means success; confirm.
542 ImageLoaderMachOClassic::mapSplitSegDylibInfoSharedRegion(int fd
,
543 uint64_t offsetInFat
,
546 const LinkContext
& context
)
548 // build table of segments to map
549 const unsigned int segmentCount
= fSegmentsCount
;
550 const unsigned int extraZeroFillEntries
= getExtraZeroFillEntriesCount();
551 const unsigned int mappingTableCount
= segmentCount
+extraZeroFillEntries
;
552 shared_file_mapping_np mappingTable
[mappingTableCount
];
553 initMappingTable(offsetInFat
, mappingTable
);
555 // try to map it in shared
556 int r
= _shared_region_map_np(fd
, mappingTableCount
, mappingTable
);
558 this->setNeverUnload();
559 if ( context
.verboseMapping
) {
560 dyld::log("dyld: Mapping split-seg shared %s\n", this->getPath());
561 for(unsigned int segIndex
=0,entryIndex
=0; segIndex
< segmentCount
; ++segIndex
, ++entryIndex
){
562 const shared_file_mapping_np
* entry
= &mappingTable
[entryIndex
];
563 if ( (entry
->sfm_init_prot
& VM_PROT_ZF
) == 0 )
564 dyld::log("%18s at 0x%08lX->0x%08lX\n",
565 segName(segIndex
), segActualLoadAddress(segIndex
), segActualEndAddress(segIndex
)-1);
566 if ( entryIndex
< (mappingTableCount
-1) ) {
567 const shared_file_mapping_np
* nextEntry
= &mappingTable
[entryIndex
+1];
568 if ( (nextEntry
->sfm_init_prot
& VM_PROT_ZF
) != 0 ) {
569 uint64_t segOffset
= nextEntry
->sfm_address
- entry
->sfm_address
;
570 dyld::log("%18s at 0x%08lX->0x%08lX\n",
571 segName(segIndex
), (uintptr_t)(segActualLoadAddress(segIndex
) + segOffset
),
572 (uintptr_t)(segActualLoadAddress(segIndex
) + segOffset
+ nextEntry
->sfm_size
- 1));
582 #endif // SPLIT_SEG_SHARED_REGION_SUPPORT
584 // test if this image is re-exported through parent (the image that loaded this one)
585 bool ImageLoaderMachOClassic::isSubframeworkOf(const LinkContext
& context
, const ImageLoader
* parent
) const
588 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
589 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
590 const struct load_command
* cmd
= cmds
;
591 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
592 if (cmd
->cmd
== LC_SUB_FRAMEWORK
) {
593 const struct sub_framework_command
* subf
= (struct sub_framework_command
*)cmd
;
594 const char* exportThruName
= (char*)cmd
+ subf
->umbrella
.offset
;
595 // need to match LC_SUB_FRAMEWORK string against the leaf name of the install location of parent...
596 const char* parentInstallPath
= parent
->getInstallPath();
597 if ( parentInstallPath
!= NULL
) {
598 const char* lastSlash
= strrchr(parentInstallPath
, '/');
599 if ( lastSlash
!= NULL
) {
600 if ( strcmp(&lastSlash
[1], exportThruName
) == 0 )
602 if ( context
.imageSuffix
!= NULL
) {
603 // when DYLD_IMAGE_SUFFIX is used, lastSlash string needs imageSuffix removed from end
604 for(const char* const* suffix
= context
.imageSuffix
; *suffix
!= NULL
; ++suffix
) {
605 char reexportAndSuffix
[strlen(*suffix
)+strlen(exportThruName
)+1];
606 strcpy(reexportAndSuffix
, exportThruName
);
607 strcat(reexportAndSuffix
, *suffix
);
608 if ( strcmp(&lastSlash
[1], reexportAndSuffix
) == 0 )
615 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
621 // test if child is re-exported
622 bool ImageLoaderMachOClassic::hasSubLibrary(const LinkContext
& context
, const ImageLoader
* child
) const
624 if ( fHasSubLibraries
) {
625 // need to match LC_SUB_LIBRARY string against the leaf name (without extension) of the install location of child...
626 const char* childInstallPath
= child
->getInstallPath();
627 if ( childInstallPath
!= NULL
) {
628 const char* lastSlash
= strrchr(childInstallPath
, '/');
629 if ( lastSlash
!= NULL
) {
630 const char* firstDot
= strchr(lastSlash
, '.');
632 if ( firstDot
== NULL
)
633 len
= strlen(lastSlash
);
635 len
= firstDot
-lastSlash
-1;
636 char childLeafName
[len
+1];
637 strncpy(childLeafName
, &lastSlash
[1], len
);
638 childLeafName
[len
] = '\0';
639 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
640 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
641 const struct load_command
* cmd
= cmds
;
642 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
646 const struct sub_library_command
* lib
= (struct sub_library_command
*)cmd
;
647 const char* aSubLibName
= (char*)cmd
+ lib
->sub_library
.offset
;
648 if ( strcmp(aSubLibName
, childLeafName
) == 0 )
650 if ( context
.imageSuffix
!= NULL
) {
651 // when DYLD_IMAGE_SUFFIX is used, childLeafName string needs imageSuffix removed from end
652 for(const char* const* suffix
= context
.imageSuffix
; *suffix
!= NULL
; ++suffix
) {
653 char aSubLibNameAndSuffix
[strlen(*suffix
)+strlen(aSubLibName
)+1];
654 strcpy(aSubLibNameAndSuffix
, aSubLibName
);
655 strcat(aSubLibNameAndSuffix
, *suffix
);
656 if ( strcmp(aSubLibNameAndSuffix
, childLeafName
) == 0 )
663 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
668 if ( fHasSubUmbrella
) {
669 // need to match LC_SUB_UMBRELLA string against the leaf name of install location of child...
670 const char* childInstallPath
= child
->getInstallPath();
671 if ( childInstallPath
!= NULL
) {
672 const char* lastSlash
= strrchr(childInstallPath
, '/');
673 if ( lastSlash
!= NULL
) {
674 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
675 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
676 const struct load_command
* cmd
= cmds
;
677 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
679 case LC_SUB_UMBRELLA
:
681 const struct sub_umbrella_command
* um
= (struct sub_umbrella_command
*)cmd
;
682 const char* aSubUmbrellaName
= (char*)cmd
+ um
->sub_umbrella
.offset
;
683 if ( strcmp(aSubUmbrellaName
, &lastSlash
[1]) == 0 )
685 if ( context
.imageSuffix
!= NULL
) {
686 // when DYLD_IMAGE_SUFFIX is used, lastSlash string needs imageSuffix removed from end
687 for(const char* const* suffix
= context
.imageSuffix
; *suffix
!= NULL
; ++suffix
) {
688 char umbrellaAndSuffix
[strlen(*suffix
)+strlen(aSubUmbrellaName
)+1];
689 strcpy(umbrellaAndSuffix
, aSubUmbrellaName
);
690 strcat(umbrellaAndSuffix
, *suffix
);
691 if ( strcmp(umbrellaAndSuffix
, &lastSlash
[1]) == 0 )
698 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
707 uintptr_t ImageLoaderMachOClassic::getFirstWritableSegmentAddress()
709 // in split segment libraries r_address is offset from first writable segment
710 for(unsigned int i
=0; i
< fSegmentsCount
; ++i
) {
711 if ( segWriteable(i
) )
712 return segActualLoadAddress(i
);
714 throw "no writable segment";
// Returns the address that relocation r_address values are offsets from:
// either the first writable segment or segment 0.
// NOTE(review): three return statements are visible but the conditions
// (or preprocessor conditionals) that select between them are not - confirm
// against the original file.
717 uintptr_t ImageLoaderMachOClassic::getRelocBase()
719 // r_address is either an offset from the first segment address
720 // or from the first writable segment address
722 return getFirstWritableSegmentAddress();
725 return getFirstWritableSegmentAddress();
727 return segActualLoadAddress(0);
732 #if PREBOUND_IMAGE_SUPPORT
// Resets pre-bound lazy pointers.
//
// Scans the fDynamicInfo->nlocrel local relocation records starting at
// fLinkEditBase[fDynamicInfo->locreloff]. For scattered records of length
// RELOC_SIZE whose type is a pre-bound lazy pointer
// (GENERIC_RELOC_PB_LA_PTR / ARM_RELOC_PB_LA_PTR), the word at
// r_address + getRelocBase() is overwritten with r_value + fSlide.
// `context` is not referenced in the visible lines.
//
// NOTE(review): the conditionals that select between the two case labels and
// the closing lines of the switch are not visible in this view.
733 void ImageLoaderMachOClassic::resetPreboundLazyPointers(const LinkContext
& context
)
735 // loop through all local (internal) relocation records looking for pre-bound-lazy-pointer values
736 const uintptr_t relocBase
= this->getRelocBase();
737 const uintptr_t slide
= this->fSlide
;
738 const relocation_info
* const relocsStart
= (struct relocation_info
*)(&fLinkEditBase
[fDynamicInfo
->locreloff
]);
739 const relocation_info
* const relocsEnd
= &relocsStart
[fDynamicInfo
->nlocrel
];
740 for (const relocation_info
* reloc
=relocsStart
; reloc
< relocsEnd
; ++reloc
) {
741 if ( (reloc
->r_address
& R_SCATTERED
) != 0 ) {
742 const struct scattered_relocation_info
* sreloc
= (struct scattered_relocation_info
*)reloc
;
743 if (sreloc
->r_length
== RELOC_SIZE
) {
744 uintptr_t* locationToFix
= (uintptr_t*)(sreloc
->r_address
+ relocBase
);
745 switch(sreloc
->r_type
) {
747 case GENERIC_RELOC_PB_LA_PTR
:
748 *locationToFix
= sreloc
->r_value
+ slide
;
752 case ARM_RELOC_PB_LA_PTR
:
753 *locationToFix
= sreloc
->r_value
+ slide
;
// Applies this image's local (internal) relocations for the given slide.
//
// Visible steps:
//   - publish the image path via CRSetCrashLogMessage2() for the duration of
//     the call and clear it at the end
//   - prefetch LINKEDIT unless prefetching is disabled or the image is prebindable
//   - for each of the fDynamicInfo->nlocrel records starting at
//     fLinkEditBase[fDynamicInfo->locreloff], add `slide` to the pointer at
//     r_address + getRelocBase(), after checking that the location lies
//     inside the mapped image
//   - unsupported lengths/types are reported by throwing a C string; the
//     catch handler re-throws through dyld::throwf() with the image path and
//     the eight raw bytes of the offending record
//   - add the number of records to fgTotalRebaseFixups
//
// NOTE(review): two handling variants are visible (an x86_64-only one and a
// generic/scattered one). The conditionals selecting between them, the `try`,
// `else`, `break` and `default` lines, and the bodies of the *_PB_LA_PTR
// cases are not visible in this view.
766 void ImageLoaderMachOClassic::rebase(const LinkContext
& context
, uintptr_t slide
)
768 CRSetCrashLogMessage2(this->getPath());
769 const uintptr_t relocBase
= this->getRelocBase();
771 // prefetch any LINKEDIT pages needed
772 if ( !context
.preFetchDisabled
&& !this->isPrebindable())
773 this->prefetchLINKEDIT(context
);
775 // loop through all local (internal) relocation records
776 const relocation_info
* const relocsStart
= (struct relocation_info
*)(&fLinkEditBase
[fDynamicInfo
->locreloff
]);
777 const relocation_info
* const relocsEnd
= &relocsStart
[fDynamicInfo
->nlocrel
];
778 for (const relocation_info
* reloc
=relocsStart
; reloc
< relocsEnd
; ++reloc
) {
779 uintptr_t rebaseAddr
;
781 #if LINKEDIT_USAGE_DEBUG
782 noteAccessedLinkEditAddress(reloc
);
785 // only one kind of local relocation supported for x86_64
786 if ( reloc
->r_length
!= 3 )
787 throw "bad local relocation length";
788 if ( reloc
->r_type
!= X86_64_RELOC_UNSIGNED
)
789 throw "unknown local relocation type";
790 if ( reloc
->r_pcrel
!= 0 )
791 throw "bad local relocation pc_rel";
792 if ( reloc
->r_extern
!= 0 )
793 throw "extern relocation found with local relocations";
794 rebaseAddr
= reloc
->r_address
+ relocBase
;
795 if ( ! this->containsAddress((void*)rebaseAddr
) )
796 dyld::throwf("local reloc %p not in mapped image\n", (void*)rebaseAddr
);
797 *((uintptr_t*)rebaseAddr
) += slide
;
798 if ( context
.verboseRebase
)
799 dyld::log("dyld: rebase: %s:*0x%08lX += 0x%08lX\n", this->getShortName(), rebaseAddr
, slide
);
// generic variant: non-scattered records first, scattered records below
801 if ( (reloc
->r_address
& R_SCATTERED
) == 0 ) {
802 if ( reloc
->r_symbolnum
== R_ABS
) {
803 // ignore absolute relocations
805 else if (reloc
->r_length
== RELOC_SIZE
) {
806 switch(reloc
->r_type
) {
807 case GENERIC_RELOC_VANILLA
:
808 rebaseAddr
= reloc
->r_address
+ relocBase
;
809 if ( ! this->containsAddress((void*)rebaseAddr
) )
810 dyld::throwf("local reloc %p not in mapped image\n", (void*)rebaseAddr
);
811 *((uintptr_t*)rebaseAddr
) += slide
;
812 if ( context
.verboseRebase
)
813 dyld::log("dyld: rebase: %s:*0x%08lX += 0x%08lX\n", this->getShortName(), rebaseAddr
, slide
);
816 throw "unknown local relocation type";
820 throw "bad local relocation length";
824 const struct scattered_relocation_info
* sreloc
= (struct scattered_relocation_info
*)reloc
;
825 if (sreloc
->r_length
== RELOC_SIZE
) {
826 uintptr_t* locationToFix
= (uintptr_t*)(sreloc
->r_address
+ relocBase
);
827 switch(sreloc
->r_type
) {
828 case GENERIC_RELOC_VANILLA
:
829 if ( ! this->containsAddress((void*)locationToFix
) )
830 dyld::throwf("local scattered reloc %p not in mapped image\n", locationToFix
);
831 *locationToFix
+= slide
;
832 if ( context
.verboseRebase
)
833 dyld::log("dyld: rebase: %s:*0x%08lX += 0x%08lX\n", this->getShortName(), (uintptr_t)locationToFix
, slide
);
836 case GENERIC_RELOC_PB_LA_PTR
:
840 case ARM_RELOC_PB_LA_PTR
:
845 throw "unknown local scattered relocation type";
849 throw "bad local scattered relocation length";
// add the image path and the raw record bytes to the message before re-throwing
854 catch (const char* msg
) {
855 const uint8_t* r
= (uint8_t*)reloc
;
856 dyld::throwf("%s in %s. reloc record at %p: 0x%02X 0x%02X 0x%02X 0x%02X 0x%02X 0x%02X 0x%02X 0x%02X",
857 msg
, this->getPath(), reloc
, r
[0], r
[1], r
[2], r
[3], r
[4], r
[5], r
[6], r
[7]);
862 fgTotalRebaseFixups
+= fDynamicInfo
->nlocrel
;
863 CRSetCrashLogMessage2(NULL
);
868 const struct macho_nlist
* ImageLoaderMachOClassic::binarySearchWithToc(const char* key
, const char stringPool
[], const struct macho_nlist symbols
[],
869 const struct dylib_table_of_contents toc
[], uint32_t symbolCount
, uint32_t hintIndex
) const
871 int32_t high
= symbolCount
-1;
872 int32_t mid
= hintIndex
;
874 // handle out of range hint
875 if ( mid
>= (int32_t)symbolCount
)
877 ++ImageLoaderMachO::fgSymbolTableBinarySearchs
;
878 ++fgTotalBindImageSearches
;
880 //dyld::log("dyld: binarySearchWithToc for %s in %s\n", key, this->getShortName());
882 for (int32_t low
= 0; low
<= high
; mid
= (low
+high
)/2) {
883 const uint32_t index
= toc
[mid
].symbol_index
;
884 const struct macho_nlist
* pivot
= &symbols
[index
];
885 const char* pivotStr
= &stringPool
[pivot
->n_un
.n_strx
];
886 #if LINKEDIT_USAGE_DEBUG
887 noteAccessedLinkEditAddress(&toc
[mid
]);
888 noteAccessedLinkEditAddress(pivot
);
889 noteAccessedLinkEditAddress(pivotStr
);
891 int cmp
= strcmp(key
, pivotStr
);
// Binary search for 'key' directly over 'symbols' (no table of contents): each
// probe takes the middle entry of the remaining range starting at 'base' and
// strcmp()s 'key' against that entry's name in 'stringPool'. The remaining count
// 'n' is halved on every iteration.
// NOTE(review): the statements that act on 'cmp' and the final return are not
// visible in this excerpt.
906 const struct macho_nlist
* ImageLoaderMachOClassic::binarySearch(const char* key
, const char stringPool
[], const struct macho_nlist symbols
[], uint32_t symbolCount
) const
// bump the search statistics counters
909 ++fgTotalBindImageSearches
;
910 ++ImageLoaderMachO::fgSymbolTableBinarySearchs
;
912 //dyld::log("dyld: binarySearch for %s in %s, stringpool=%p, symbols=%p, symbolCount=%u\n",
913 // key, this->getShortName(), stringPool, symbols, symbolCount);
915 const struct macho_nlist
* base
= symbols
;
916 for (uint32_t n
= symbolCount
; n
> 0; n
/= 2) {
917 const struct macho_nlist
* pivot
= &base
[n
/2];
918 const char* pivotStr
= &stringPool
[pivot
->n_un
.n_strx
];
919 #if LINKEDIT_USAGE_DEBUG
920 noteAccessedLinkEditAddress(pivot
);
921 noteAccessedLinkEditAddress(pivotStr
);
923 int cmp
= strcmp(key
, pivotStr
);
928 // move base to symbol after pivot
// Looks up 'name' among this image's own exported symbols (no dependents).
// When the image has no table of contents (tocoff == 0) the externally defined
// range of the symbol table is searched with binarySearch(); the other visible
// call searches through the table of contents with binarySearchWithToc().
// If 'foundIn' is non-NULL it is set to this image. The result is the matching
// nlist entry cast to the opaque Symbol type.
// NOTE(review): the 'else' between the two searches and the not-found path are
// not visible in this excerpt.
941 const ImageLoader::Symbol
* ImageLoaderMachOClassic::findShallowExportedSymbol(const char* name
, const ImageLoader
** foundIn
) const
943 const struct macho_nlist
* sym
= NULL
;
944 if ( fDynamicInfo
->tocoff
== 0 )
945 sym
= binarySearch(name
, fStrings
, &fSymbolTable
[fDynamicInfo
->iextdefsym
], fDynamicInfo
->nextdefsym
);
947 sym
= binarySearchWithToc(name
, fStrings
, fSymbolTable
, (dylib_table_of_contents
*)&fLinkEditBase
[fDynamicInfo
->tocoff
],
948 fDynamicInfo
->ntoc
, fDynamicInfo
->nextdefsym
);
950 if ( foundIn
!= NULL
)
951 *foundIn
= (ImageLoader
*)this;
952 return (const Symbol
*)sym
;
959 bool ImageLoaderMachOClassic::containsSymbol(const void* addr
) const
961 return ( (fSymbolTable
<= addr
) && (addr
< fStrings
) );
// Computes the runtime address of an exported symbol: the nlist entry's n_value
// plus this image's slide. 'symbol' is an opaque handle that is cast back to a
// macho_nlist record. Symbols flagged N_ARM_THUMB_DEF get special handling.
// NOTE(review): the body of the thumb check and the return statement are not
// visible in this excerpt; 'context', 'requestor' and 'runResolver' are not used
// in the visible lines.
965 uintptr_t ImageLoaderMachOClassic::exportedSymbolAddress(const LinkContext
& context
, const Symbol
* symbol
, const ImageLoader
* requestor
, bool runResolver
) const
967 const struct macho_nlist
* sym
= (macho_nlist
*)symbol
;
968 uintptr_t result
= sym
->n_value
+ fSlide
;
970 // processor assumes code address with low bit set is thumb
971 if (sym
->n_desc
& N_ARM_THUMB_DEF
)
977 bool ImageLoaderMachOClassic::exportedSymbolIsWeakDefintion(const Symbol
* symbol
) const
979 const struct macho_nlist
* nlistSym
= (const struct macho_nlist
*)symbol
;
980 return ( (nlistSym
->n_desc
& N_WEAK_DEF
) != 0 );
983 const char* ImageLoaderMachOClassic::exportedSymbolName(const Symbol
* symbol
) const
985 const struct macho_nlist
* nlistSym
= (const struct macho_nlist
*)symbol
;
986 return &fStrings
[nlistSym
->n_un
.n_strx
];
989 unsigned int ImageLoaderMachOClassic::exportedSymbolCount() const
991 return fDynamicInfo
->nextdefsym
;
// Returns the 'index'-th externally defined symbol: the nlist entry at
// fSymbolTable[iextdefsym + index], cast to the opaque Symbol type. Only indexes
// below nextdefsym take this path.
// NOTE(review): the out-of-range return is not visible in this excerpt.
994 const ImageLoader::Symbol
* ImageLoaderMachOClassic::exportedSymbolIndexed(unsigned int index
) const
996 if ( index
< fDynamicInfo
->nextdefsym
) {
997 const struct macho_nlist
* sym
= &fSymbolTable
[fDynamicInfo
->iextdefsym
+ index
];
998 return (const ImageLoader::Symbol
*)sym
;
1003 unsigned int ImageLoaderMachOClassic::importedSymbolCount() const
1005 return fDynamicInfo
->nundefsym
;
// Returns the 'index'-th undefined (imported) symbol: the nlist entry at
// fSymbolTable[iundefsym + index], cast to the opaque Symbol type. Only indexes
// below nundefsym take this path.
// NOTE(review): the out-of-range return is not visible in this excerpt.
1008 const ImageLoader::Symbol
* ImageLoaderMachOClassic::importedSymbolIndexed(unsigned int index
) const
1010 if ( index
< fDynamicInfo
->nundefsym
) {
1011 const struct macho_nlist
* sym
= &fSymbolTable
[fDynamicInfo
->iundefsym
+ index
];
1012 return (const ImageLoader::Symbol
*)sym
;
1017 const char* ImageLoaderMachOClassic::importedSymbolName(const Symbol
* symbol
) const
1019 const struct macho_nlist
* nlistSym
= (const struct macho_nlist
*)symbol
;
1020 return &fStrings
[nlistSym
->n_un
.n_strx
];
// Tests whether 'symbol' is a weak definition: its type is N_SECT (defined in a
// section) and N_WEAK_DEF is set in n_desc.
// NOTE(review): the return statements are not visible in this excerpt.
1025 bool ImageLoaderMachOClassic::symbolIsWeakDefinition(const struct macho_nlist
* symbol
)
1027 // if a define and weak ==> coalesced
1028 if ( ((symbol
->n_type
& N_TYPE
) == N_SECT
) && ((symbol
->n_desc
& N_WEAK_DEF
) != 0) )
// Tests whether 'symbol' is a reference to a weak symbol: its type is not N_SECT
// (i.e. it is not defined in a section of this image) and N_REF_TO_WEAK is set
// in n_desc.
// NOTE(review): the return statements are not visible in this excerpt.
1035 bool ImageLoaderMachOClassic::symbolIsWeakReference(const struct macho_nlist
* symbol
)
1037 // if not a definition and flagged as referencing a weak symbol ==> coalesced
1038 if ( ((symbol
->n_type
& N_TYPE
) != N_SECT
) && ((symbol
->n_desc
& N_REF_TO_WEAK
) != 0) )
1045 uintptr_t ImageLoaderMachOClassic::getSymbolAddress(const macho_nlist
* sym
, const LinkContext
& context
, bool runResolver
) const
1047 return ImageLoaderMachO::getSymbolAddress((Symbol
*)sym
, this, context
, runResolver
);
// Resolves one undefined symbol of this image to an address and reports the
// supplying image through '*foundIn'.
//
// Visible lookup paths:
//  - flat (context.bindFlat or !twoLevel): private-extern N_SECT symbols resolve
//    within this image; otherwise context.flatExportFinder() is consulted, then,
//    for a bundle with hidden exports, this image's own exports; failure ends in
//    throwSymbolNotFound(..., "flat namespace") unless the reference is N_WEAK_REF.
//  - coalesced: when not prebinding, 'dontCoalesce' is false and the symbol is a
//    weak reference or weak definition, context.coalescedExportFinder() is tried.
//  - two-level: the library ordinal from n_desc selects the main executable, this
//    image, a flat "dynamic lookup", or libImage(ord-1); the target is then asked
//    via findExportedSymbolAddress().
// NOTE(review): many statements (declarations of 'sym'/'address', several returns,
// else branches) are not visible in this excerpt; the summary above covers only
// what the visible lines show.
1050 uintptr_t ImageLoaderMachOClassic::resolveUndefined(const LinkContext
& context
, const struct macho_nlist
* undefinedSymbol
,
1051 bool twoLevel
, bool dontCoalesce
, bool runResolver
, const ImageLoader
** foundIn
)
1053 ++fgTotalBindSymbolsResolved
;
1054 const char* symbolName
= &fStrings
[undefinedSymbol
->n_un
.n_strx
];
1056 #if LINKEDIT_USAGE_DEBUG
1057 noteAccessedLinkEditAddress(undefinedSymbol
);
1058 noteAccessedLinkEditAddress(symbolName
);
// ---- flat namespace lookup ----
1060 if ( context
.bindFlat
|| !twoLevel
) {
1062 if ( ((undefinedSymbol
->n_type
& N_PEXT
) != 0) && ((undefinedSymbol
->n_type
& N_TYPE
) == N_SECT
) ) {
1063 // is a multi-module private_extern internal reference that the linker did not optimize away
1064 uintptr_t addr
= this->getSymbolAddress(undefinedSymbol
, context
, false);
1069 if ( context
.flatExportFinder(symbolName
, &sym
, foundIn
) ) {
1070 if ( *foundIn
!= this )
1071 context
.addDynamicReference(this, const_cast<ImageLoader
*>(*foundIn
));
1072 return (*foundIn
)->getExportedSymbolAddress(sym
, context
, this);
1074 // if a bundle is loaded privately the above will not find its exports
1075 if ( this->isBundle() && this->hasHiddenExports() ) {
1076 // look in self for needed symbol
1077 sym
= this->findShallowExportedSymbol(symbolName
, foundIn
);
1079 return (*foundIn
)->getExportedSymbolAddress(sym
, context
, this);
1081 if ( (undefinedSymbol
->n_desc
& N_WEAK_REF
) != 0 ) {
1082 // definition can't be found anywhere
1083 // if reference is weak_import, then it is ok, just return 0
1086 throwSymbolNotFound(context
, symbolName
, this->getPath(), "", "flat namespace");
// ---- coalesced (weak) lookup, then two-level lookup ----
1089 // symbol requires searching images with coalesced symbols (not done during prebinding)
1090 if ( !context
.prebinding
&& !dontCoalesce
&& (symbolIsWeakReference(undefinedSymbol
) || symbolIsWeakDefinition(undefinedSymbol
)) ) {
1092 if ( context
.coalescedExportFinder(symbolName
, &sym
, foundIn
, nullptr) ) {
1093 if ( *foundIn
!= this )
1094 context
.addDynamicReference(this, const_cast<ImageLoader
*>(*foundIn
));
1095 return (*foundIn
)->getExportedSymbolAddress(sym
, context
, this);
1097 //throwSymbolNotFound(context, symbolName, this->getPath(), "coalesced namespace");
1098 //dyld::log("dyld: coalesced symbol %s not found in any coalesced image, falling back to two-level lookup", symbolName);
1101 // if this is a real definition (not an undefined symbol) there is no ordinal
1102 if ( (undefinedSymbol
->n_type
& N_TYPE
) == N_SECT
) {
1103 // static linker should never generate this case, but if it does, do something sane
1104 uintptr_t addr
= this->getSymbolAddress(undefinedSymbol
, context
, false);
// pick the image to search from the two-level library ordinal stored in n_desc
1110 ImageLoader
* target
= NULL
;
1111 uint8_t ord
= GET_LIBRARY_ORDINAL(undefinedSymbol
->n_desc
);
1112 if ( ord
== EXECUTABLE_ORDINAL
) {
1113 target
= context
.mainExecutable
;
1115 else if ( ord
== SELF_LIBRARY_ORDINAL
) {
1118 else if ( ord
== DYNAMIC_LOOKUP_ORDINAL
) {
1119 // rnielsen: HACKHACK
1122 if ( context
.flatExportFinder(symbolName
, &sym
, foundIn
) )
1123 return (*foundIn
)->getExportedSymbolAddress(sym
, context
, this);
1124 // no image exports this symbol
1126 context
.undefinedHandler(symbolName
);
1127 // try looking again
1128 if ( context
.flatExportFinder(symbolName
, &sym
, foundIn
) )
1129 return (*foundIn
)->getExportedSymbolAddress(sym
, context
, this);
1131 throwSymbolNotFound(context
, symbolName
, this->getPath(), "", "dynamic lookup");
1133 else if ( ord
<= libraryCount() ) {
1134 target
= libImage(ord
-1);
1135 if ( target
== NULL
) {
1136 // if target library not loaded and reference is weak or library is weak return 0
1141 dyld::throwf("bad mach-o binary, library ordinal (%u) too big (max %u) for symbol %s in %s",
1142 ord
, libraryCount(), symbolName
, this->getPath());
1145 if ( target
== NULL
) {
1146 //dyld::log("resolveUndefined(%s) in %s\n", symbolName, this->getPath());
1147 throw "symbol not found";
1151 if ( target
->findExportedSymbolAddress(context
, symbolName
, this, ord
, runResolver
, foundIn
, &address
) )
1154 if ( (undefinedSymbol
->n_type
& N_PEXT
) != 0 ) {
1155 // don't know why the static linker did not eliminate the internal reference to a private extern definition
1157 return this->getSymbolAddress(undefinedSymbol
, context
, false);
1159 else if ( (undefinedSymbol
->n_desc
& N_WEAK_REF
) != 0 ) {
1160 // if definition not found and reference is weak return 0
1164 // nowhere to be found
1165 throwSymbolNotFound(context
, symbolName
, this->getPath(), "", target
->getPath());
// Walks the load commands, counting sections (1-based) across segment commands
// until the segment holding 'sectionIndex' is found, then range-checks 'addr'
// against that section's [addr, addr+size).
// NOTE(review): the result when no segment contains 'sectionIndex' is not visible
// in this excerpt.
1171 // returns if 'addr' is within the address range of section 'sectionIndex'
1172 // fSlide is not used. 'addr' is assumed to be a prebound address in this image
1173 bool ImageLoaderMachOClassic::isAddrInSection(uintptr_t addr
, uint8_t sectionIndex
)
1175 uint8_t currentSectionIndex
= 1;
1176 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
1177 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
1178 const struct load_command
* cmd
= cmds
;
1179 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
1180 if ( cmd
->cmd
== LC_SEGMENT_COMMAND
) {
1181 const struct macho_segment_command
* seg
= (struct macho_segment_command
*)cmd
;
1182 if ( (currentSectionIndex
<= sectionIndex
) && (sectionIndex
< currentSectionIndex
+seg
->nsects
) ) {
1183 // 'sectionIndex' is in this segment, get section info
// the section records start right after the segment command header
1184 const struct macho_section
* const sectionsStart
= (struct macho_section
*)((char*)seg
+ sizeof(struct macho_segment_command
));
// NOTE(review): '§ionsStart' below looks like a mis-encoded '&sectionsStart' - confirm against the pristine source
1185 const struct macho_section
* const section
= §ionsStart
[sectionIndex
-currentSectionIndex
];
1186 return ( (section
->addr
<= addr
) && (addr
< section
->addr
+section
->size
) );
1189 // 'sectionIndex' not in this segment, skip to next segment
1190 currentSectionIndex
+= seg
->nsects
;
// advance to the next load command
1193 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
// Binds every external relocation record of this image.
// For each record of pointer size (r_length == RELOC_SIZE) the visible code:
//  - locates the fixup at r_address + relocBase and rejects locations outside
//    the mapped image,
//  - recovers the addend by subtracting the symbol's prebound n_value from the
//    current contents (with special cases for weak and thumb definitions),
//  - resolves the symbol with resolveUndefined(), reusing the previous result
//    when consecutive records name the same symbol,
//  - adds the resolved address to the addend and counts the fixup in
//    fgTotalBindFixups.
// Unknown relocation types or lengths throw a C-string message.
// NOTE(review): several statements (case labels, stores to *location, else
// branches) are not visible in this excerpt.
1199 void ImageLoaderMachOClassic::doBindExternalRelocations(const LinkContext
& context
)
1201 const uintptr_t relocBase
= this->getRelocBase();
1202 const bool twoLevel
= this->usesTwoLevelNameSpace();
1203 const bool prebound
= this->isPrebindable();
1205 #if TEXT_RELOC_SUPPORT
1206 // if there are __TEXT fixups, temporarily make __TEXT writable
1207 if ( fTextSegmentBinds
)
1208 this->makeTextSegmentWritable(context
, true);
1210 // cache last lookup
1211 const struct macho_nlist
* lastUndefinedSymbol
= NULL
;
1212 uintptr_t symbolAddr
= 0;
1213 const ImageLoader
* image
= NULL
;
1215 // loop through all external relocation records and bind each
1216 const relocation_info
* const relocsStart
= (struct relocation_info
*)(&fLinkEditBase
[fDynamicInfo
->extreloff
]);
1217 const relocation_info
* const relocsEnd
= &relocsStart
[fDynamicInfo
->nextrel
];
1218 for (const relocation_info
* reloc
=relocsStart
; reloc
< relocsEnd
; ++reloc
) {
1219 if (reloc
->r_length
== RELOC_SIZE
) {
1220 switch(reloc
->r_type
) {
1223 const struct macho_nlist
* undefinedSymbol
= &fSymbolTable
[reloc
->r_symbolnum
];
1224 uintptr_t* location
= ((uintptr_t*)(reloc
->r_address
+ relocBase
));
1225 if ( ! this->containsAddress((void*)location
) )
1226 dyld::throwf("external reloc %p not in mapped image %s\n", (void*)location
, this->getPath());
1227 uintptr_t value
= *location
;
1228 bool symbolAddrCached
= true;
1230 if ( reloc
->r_pcrel
) {
1231 value
+= (uintptr_t)location
+ 4 - fSlide
;
1235 // we are doing relocations, so prebinding was not usable
1236 // in a prebound executable, the n_value field of an undefined symbol is set to the address where the symbol was found when prebound
1237 // so, subtracting that gives the initial displacement which we need to add to the newly found symbol address
1238 // if mach-o relocation structs had an "addend" field this complication would not be necessary.
1239 if ( ((undefinedSymbol
->n_type
& N_TYPE
) == N_SECT
) && ((undefinedSymbol
->n_desc
& N_WEAK_DEF
) != 0) ) {
1240 // weak symbols need special casing, since *location may have been prebound to a definition in another image.
1241 // If *location is currently prebound to somewhere in the same section as the weak definition, we assume
1242 // that we can subtract off the weak symbol address to get the addend.
1243 // If prebound elsewhere, we've lost the addend and have to assume it is zero.
1244 // The prebinding to elsewhere only happens with 10.4+ update_prebinding which only operates on a small set of Apple dylibs
1245 if ( (value
== undefinedSymbol
->n_value
) || this->isAddrInSection(value
, undefinedSymbol
->n_sect
) ) {
1246 value
-= undefinedSymbol
->n_value
;
1248 // if weak and thumb subtract off extra thumb bit
1249 if ( (undefinedSymbol
->n_desc
& N_ARM_THUMB_DEF
) != 0 )
1257 else if ( ((undefinedSymbol
->n_type
& N_TYPE
) == N_SECT
) && ((undefinedSymbol
->n_desc
& N_ARM_THUMB_DEF
) != 0) ) {
1258 // it was prebound to a defined symbol for thumb code in the same linkage unit
1259 // we need to subtract off one to get real addend
1260 value
-= (undefinedSymbol
->n_value
+1);
1264 // is undefined or non-weak symbol, so do subtraction to get addend
1265 value
-= undefinedSymbol
->n_value
;
1268 // if undefinedSymbol is same as last time, then symbolAddr and image will resolve to the same too
1269 if ( undefinedSymbol
!= lastUndefinedSymbol
) {
1270 bool dontCoalesce
= true;
1271 if ( symbolIsWeakReference(undefinedSymbol
) ) {
1272 // when weakbind() is run on a classic mach-o encoding, it won't try
1273 // to coalesce N_REF_TO_WEAK symbols because they are not in the sorted
1274 // range of global symbols. To handle that case we do the coalescing now.
1275 dontCoalesce
= false;
1277 symbolAddr
= this->resolveUndefined(context
, undefinedSymbol
, twoLevel
, dontCoalesce
, false, &image
);
1278 lastUndefinedSymbol
= undefinedSymbol
;
1279 symbolAddrCached
= false;
1281 if ( context
.verboseBind
) {
1282 const char *path
= NULL
;
1283 if ( image
!= NULL
) {
1284 path
= image
->getShortName();
1286 const char* cachedString
= "(cached)";
1287 if ( !symbolAddrCached
)
1290 dyld::log("dyld: bind: %s:0x%08lX = %s:%s, *0x%08lX = 0x%08lX%s\n",
1291 this->getShortName(), (uintptr_t)location
,
1292 path
, &fStrings
[undefinedSymbol
->n_un
.n_strx
], (uintptr_t)location
, symbolAddr
, cachedString
);
1295 dyld::log("dyld: bind: %s:0x%08lX = %s:%s, *0x%08lX = 0x%08lX%s + %ld\n",
1296 this->getShortName(), (uintptr_t)location
,
1297 path
, &fStrings
[undefinedSymbol
->n_un
.n_strx
], (uintptr_t)location
, symbolAddr
, cachedString
, value
);
// final value = recovered addend + resolved symbol address
1300 value
+= symbolAddr
;
1302 if ( reloc
->r_pcrel
) {
1303 *location
= value
- ((uintptr_t)location
+ 4);
1306 // don't dirty page if prebound value was correct
1307 if ( !prebound
|| (*location
!= value
) )
1311 // don't dirty page if prebound value was correct
1312 if ( !prebound
|| (*location
!= value
) )
1316 ++fgTotalBindFixups
;
1320 throw "unknown external relocation type";
1324 throw "bad external relocation length";
1328 #if TEXT_RELOC_SUPPORT
1329 // if there were __TEXT fixups, restore write protection
// NOTE(review): this call passes 'true', exactly like the earlier call that makes
// __TEXT writable; restoring protection presumably needs 'false' - confirm against
// makeTextSegmentWritable()'s contract before changing.
1330 if ( fTextSegmentBinds
) {
1331 this->makeTextSegmentWritable(context
, true);
// Writes a resolved address into one indirect symbol slot.
//  - With context.verboseBind set, logs the binding (the target path is shown as
//    "<weak_import-not-found>" when 'targetImage' is NULL).
//  - If context.bindingHandler is installed, it is called and its result replaces
//    'targetAddr'.
//  - For i386 5-byte self-modifying stub sections the entry is rewritten as a
//    "JMP rel32" using an 8-byte compare-and-swap; the visible plain store
//    '*ptrToBind = targetAddr' presumably covers every other section type.
// NOTE(review): the retry loop around the compare-and-swap, the declarations of
// 'newEntry'/'pad'/'done', and the return statement are not visible in this
// excerpt.
1338 uintptr_t ImageLoaderMachOClassic::bindIndirectSymbol(uintptr_t* ptrToBind
, const struct macho_section
* sect
, const char* symbolName
, uintptr_t targetAddr
, const ImageLoader
* targetImage
, const LinkContext
& context
)
1340 if ( context
.verboseBind
) {
1341 const char* path
= NULL
;
1342 if ( targetImage
!= NULL
)
1343 path
= targetImage
->getShortName();
1344 dyld::log("dyld: bind indirect sym: %s:%s$%s = %s:%s, *0x%08lx = 0x%08lx\n",
1345 this->getShortName(), symbolName
, (((sect
->flags
& SECTION_TYPE
)==S_NON_LAZY_SYMBOL_POINTERS
) ? "non_lazy_ptr" : "lazy_ptr"),
1346 ((path
!= NULL
) ? path
: "<weak_import-not-found>"), symbolName
, (uintptr_t)ptrToBind
, targetAddr
);
// give an installed binding handler the chance to substitute the target address
1348 if ( context
.bindingHandler
!= NULL
) {
1349 const char* path
= NULL
;
1350 if ( targetImage
!= NULL
)
1351 path
= targetImage
->getShortName();
1352 targetAddr
= (uintptr_t)context
.bindingHandler(path
, symbolName
, (void *)targetAddr
);
1355 // i386 has special self-modifying stubs that change from "CALL rel32" to "JMP rel32"
1356 if ( ((sect
->flags
& SECTION_TYPE
) == S_SYMBOL_STUBS
) && ((sect
->flags
& S_ATTR_SELF_MODIFYING_CODE
) != 0) && (sect
->reserved2
== 5) ) {
// rel32 is relative to the end of the 5-byte instruction
1357 uint32_t rel32
= targetAddr
- (((uint32_t)ptrToBind
)+5);
1358 // re-write instruction in a thread-safe manner
1359 // use 8-byte compare-and-swap to alter 5-byte jump table entries
1360 // loop is required in case the extra three bytes that cover the next entry are altered by another thread
1363 volatile int64_t* jumpPtr
= (int64_t*)ptrToBind
;
1365 // By default the three extra bytes swapped follow the 5-byte JMP.
1366 // But, if the 5-byte jump is up against the end of the __IMPORT segment
1367 // We don't want to access bytes off the end of the segment, so we shift
1368 // the extra bytes to precede the 5-byte JMP.
1369 if ( (((uint32_t)ptrToBind
+ 8) & 0x00000FFC) == 0x00000000 ) {
1370 jumpPtr
= (int64_t*)((uint32_t)ptrToBind
- 3);
1373 int64_t oldEntry
= *jumpPtr
;
// build the replacement entry: opcode 0xE9 followed by rel32 in little-endian byte order
1378 newEntry
.int64
= oldEntry
;
1379 newEntry
.bytes
[pad
+0] = 0xE9; // JMP rel32
1380 newEntry
.bytes
[pad
+1] = rel32
& 0xFF;
1381 newEntry
.bytes
[pad
+2] = (rel32
>> 8) & 0xFF;
1382 newEntry
.bytes
[pad
+3] = (rel32
>> 16) & 0xFF;
1383 newEntry
.bytes
[pad
+4] = (rel32
>> 24) & 0xFF;
1384 done
= OSAtomicCompareAndSwap64Barrier(oldEntry
, newEntry
.int64
, (int64_t*)jumpPtr
);
1389 *ptrToBind
= targetAddr
;
1393 uintptr_t ImageLoaderMachOClassic::doBindFastLazySymbol(uint32_t lazyBindingInfoOffset
, const LinkContext
& context
, void (*lock
)(), void (*unlock
)())
1395 throw "compressed LINKEDIT lazy binder called with classic LINKEDIT";
// Binds the lazy pointer (or i386 fast stub) at 'lazyPointer'.
// Scans every section of every segment command for one that contains the
// pointer: either an S_LAZY_SYMBOL_POINTERS section, or a 5-byte self-modifying
// S_SYMBOL_STUBS section (where the incoming pointer is first backed up by 5
// bytes). The matching slot's entry in the indirect symbol table gives the symbol
// index, which is resolved with resolveUndefined() and stored through
// bindIndirectSymbol(); fgTotalLazyBindFixups is incremented.
// The trailing dyld::throwf reports a lazy pointer that was not found.
// NOTE(review): the switch header, the return of the bound address and several
// closing lines are not visible in this excerpt.
1398 uintptr_t ImageLoaderMachOClassic::doBindLazySymbol(uintptr_t* lazyPointer
, const LinkContext
& context
)
1400 // scan for all lazy-pointer sections
1401 const bool twoLevel
= this->usesTwoLevelNameSpace();
1402 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
1403 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
1404 const struct load_command
* cmd
= cmds
;
1405 const uint32_t* const indirectTable
= (uint32_t*)&fLinkEditBase
[fDynamicInfo
->indirectsymoff
];
1406 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
1408 case LC_SEGMENT_COMMAND
:
1410 const struct macho_segment_command
* seg
= (struct macho_segment_command
*)cmd
;
1411 const struct macho_section
* const sectionsStart
= (struct macho_section
*)((char*)seg
+ sizeof(struct macho_segment_command
));
// NOTE(review): '§ionsStart' below looks like a mis-encoded '&sectionsStart' - confirm against the pristine source
1412 const struct macho_section
* const sectionsEnd
= §ionsStart
[seg
->nsects
];
1413 for (const struct macho_section
* sect
=sectionsStart
; sect
< sectionsEnd
; ++sect
) {
1414 const uint8_t type
= sect
->flags
& SECTION_TYPE
;
// stays INDIRECT_SYMBOL_LOCAL unless this section turns out to contain lazyPointer
1415 uint32_t symbolIndex
= INDIRECT_SYMBOL_LOCAL
;
1416 if ( type
== S_LAZY_SYMBOL_POINTERS
) {
1417 const size_t pointerCount
= sect
->size
/ sizeof(uintptr_t);
1418 uintptr_t* const symbolPointers
= (uintptr_t*)(sect
->addr
+ fSlide
);
1419 if ( (lazyPointer
>= symbolPointers
) && (lazyPointer
< &symbolPointers
[pointerCount
]) ) {
1420 const uint32_t indirectTableOffset
= sect
->reserved1
;
1421 const size_t lazyIndex
= lazyPointer
- symbolPointers
;
1422 symbolIndex
= indirectTable
[indirectTableOffset
+ lazyIndex
];
1426 else if ( (type
== S_SYMBOL_STUBS
) && (sect
->flags
& S_ATTR_SELF_MODIFYING_CODE
) && (sect
->reserved2
== 5) ) {
1427 // 5 bytes stubs on i386 are new "fast stubs"
1428 uint8_t* const jmpTableBase
= (uint8_t*)(sect
->addr
+ fSlide
);
1429 uint8_t* const jmpTableEnd
= jmpTableBase
+ sect
->size
;
1430 // initial CALL instruction in jump table leaves pointer to next entry, so back up
1431 uint8_t* const jmpTableEntryToPatch
= ((uint8_t*)lazyPointer
) - 5;
1432 lazyPointer
= (uintptr_t*)jmpTableEntryToPatch
;
1433 if ( (jmpTableEntryToPatch
>= jmpTableBase
) && (jmpTableEntryToPatch
< jmpTableEnd
) ) {
1434 const uint32_t indirectTableOffset
= sect
->reserved1
;
1435 const uint32_t entryIndex
= (jmpTableEntryToPatch
- jmpTableBase
)/5;
1436 symbolIndex
= indirectTable
[indirectTableOffset
+ entryIndex
];
// a real symbol index was found: resolve it and patch the slot
1440 if ( symbolIndex
!= INDIRECT_SYMBOL_ABS
&& symbolIndex
!= INDIRECT_SYMBOL_LOCAL
) {
1441 const char* symbolName
= &fStrings
[fSymbolTable
[symbolIndex
].n_un
.n_strx
];
1442 const ImageLoader
* image
= NULL
;
1443 uintptr_t symbolAddr
= this->resolveUndefined(context
, &fSymbolTable
[symbolIndex
], twoLevel
, false, true, &image
);
1444 symbolAddr
= this->bindIndirectSymbol(lazyPointer
, sect
, symbolName
, symbolAddr
, image
, context
);
1445 ++fgTotalLazyBindFixups
;
// advance to the next load command
1452 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
1454 dyld::throwf("lazy pointer not found at address %p in image %s", lazyPointer
, this->getPath());
// Prepares 'it' for walking this image's exported symbols during weak-symbol
// coalescing: the name starts as " ", the flags are cleared, 'loadOrder' is
// recorded, and endIndex is the table-of-contents entry count (ntoc) when a
// table of contents exists; the other visible assignment uses nextdefsym.
// The third (unnamed) parameter is unused.
// NOTE(review): other field initialisations (e.g. the current index) are not
// visible in this excerpt.
1459 void ImageLoaderMachOClassic::initializeCoalIterator(CoalIterator
& it
, unsigned int loadOrder
, unsigned)
1462 it
.symbolName
= " ";
1463 it
.loadOrder
= loadOrder
;
1464 it
.weakSymbol
= false;
1465 it
.symbolMatches
= false;
1468 if ( fDynamicInfo
->tocoff
!= 0 ) {
1470 it
.endIndex
= fDynamicInfo
->ntoc
;
1474 it
.endIndex
= fDynamicInfo
->nextdefsym
;
// Loads the symbol at the iterator's current index into 'it'.
// Two symmetrical paths exist: one via the table of contents (tocoff != 0,
// bounded by ntoc) and one directly over the externally defined symbols (bounded
// by nextdefsym). When the index has reached the bound, the name is set to the
// sentinel "~~~"; otherwise the name, the N_WEAK_DEF flag, a cleared
// symbolMatches and a cleared 'type' are stored.
// NOTE(review): the index increment and the return values are not visible in
// this excerpt.
1479 bool ImageLoaderMachOClassic::incrementCoalIterator(CoalIterator
& it
)
// ---- path 1: image has a table of contents ----
1484 if ( fDynamicInfo
->tocoff
!= 0 ) {
1485 if ( it
.curIndex
>= fDynamicInfo
->ntoc
) {
1487 it
.symbolName
= "~~~";
1491 const dylib_table_of_contents
* toc
= (dylib_table_of_contents
*)&fLinkEditBase
[fDynamicInfo
->tocoff
];
1492 const uint32_t index
= toc
[it
.curIndex
].symbol_index
;
1493 const struct macho_nlist
* sym
= &fSymbolTable
[index
];
1494 const char* symStr
= &fStrings
[sym
->n_un
.n_strx
];
1495 it
.symbolName
= symStr
;
1496 it
.weakSymbol
= (sym
->n_desc
& N_WEAK_DEF
);
1497 it
.symbolMatches
= false;
1498 it
.type
= 0; // clear flag that says we applied updates for this symbol
1499 //dyld::log("incrementCoalIterator() curIndex=%ld, symbolName=%s in %s\n", it.curIndex, symStr, this->getPath());
// ---- path 2: no table of contents, index the exported symbols directly ----
1505 if ( it
.curIndex
>= fDynamicInfo
->nextdefsym
) {
1507 it
.symbolName
= "~~~";
1511 const struct macho_nlist
* sym
= &fSymbolTable
[fDynamicInfo
->iextdefsym
+it
.curIndex
];
1512 const char* symStr
= &fStrings
[sym
->n_un
.n_strx
];
1513 it
.symbolName
= symStr
;
1514 it
.weakSymbol
= (sym
->n_desc
& N_WEAK_DEF
);
1515 it
.symbolMatches
= false;
1516 it
.type
= 0; // clear flag that says we applied updates for this symbol
1517 //dyld::log("incrementCoalIterator() curIndex=%ld, symbolName=%s in %s\n", it.curIndex, symStr, this->getPath());
// Returns the runtime address (n_value + fSlide) of the symbol at the iterator's
// previous position (curIndex-1), found either through the table of contents or
// directly in the externally defined symbol range. For N_ARM_THUMB_DEF symbols
// the low bit is set before the slide is added. 'context' is not used in the
// visible lines.
// NOTE(review): the preprocessor conditionals selecting between the return
// statements are not visible in this excerpt.
1526 uintptr_t ImageLoaderMachOClassic::getAddressCoalIterator(CoalIterator
& it
, const LinkContext
& context
)
1528 uint32_t symbol_index
= 0;
1529 if ( fDynamicInfo
->tocoff
!= 0 ) {
1530 const dylib_table_of_contents
* toc
= (dylib_table_of_contents
*)&fLinkEditBase
[fDynamicInfo
->tocoff
];
1531 symbol_index
= toc
[it
.curIndex
-1].symbol_index
;
1534 symbol_index
= fDynamicInfo
->iextdefsym
+ (uint32_t)it
.curIndex
- 1;
1536 const struct macho_nlist
* sym
= &fSymbolTable
[symbol_index
];
1537 //dyld::log("getAddressCoalIterator() => 0x%llX, %s symbol_index=%d, in %s\n", (uint64_t)(sym->n_value + fSlide), &fStrings[sym->n_un.n_strx], symbol_index, this->getPath());
1539 // processor assumes code address with low bit set is thumb
1540 if (sym
->n_desc
& N_ARM_THUMB_DEF
)
1541 return (sym
->n_value
| 1) + fSlide
;
1543 return sym
->n_value
+ fSlide
;
1545 return sym
->n_value
+ fSlide
;
// Re-points every use in this image of the symbol at the iterator's previous
// position (curIndex-1) to 'value', the address chosen by weak coalescing.
// Visible steps:
//  1. Guards on usesTwoLevelNameSpace() and on getState() vs
//     dyld_image_state_bound, and a check that the symbol is a weak reference or
//     weak definition.
//  2. External relocations naming the symbol: the addend is recovered from the
//     current contents of the fixup location and the location is rewritten via
//     bindLocation() (BIND_TYPE_POINTER, or BIND_TYPE_TEXT_PCREL32 for pc-relative).
//  3. Indirect symbol table entries naming the symbol in pointer/stub sections
//     are rewritten via bindIndirectSymbol().
//  4. If anything was bound and 'targetImage' is another image, a dynamic
//     reference is recorded with context.addDynamicReference().
// 'targetIndex' is not used in the visible lines.
// NOTE(review): the early returns, the prebound/non-prebound branch heads and
// the final "already bound" marking are not visible in this excerpt.
1550 void ImageLoaderMachOClassic::updateUsesCoalIterator(CoalIterator
& it
, uintptr_t value
, ImageLoader
* targetImage
, unsigned targetIndex
, const LinkContext
& context
)
1552 // flat_namespace images with classic LINKEDIT do not need late coalescing.
1553 // They still need to be iterated because they may implement
1554 // something needed by other coalescing images.
1555 // But they need no updating because during the bind phase every symbol lookup is a full scan.
1556 if ( !this->usesTwoLevelNameSpace() )
1559 // <rdar://problem/6570879> weak binding done too early with inserted libraries
1560 if ( this->getState() < dyld_image_state_bound
)
1563 uint32_t symbol_index
= 0;
1564 if ( fDynamicInfo
->tocoff
!= 0 ) {
1565 const dylib_table_of_contents
* toc
= (dylib_table_of_contents
*)&fLinkEditBase
[fDynamicInfo
->tocoff
];
1566 symbol_index
= toc
[it
.curIndex
-1].symbol_index
;
1569 symbol_index
= fDynamicInfo
->iextdefsym
+ (uint32_t)it
.curIndex
- 1;
1572 // if this image's copy of the symbol is not a weak definition nor a weak reference then nothing to coalesce here
1573 if ( !symbolIsWeakReference(&fSymbolTable
[symbol_index
]) && !symbolIsWeakDefinition(&fSymbolTable
[symbol_index
]) ) {
1577 // <rdar://problem/6555720> malformed dylib with duplicate weak symbols causes re-binding
1581 bool boundSomething
= false;
1582 // scan external relocations for uses of symbol_index
1583 const uintptr_t relocBase
= this->getRelocBase();
1584 const bool prebound
= this->isPrebindable();
1585 const relocation_info
* const relocsStart
= (struct relocation_info
*)(&fLinkEditBase
[fDynamicInfo
->extreloff
]);
1586 const relocation_info
* const relocsEnd
= &relocsStart
[fDynamicInfo
->nextrel
];
1587 for (const relocation_info
* reloc
=relocsStart
; reloc
< relocsEnd
; ++reloc
) {
1588 if ( reloc
->r_symbolnum
== symbol_index
) {
1589 //dyld::log("found external reloc using symbol_index=%d in %s\n",symbol_index, this->getPath());
1590 const struct macho_nlist
* undefinedSymbol
= &fSymbolTable
[reloc
->r_symbolnum
];
1591 const char* symbolName
= &fStrings
[undefinedSymbol
->n_un
.n_strx
];
1592 uintptr_t* location
= ((uintptr_t*)(reloc
->r_address
+ relocBase
));
1593 const uintptr_t initialValue
= *location
;
1594 uintptr_t addend
= 0;
1596 // we are doing relocations, so prebinding was not usable
1597 // in a prebound executable, the n_value field of an undefined symbol is set to the address where the symbol was found when prebound
1598 // so, subtracting that gives the initial displacement which we need to add to the newly found symbol address
1599 // if mach-o relocation structs had an "addend" field this complication would not be necessary.
1600 if ( ((undefinedSymbol
->n_type
& N_TYPE
) == N_SECT
) && ((undefinedSymbol
->n_desc
& N_WEAK_DEF
) != 0) ) {
1601 // weak symbols need special casing, since *location may have been prebound to a definition in another image.
1602 // If *location is currently prebound to somewhere in the same section as the weak definition, we assume
1603 // that we can subtract off the weak symbol address to get the addend.
1604 // If prebound elsewhere, we've lost the addend and have to assume it is zero.
1605 // The prebinding to elsewhere only happens with 10.4+ update_prebinding which only operates on a small set of Apple dylibs
1606 if ( (initialValue
== undefinedSymbol
->n_value
) || this->isAddrInSection(initialValue
, undefinedSymbol
->n_sect
) ) {
1607 addend
= initialValue
- undefinedSymbol
->n_value
;
1609 // if weak and thumb subtract off extra thumb bit
1610 if ( (undefinedSymbol
->n_desc
& N_ARM_THUMB_DEF
) != 0 )
1616 else if ( ((undefinedSymbol
->n_type
& N_TYPE
) == N_SECT
) && ((undefinedSymbol
->n_desc
& N_ARM_THUMB_DEF
) != 0) ) {
1617 // it was prebound to a defined symbol for thumb code in the same linkage unit
1618 // we need to subtract off one to get real addend
1619 addend
= initialValue
- (undefinedSymbol
->n_value
+1);
1623 // is undefined or non-weak symbol, so do subtraction to get addend
1624 addend
= initialValue
- undefinedSymbol
->n_value
;
1628 // non-prebound case
1629 if ( ((undefinedSymbol
->n_type
& N_TYPE
) == N_SECT
) && ((undefinedSymbol
->n_desc
& N_WEAK_DEF
) != 0) ) {
1630 // if target is weak-def in same linkage unit, then bind phase has already set initialValue
1631 // to be definition address plus addend
1632 //dyld::log("weak def, initialValue=0x%lX, undefAddr=0x%lX\n", initialValue, undefinedSymbol->n_value+fSlide);
1633 addend
= initialValue
- (undefinedSymbol
->n_value
+ fSlide
);
1635 // if weak and thumb subtract off extra thumb bit
1636 if ( (undefinedSymbol
->n_desc
& N_ARM_THUMB_DEF
) != 0 )
1641 // nothing fixed up yet, addend is just initial value
1642 //dyld::log("addend=0x%lX\n", initialValue);
1643 addend
= initialValue
;
// choose the bind type from the relocation's pc-relative flag, then rewrite the location
1647 uint8_t type
= BIND_TYPE_POINTER
;
1649 if ( reloc
->r_pcrel
)
1650 type
= BIND_TYPE_TEXT_PCREL32
;
1652 this->bindLocation(context
, this->imageBaseAddress(), (uintptr_t)location
, value
, type
, symbolName
, addend
, this->getPath(), targetImage
? targetImage
->getPath() : NULL
, "weak ", NULL
, fSlide
);
1653 boundSomething
= true;
1657 // scan lazy and non-lazy pointers for uses of symbol_index
1658 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
1659 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
1660 const struct load_command
* cmd
= cmds
;
1661 const uint32_t* const indirectTable
= (uint32_t*)&fLinkEditBase
[fDynamicInfo
->indirectsymoff
];
1662 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
1663 if ( cmd
->cmd
== LC_SEGMENT_COMMAND
) {
1664 const struct macho_segment_command
* seg
= (struct macho_segment_command
*)cmd
;
1665 const struct macho_section
* const sectionsStart
= (struct macho_section
*)((char*)seg
+ sizeof(struct macho_segment_command
));
// NOTE(review): '§ionsStart' below looks like a mis-encoded '&sectionsStart' - confirm against the pristine source
1666 const struct macho_section
* const sectionsEnd
= §ionsStart
[seg
->nsects
];
1667 for (const struct macho_section
* sect
=sectionsStart
; sect
< sectionsEnd
; ++sect
) {
1668 uint32_t elementSize
= sizeof(uintptr_t);
1669 switch ( sect
->flags
& SECTION_TYPE
) {
1671 case S_SYMBOL_STUBS
:
1672 if ( ((sect
->flags
& S_ATTR_SELF_MODIFYING_CODE
) ==0) || (sect
->reserved2
!= 5) )
1676 case S_NON_LAZY_SYMBOL_POINTERS
:
1677 case S_LAZY_SYMBOL_POINTERS
:
1679 size_t elementCount
= sect
->size
/ elementSize
;
1680 const uint32_t indirectTableOffset
= sect
->reserved1
;
1681 uint8_t* ptrToBind
= (uint8_t*)(sect
->addr
+ fSlide
);
1682 //dyld::log(" scanning section %s of %s starting at %p\n", sect->sectname, this->getShortName(), ptrToBind);
1683 for (size_t j
=0; j
< elementCount
; ++j
, ptrToBind
+= elementSize
) {
1684 if ( indirectTable
[indirectTableOffset
+ j
] == symbol_index
) {
1685 //dyld::log(" found symbol index match at %d/%d, ptrToBind=%p\n", j, elementCount, ptrToBind);
1687 this->bindIndirectSymbol((uintptr_t*)ptrToBind
, sect
, it
.symbolName
, value
, targetImage
, context
);
1688 boundSomething
= true;
// advance to the next load command
1696 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
1698 if ( boundSomething
&& (targetImage
!= this) ) {
1699 context
.addDynamicReference(this, targetImage
);
1702 // mark that this symbol has already been bound, so we don't try to bind again
// Binds the symbol-pointer slots of this image that are described by the indirect symbol table.
//
// Iterates over the load commands; for each LC_SEGMENT_COMMAND it visits every section and
// handles three section types: S_NON_LAZY_SYMBOL_POINTERS, S_LAZY_SYMBOL_POINTERS, and
// S_SYMBOL_STUBS sections flagged S_ATTR_SELF_MODIFYING_CODE whose reserved2 is 5.
// Each slot's indirect-table entry is then examined:
//   - INDIRECT_SYMBOL_LOCAL: fSlide is added to the value already in the slot
//   - INDIRECT_SYMBOL_ABS:   the slot is left alone
//   - otherwise:             the symbol is resolved with resolveUndefined() and stored through
//                            bindIndirectSymbol(), and fgTotalBindFixups is incremented
//
// Parameters:
//   context      - link context, forwarded to resolveUndefined() and bindIndirectSymbol()
//   bindNonLazys - tested for non-lazy pointer sections (the statement guarded by that test
//                  is not visible here; presumably the section is skipped when false — TODO confirm)
//   bindLazys    - when true and the slot belongs to a lazily-bound section, resolution is
//                  done with coalescing enabled (dontCoalesce == false)
1707 void ImageLoaderMachOClassic::bindIndirectSymbolPointers(const LinkContext
& context
, bool bindNonLazys
, bool bindLazys
)
1709 // scan for all non-lazy-pointer sections
1710 const bool twoLevel
= this->usesTwoLevelNameSpace();
1711 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
1712 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
1713 const struct load_command
* cmd
= cmds
;
// indirect symbol table: an array of 32-bit entries found at offset indirectsymoff from fLinkEditBase
1714 const uint32_t* const indirectTable
= (uint32_t*)&fLinkEditBase
[fDynamicInfo
->indirectsymoff
];
1715 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
1717 case LC_SEGMENT_COMMAND
:
1719 const struct macho_segment_command
* seg
= (struct macho_segment_command
*)cmd
;
1720 const struct macho_section
* const sectionsStart
= (struct macho_section
*)((char*)seg
+ sizeof(struct macho_segment_command
));
1721 const struct macho_section
* const sectionsEnd
= §ionsStart
[seg
->nsects
];
1722 for (const struct macho_section
* sect
=sectionsStart
; sect
< sectionsEnd
; ++sect
) {
1723 bool isLazySymbol
= false;
1724 const uint8_t type
= sect
->flags
& SECTION_TYPE
;
// by default each slot is one pointer wide; the stub case below recomputes elementCount for 5-byte entries
1725 uint32_t elementSize
= sizeof(uintptr_t);
1726 size_t elementCount
= sect
->size
/ elementSize
;
1727 if ( type
== S_NON_LAZY_SYMBOL_POINTERS
) {
1728 if ( ! bindNonLazys
)
1731 else if ( type
== S_LAZY_SYMBOL_POINTERS
) {
1732 // process each symbol pointer in this section
1733 fgTotalPossibleLazyBindFixups
+= elementCount
;
1734 isLazySymbol
= true;
1739 else if ( (type
== S_SYMBOL_STUBS
) && (sect
->flags
& S_ATTR_SELF_MODIFYING_CODE
) && (sect
->reserved2
== 5) ) {
1740 // process each jmp entry in this section
1741 elementCount
= sect
->size
/ 5;
1743 fgTotalPossibleLazyBindFixups
+= elementCount
;
1744 isLazySymbol
= true;
// reserved1 is used as this section's first index into the indirect symbol table
1752 const uint32_t indirectTableOffset
= sect
->reserved1
;
1753 uint8_t* ptrToBind
= (uint8_t*)(sect
->addr
+ fSlide
);
1754 for (size_t j
=0; j
< elementCount
; ++j
, ptrToBind
+= elementSize
) {
1755 #if LINKEDIT_USAGE_DEBUG
1756 noteAccessedLinkEditAddress(&indirectTable
[indirectTableOffset
+ j
]);
1758 uint32_t symbolIndex
= indirectTable
[indirectTableOffset
+ j
];
1759 if ( symbolIndex
== INDIRECT_SYMBOL_LOCAL
) {
// local symbol: adjust the value already stored in the slot by this image's slide
1760 *((uintptr_t*)ptrToBind
) += this->fSlide
;
1762 else if ( symbolIndex
== INDIRECT_SYMBOL_ABS
) {
1763 // do nothing since already has absolute address
1766 const struct macho_nlist
* sym
= &fSymbolTable
[symbolIndex
];
1767 if ( symbolIndex
== 0 ) {
1768 // This could be rdar://problem/3534709
1769 if ( ((const macho_header
*)fMachOData
)->filetype
== MH_EXECUTE
) {
// function-local static, so the warning below is logged at most once
1770 static bool alreadyWarned
= false;
1771 if ( (sym
->n_type
& N_TYPE
) != N_UNDF
) {
1772 // The indirect table parallels the (non)lazy pointer sections. For
1773 // instance, to find info about the fifth lazy pointer you look at the
1774 // fifth entry in the indirect table. (try otool -Iv on a file).
1775 // The entry in the indirect table contains an index into the symbol table.
1777 // The bug in ld caused the entry in the indirect table to be zero
1778 // (instead of a magic value that means a local symbol). So, if the
1779 // symbolIndex == 0, we may be encountering the bug, or 0 may be a valid
1780 // symbol table index. The check I put in place is to see if the zero'th
1781 // symbol table entry is an import entry (usually it is a local symbol
1783 if ( context
.verboseWarnings
&& !alreadyWarned
) {
1784 dyld::log("dyld: malformed executable '%s', skipping indirect symbol to %s\n",
1785 this->getPath(), &fStrings
[sym
->n_un
.n_strx
]);
1786 alreadyWarned
= true;
1792 const ImageLoader
* image
= NULL
;
1793 // let weak definitions resolve to themselves, later coalescing may overwrite them
1794 bool dontCoalesce
= true;
1795 if ( bindLazys
&& isLazySymbol
) {
1796 // if this is something normally lazy bound, but we are forcing
1797 // it to be bound now, do coalescing
1798 dontCoalesce
= false;
1800 if ( symbolIsWeakReference(sym
) ) {
1801 // when weakbind() is run on a classic mach-o encoding, it won't try
1802 // to coalesce N_REF_TO_WEAK symbols because they are not in the sorted
1803 // range of global symbols. To handle that case we do the coalescing now.
1804 dontCoalesce
= false;
// resolveUndefined() reports the defining image through &image; it is forwarded to bindIndirectSymbol() below
1806 uintptr_t symbolAddr
= resolveUndefined(context
, sym
, twoLevel
, dontCoalesce
, false, &image
);
1808 symbolAddr
= this->bindIndirectSymbol((uintptr_t*)ptrToBind
, sect
, &fStrings
[sym
->n_un
.n_strx
], symbolAddr
, image
, context
);
1810 ++fgTotalBindFixups
;
1817 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
// Resets the 5-byte self-modifying stub entries of this image when prebinding is not usable.
//
// For every S_SYMBOL_STUBS section flagged S_ATTR_SELF_MODIFYING_CODE with reserved2 == 5,
// each 5-byte entry is rewritten in place:
//   - an entry whose bytes span two 64-byte lines, and whose indirect-table entry is not
//     INDIRECT_SYMBOL_ABS, is resolved immediately and written as "JMP rel32" to the target
//   - any entry that still has installLazyHandler set is written as "CALL rel32" to
//     stub_binding_helper_i386_old
// A "const char*" exception raised during the early bind is caught and ignored (the matching
// try statement is not visible in this listing).
//
// Parameters:
//   context - link context, passed to usablePrebinding(), resolveUndefined() and bindIndirectSymbol()
1824 void ImageLoaderMachOClassic::initializeLazyStubs(const LinkContext
& context
)
1826 if ( ! this->usablePrebinding(context
) ) {
1827 // reset all "fast" stubs
1828 const macho_header
* mh
= (macho_header
*)fMachOData
;
1829 const uint32_t cmd_count
= mh
->ncmds
;
1830 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
1831 const struct load_command
* cmd
= cmds
;
1832 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
1834 case LC_SEGMENT_COMMAND
:
1836 const struct macho_segment_command
* seg
= (struct macho_segment_command
*)cmd
;
1837 const struct macho_section
* const sectionsStart
= (struct macho_section
*)((char*)seg
+ sizeof(struct macho_segment_command
));
1838 const struct macho_section
* const sectionsEnd
= §ionsStart
[seg
->nsects
];
1839 for (const struct macho_section
* sect
=sectionsStart
; sect
< sectionsEnd
; ++sect
) {
1840 const uint8_t type
= sect
->flags
& SECTION_TYPE
;
1841 if ( (type
== S_SYMBOL_STUBS
) && (sect
->flags
& S_ATTR_SELF_MODIFYING_CODE
) && (sect
->reserved2
== 5) ) {
1842 // reset each jmp entry in this section
1843 const uint32_t indirectTableOffset
= sect
->reserved1
;
1844 const uint32_t* const indirectTable
= (uint32_t*)&fLinkEditBase
[fDynamicInfo
->indirectsymoff
];
1845 uint8_t* start
= (uint8_t*)(sect
->addr
+ this->fSlide
);
1846 uint8_t* end
= start
+ sect
->size
;
// address that entries left for lazy binding will CALL
1847 uintptr_t dyldHandler
= (uintptr_t)&stub_binding_helper_i386_old
;
// entryIndex advances in step with entry so it can index the indirect table
1848 uint32_t entryIndex
= 0;
1849 for (uint8_t* entry
= start
; entry
< end
; entry
+= 5, ++entryIndex
) {
1850 bool installLazyHandler
= true;
1851 // jump table entries that cross a (64-byte) cache line boundary have the potential to cause crashes
1852 // if the instruction is updated by one thread while being executed by another
// compares the 64-byte-aligned address of the first and last byte of the entry;
// note '+' binds tighter than '&', so the right side is ((uint32_t)entry+4) & 0xFFFFFFC0
1853 if ( ((uint32_t)entry
& 0xFFFFFFC0) != ((uint32_t)entry
+4 & 0xFFFFFFC0) ) {
1854 // need to bind this now to avoid a potential problem if bound lazily
1855 uint32_t symbolIndex
= indirectTable
[indirectTableOffset
+ entryIndex
];
1856 // the latest linker marks 64-byte crossing stubs with INDIRECT_SYMBOL_ABS so they are not used
1857 if ( symbolIndex
!= INDIRECT_SYMBOL_ABS
) {
1858 const char* symbolName
= &fStrings
[fSymbolTable
[symbolIndex
].n_un
.n_strx
];
1859 const ImageLoader
* image
= NULL
;
1861 uintptr_t symbolAddr
= this->resolveUndefined(context
, &fSymbolTable
[symbolIndex
], this->usesTwoLevelNameSpace(), false, false, &image
);
1862 symbolAddr
= this->bindIndirectSymbol((uintptr_t*)entry
, sect
, symbolName
, symbolAddr
, image
, context
);
1863 ++fgTotalBindFixups
;
// displacement is measured from the byte following the 5-byte instruction (entry+5);
// the four displacement bytes are stored least-significant byte first
1864 uint32_t rel32
= symbolAddr
- (((uint32_t)entry
)+5);
1865 entry
[0] = 0xE9; // JMP rel32
1866 entry
[1] = rel32
& 0xFF;
1867 entry
[2] = (rel32
>> 8) & 0xFF;
1868 entry
[3] = (rel32
>> 16) & 0xFF;
1869 entry
[4] = (rel32
>> 24) & 0xFF;
1870 installLazyHandler
= false;
1872 catch (const char* msg
) {
1873 // ignore errors when binding symbols early
1874 // maybe the function is never called, and therefore erroring out now would be a regression
1878 if ( installLazyHandler
) {
// same encoding as above, but a CALL whose target is dyldHandler
1879 uint32_t rel32
= dyldHandler
- (((uint32_t)entry
)+5);
1880 entry
[0] = 0xE8; // CALL rel32
1881 entry
[1] = rel32
& 0xFF;
1882 entry
[2] = (rel32
>> 8) & 0xFF;
1883 entry
[3] = (rel32
>> 16) & 0xFF;
1884 entry
[4] = (rel32
>> 24) & 0xFF;
1891 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
// Performs symbol binding for this image.
//
// Visible sequence: set the crash-log message to this image's path, call initializeLazyStubs(),
// test usablePrebinding(), bind external relocations, bind indirect symbol pointers, call
// setupLazyPointerHandler(), then clear the crash-log message. When TEXT_RELOC_SUPPORT is set
// and fTextSegmentBinds is true, __TEXT is made writable around the binding calls and
// write-protected again afterwards.
// NOTE(review): per the existing comments the binding calls belong to the "no valid prebinding"
// path; the else keyword itself is not visible in this listing — confirm against the full file.
//
// Parameters:
//   context         - link context forwarded to every helper
//   forceLazysBound - when true, lazy pointers are bound now as well
1898 void ImageLoaderMachOClassic::doBind(const LinkContext
& context
, bool forceLazysBound
)
1900 CRSetCrashLogMessage2(this->getPath());
1902 this->initializeLazyStubs(context
);
1905 // if prebound and loaded at prebound address, and all libraries are same as when this was prebound, then no need to bind
1906 // note: flat-namespace binaries need to have imports rebound (even if correctly prebound)
1907 if ( this->usablePrebinding(context
) ) {
1908 // binding already up to date
1911 // no valid prebinding, so bind symbols.
1912 // values bound by name are stored two different ways in classic mach-o:
1914 #if TEXT_RELOC_SUPPORT
1915 // if there are __TEXT fixups, temporarily make __TEXT writable
1916 if ( fTextSegmentBinds
)
1917 this->makeTextSegmentWritable(context
, true);
1920 // 1) external relocations are used for data initialized to external symbols
1921 this->doBindExternalRelocations(context
);
1923 // 2) "indirect symbols" are used for code references to external symbols
1924 // if this image is in the shared cache, there is no way to reset the lazy pointers, so bind them now
// arguments are (context, bindNonLazys=true, bindLazys=forceLazysBound || fInSharedCache)
1925 this->bindIndirectSymbolPointers(context
, true, forceLazysBound
|| fInSharedCache
);
1927 #if TEXT_RELOC_SUPPORT
1928 // if there were __TEXT fixups, restore write protection
1929 if ( fTextSegmentBinds
)
1930 this->makeTextSegmentWritable(context
, false);
1934 // set up dyld entry points in image
1935 this->setupLazyPointerHandler(context
);
1937 CRSetCrashLogMessage2(NULL
);
// Binds only the lazy pointers of this image: calls bindIndirectSymbolPointers() with
// bindNonLazys == false and bindLazys == true.
//
// Parameters:
//   context - link context forwarded to bindIndirectSymbolPointers()
1940 void ImageLoaderMachOClassic::doBindJustLazies(const LinkContext
& context
)
1942 // some API call requested that all lazy pointers in this image be force bound
1943 this->bindIndirectSymbolPointers(context
, false, true);
// Applies interposing to this image by passing stored addresses through interposedAddress()
// and writing back the result whenever it differs from the stored value.
//
// Three kinds of location are visited:
//   1) every pointer in S_NON_LAZY_SYMBOL_POINTERS and S_LAZY_SYMBOL_POINTERS sections
//   2) every 5-byte entry of self-modifying S_SYMBOL_STUBS sections (reserved2 == 5) whose
//      first byte is 0xE9 (JMP); the jump target is recomputed and the rel32 rewritten
//   3) locations named by external relocations whose r_length equals RELOC_SIZE
//      (the case label selecting the relocation type is not visible in this listing)
// When context.verboseInterposing is set, the tuple count and image path are logged first.
//
// Parameters:
//   context - link context; supplies verboseInterposing and is passed to interposedAddress()
1946 void ImageLoaderMachOClassic::doInterpose(const LinkContext
& context
)
1948 if ( context
.verboseInterposing
)
1949 dyld::log("dyld: interposing %lu tuples onto: %s\n", fgInterposingTuples
.size(), this->getPath());
1951 // scan indirect symbols
1952 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
1953 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
1954 const struct load_command
* cmd
= cmds
;
1955 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
1957 case LC_SEGMENT_COMMAND
:
1959 const struct macho_segment_command
* seg
= (struct macho_segment_command
*)cmd
;
1960 const struct macho_section
* const sectionsStart
= (struct macho_section
*)((char*)seg
+ sizeof(struct macho_segment_command
));
1961 const struct macho_section
* const sectionsEnd
= §ionsStart
[seg
->nsects
];
1962 for (const struct macho_section
* sect
=sectionsStart
; sect
< sectionsEnd
; ++sect
) {
1963 const uint8_t type
= sect
->flags
& SECTION_TYPE
;
1964 if ( (type
== S_NON_LAZY_SYMBOL_POINTERS
) || (type
== S_LAZY_SYMBOL_POINTERS
) ) {
// the section is treated as an array of pointer-sized slots located at addr + fSlide
1965 const size_t pointerCount
= sect
->size
/ sizeof(uintptr_t);
1966 uintptr_t* const symbolPointers
= (uintptr_t*)(sect
->addr
+ fSlide
);
1967 for (size_t pointerIndex
=0; pointerIndex
< pointerCount
; ++pointerIndex
) {
1968 uintptr_t newValue
= interposedAddress(context
, symbolPointers
[pointerIndex
], this);
// only store when the value actually changes
1969 if ( newValue
!= symbolPointers
[pointerIndex
] )
1970 symbolPointers
[pointerIndex
] = newValue
;
1974 // i386 has special self-modifying stubs that might be prebound to "JMP rel32" that need checking
1975 else if ( (type
== S_SYMBOL_STUBS
) && ((sect
->flags
& S_ATTR_SELF_MODIFYING_CODE
) != 0) && (sect
->reserved2
== 5) ) {
1976 // check each jmp entry in this section
1977 uint8_t* start
= (uint8_t*)(sect
->addr
+ this->fSlide
);
1978 uint8_t* end
= start
+ sect
->size
;
1979 for (uint8_t* entry
= start
; entry
< end
; entry
+= 5) {
1980 if ( entry
[0] == 0xE9 ) { // 0xE9 == JMP
// rel32 occupies bytes 1..4 and is relative to &entry[5], the byte after the instruction
1981 uint32_t rel32
= *((uint32_t*)&entry
[1]); // assume unaligned load of uint32_t is ok
1982 uint32_t target
= (uint32_t)&entry
[5] + rel32
;
1983 uint32_t newTarget
= interposedAddress(context
, target
, this);
1984 if ( newTarget
!= target
) {
1985 uint32_t newRel32
= newTarget
- (uint32_t)&entry
[5];
1986 *((uint32_t*)&entry
[1]) = newRel32
; // assume unaligned store of uint32_t is ok
1996 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
1999 // scan external relocations
2000 const uintptr_t relocBase
= this->getRelocBase();
// external relocation entries: nextrel records starting at offset extreloff from fLinkEditBase
2001 const relocation_info
* const relocsStart
= (struct relocation_info
*)(&fLinkEditBase
[fDynamicInfo
->extreloff
]);
2002 const relocation_info
* const relocsEnd
= &relocsStart
[fDynamicInfo
->nextrel
];
2003 for (const relocation_info
* reloc
=relocsStart
; reloc
< relocsEnd
; ++reloc
) {
2004 if (reloc
->r_length
== RELOC_SIZE
) {
2005 switch(reloc
->r_type
) {
// r_address is an offset from relocBase to the pointer-sized location being examined
2008 uintptr_t* location
= ((uintptr_t*)(reloc
->r_address
+ relocBase
));
2009 uintptr_t value
= *location
;
2010 uintptr_t newValue
= interposedAddress(context
, value
, this);
2011 if ( newValue
!= value
)
2012 *location
= newValue
;
// Applies the dynamic interposing tuples held in the link context to this image.
//
// Every pointer in S_NON_LAZY_SYMBOL_POINTERS / S_LAZY_SYMBOL_POINTERS sections, and every
// location named by an external relocation whose r_length equals RELOC_SIZE, is compared
// against each tuple's 'replacee'; on a match the location is overwritten with that tuple's
// 'replacement'. Each replacement is logged when context.verboseInterposing is set.
// (The case label selecting the relocation type is not visible in this listing.)
//
// Parameters:
//   context - link context; supplies dynamicInterposeArray, dynamicInterposeCount and
//             verboseInterposing
2020 void ImageLoaderMachOClassic::dynamicInterpose(const LinkContext
& context
)
2022 if ( context
.verboseInterposing
)
2023 dyld::log("dyld: dynamic interposing %lu tuples onto image: %s\n", context
.dynamicInterposeCount
, this->getPath());
2025 // scan indirect symbols
2026 const uint32_t cmd_count
= ((macho_header
*)fMachOData
)->ncmds
;
2027 const struct load_command
* const cmds
= (struct load_command
*)&fMachOData
[sizeof(macho_header
)];
2028 const struct load_command
* cmd
= cmds
;
2029 for (uint32_t i
= 0; i
< cmd_count
; ++i
) {
2031 case LC_SEGMENT_COMMAND
:
2033 const struct macho_segment_command
* seg
= (struct macho_segment_command
*)cmd
;
2034 const struct macho_section
* const sectionsStart
= (struct macho_section
*)((char*)seg
+ sizeof(struct macho_segment_command
));
2035 const struct macho_section
* const sectionsEnd
= §ionsStart
[seg
->nsects
];
2036 for (const struct macho_section
* sect
=sectionsStart
; sect
< sectionsEnd
; ++sect
) {
2037 const uint8_t type
= sect
->flags
& SECTION_TYPE
;
2038 if ( (type
== S_NON_LAZY_SYMBOL_POINTERS
) || (type
== S_LAZY_SYMBOL_POINTERS
) ) {
// the section is treated as an array of pointer-sized slots located at addr + fSlide
2039 const size_t pointerCount
= sect
->size
/ sizeof(uintptr_t);
2040 uintptr_t* const symbolPointers
= (uintptr_t*)(sect
->addr
+ fSlide
);
2041 for (size_t pointerIndex
=0; pointerIndex
< pointerCount
; ++pointerIndex
) {
// each slot is checked against every tuple in the dynamic interpose array
2042 for(size_t j
=0; j
< context
.dynamicInterposeCount
; ++j
) {
2043 // replace all references to 'replacee' with 'replacement'
2044 if ( symbolPointers
[pointerIndex
] == (uintptr_t)context
.dynamicInterposeArray
[j
].replacee
) {
2045 if ( context
.verboseInterposing
) {
2046 dyld::log("dyld: dynamic interposing: at %p replace %p with %p in %s\n",
2047 &symbolPointers
[pointerIndex
], context
.dynamicInterposeArray
[j
].replacee
, context
.dynamicInterposeArray
[j
].replacement
, this->getPath());
2049 symbolPointers
[pointerIndex
] = (uintptr_t)context
.dynamicInterposeArray
[j
].replacement
;
2058 cmd
= (const struct load_command
*)(((char*)cmd
)+cmd
->cmdsize
);
2061 // scan external relocations
2062 const uintptr_t relocBase
= this->getRelocBase();
// external relocation entries: nextrel records starting at offset extreloff from fLinkEditBase
2063 const relocation_info
* const relocsStart
= (struct relocation_info
*)(&fLinkEditBase
[fDynamicInfo
->extreloff
]);
2064 const relocation_info
* const relocsEnd
= &relocsStart
[fDynamicInfo
->nextrel
];
2065 for (const relocation_info
* reloc
=relocsStart
; reloc
< relocsEnd
; ++reloc
) {
2066 if (reloc
->r_length
== RELOC_SIZE
) {
2067 switch(reloc
->r_type
) {
// r_address is an offset from relocBase to the pointer-sized location being examined
2070 uintptr_t* location
= ((uintptr_t*)(reloc
->r_address
+ relocBase
));
2071 for(size_t i
=0; i
< context
.dynamicInterposeCount
; ++i
) {
2072 // replace all references to 'replacee' with 'replacement'
2073 if ( *location
== (uintptr_t)context
.dynamicInterposeArray
[i
].replacee
) {
2074 if ( context
.verboseInterposing
) {
2075 dyld::log("dyld: dynamic interposing: at %p replace %p with %p in %s\n",
2076 location
, context
.dynamicInterposeArray
[i
].replacee
, context
.dynamicInterposeArray
[i
].replacement
, this->getPath());
2078 *location
= (uintptr_t)context
.dynamicInterposeArray
[i
].replacement
;
2089 const char* ImageLoaderMachOClassic::findClosestSymbol(const void* addr
, const void** closestAddr
) const
2091 uintptr_t targetAddress
= (uintptr_t)addr
- fSlide
;
2092 const struct macho_nlist
* bestSymbol
= NULL
;
2093 // first walk all global symbols
2094 const struct macho_nlist
* const globalsStart
= &fSymbolTable
[fDynamicInfo
->iextdefsym
];
2095 const struct macho_nlist
* const globalsEnd
= &globalsStart
[fDynamicInfo
->nextdefsym
];
2096 for (const struct macho_nlist
* s
= globalsStart
; s
< globalsEnd
; ++s
) {
2097 if ( (s
->n_type
& N_TYPE
) == N_SECT
) {
2098 if ( bestSymbol
== NULL
) {
2099 if ( s
->n_value
<= targetAddress
)
2102 else if ( (s
->n_value
<= targetAddress
) && (bestSymbol
->n_value
< s
->n_value
) ) {
2107 // next walk all local symbols
2108 const struct macho_nlist
* const localsStart
= &fSymbolTable
[fDynamicInfo
->ilocalsym
];
2109 const struct macho_nlist
* const localsEnd
= &localsStart
[fDynamicInfo
->nlocalsym
];
2110 for (const struct macho_nlist
* s
= localsStart
; s
< localsEnd
; ++s
) {
2111 if ( ((s
->n_type
& N_TYPE
) == N_SECT
) && ((s
->n_type
& N_STAB
) == 0) ) {
2112 if ( bestSymbol
== NULL
) {
2113 if ( s
->n_value
<= targetAddress
)
2116 else if ( (s
->n_value
<= targetAddress
) && (bestSymbol
->n_value
< s
->n_value
) ) {
2121 if ( bestSymbol
!= NULL
) {
2123 if (bestSymbol
->n_desc
& N_ARM_THUMB_DEF
)
2124 *closestAddr
= (void*)((bestSymbol
->n_value
| 1) + fSlide
);
2126 *closestAddr
= (void*)(bestSymbol
->n_value
+ fSlide
);
2128 *closestAddr
= (void*)(bestSymbol
->n_value
+ fSlide
);
2130 return &fStrings
[bestSymbol
->n_un
.n_strx
];