1 /* -*- mode: C++; c-basic-offset: 4; tab-width: 4 -*-
3 * Copyright (c) 2006-2010 Apple Inc. All rights reserved.
5 * @APPLE_LICENSE_HEADER_START@
7 * This file contains Original Code and/or Modifications of Original Code
8 * as defined in and that are subject to the Apple Public Source License
9 * Version 2.0 (the 'License'). You may not use this file except in
10 * compliance with the License. Please obtain a copy of the License at
11 * http://www.opensource.apple.com/apsl/ and read it before using this
14 * The Original Code and all software distributed under the License are
15 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
16 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
17 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
19 * Please see the License for the specific language governing rights and
20 * limitations under the License.
22 * @APPLE_LICENSE_HEADER_END@
25 #ifndef __LTO_READER_H__
26 #define __LTO_READER_H__
29 #include <sys/param.h>
30 #include <sys/fcntl.h>
33 #include <mach-o/dyld.h>
35 #include <ext/hash_set>
36 #include <ext/hash_map>
38 #include "MachOFileAbstraction.hpp"
39 #include "Architectures.hpp"
41 #include "macho_relocatable_file.h"
44 // #defines are a work around for <rdar://problem/8760268>
45 #define __STDC_LIMIT_MACROS 1
46 #define __STDC_CONSTANT_MACROS 1
47 #include "llvm-c/lto.h"
54 // ld64 only tracks non-internal symbols from an llvm bitcode file.
55 // We model this by having an InternalAtom which represent all internal functions and data.
56 // All non-interal symbols from a bitcode file are represented by an Atom
57 // and each Atom has a reference to the InternalAtom. The InternalAtom
58 // also has references to each symbol external to the bitcode file.
60 class InternalAtom
: public ld::Atom
63 InternalAtom(class File
& f
);
64 // overrides of ld::Atom
65 virtual ld::File
* file() const { return &_file
; }
66 virtual const char* name() const { return "import-atom"; }
67 virtual uint64_t size() const { return 0; }
68 virtual uint64_t objectAddress() const { return 0; }
69 virtual void copyRawContent(uint8_t buffer
[]) const { }
70 virtual void setScope(Scope
) { }
71 virtual ld::Fixup::iterator
fixupsBegin() const { return &_undefs
[0]; }
72 virtual ld::Fixup::iterator
fixupsEnd() const { return &_undefs
[_undefs
.size()]; }
74 // for adding references to symbols outside bitcode file
75 void addReference(const char* nm
)
76 { _undefs
.push_back(ld::Fixup(0, ld::Fixup::k1of1
,
77 ld::Fixup::kindNone
, false, nm
)); }
81 mutable std::vector
<ld::Fixup
> _undefs
;
88 class File
: public ld::relocatable::File
91 File(const char* path
, time_t mTime
, ld::File::Ordinal ordinal
,
92 const uint8_t* content
, uint32_t contentLength
, cpu_type_t arch
);
95 // overrides of ld::File
96 virtual bool forEachAtom(ld::File::AtomHandler
&) const;
97 virtual bool justInTimeforEachAtom(const char* name
, ld::File::AtomHandler
&) const
99 virtual uint32_t cpuSubType() const { return _cpuSubType
; }
101 // overrides of ld::relocatable::File
102 virtual DebugInfoKind
debugInfo() const { return _debugInfo
; }
103 virtual const char* debugInfoPath() const { return _debugInfoPath
; }
104 virtual time_t debugInfoModificationTime() const
105 { return _debugInfoModTime
; }
106 virtual const std::vector
<ld::relocatable::File::Stab
>* stabs() const { return NULL
; }
107 virtual bool canScatterAtoms() const { return true; }
109 lto_module_t
module() { return _module
; }
110 class InternalAtom
& internalAtom() { return _internalAtom
; }
111 void setDebugInfo(ld::relocatable::File::DebugInfoKind k
,
112 const char* pth
, time_t modTime
, uint32_t subtype
)
114 _debugInfoPath
= pth
;
115 _debugInfoModTime
= modTime
;
116 _cpuSubType
= subtype
;}
120 friend class InternalAtom
;
123 cpu_type_t _architecture
;
124 class InternalAtom _internalAtom
;
125 class Atom
* _atomArray
;
126 uint32_t _atomArrayCount
;
127 lto_module_t _module
;
128 const char* _debugInfoPath
;
129 time_t _debugInfoModTime
;
130 ld::Section _section
;
131 ld::Fixup _fixupToInternal
;
132 ld::relocatable::File::DebugInfoKind _debugInfo
;
133 uint32_t _cpuSubType
;
137 // Atom acts as a proxy Atom for the symbols that are exported by LLVM bitcode file. Initially,
138 // Reader creates Atoms to allow linker proceed with usual symbol resolution phase. After
139 // optimization is performed, real Atoms are created for these symobls. However these real Atoms
140 // are not inserted into global symbol table. Atom holds real Atom and forwards appropriate
141 // methods to real atom.
143 class Atom
: public ld::Atom
146 Atom(File
& f
, const char* name
, ld::Atom::Scope s
,
147 ld::Atom::Definition d
, ld::Atom::Combine c
, ld::Atom::Alignment a
, bool ah
);
149 // overrides of ld::Atom
150 virtual ld::File
* file() const { return &_file
; }
151 virtual const char* translationUnitSource() const
152 { return (_compiledAtom
? _compiledAtom
->translationUnitSource() : NULL
); }
153 virtual const char* name() const { return _name
; }
154 virtual uint64_t size() const { return (_compiledAtom
? _compiledAtom
->size() : 0); }
155 virtual uint64_t objectAddress() const { return (_compiledAtom
? _compiledAtom
->objectAddress() : 0); }
156 virtual void copyRawContent(uint8_t buffer
[]) const
157 { if (_compiledAtom
) _compiledAtom
->copyRawContent(buffer
); }
158 virtual const uint8_t* rawContentPointer() const
159 { return (_compiledAtom
? _compiledAtom
->rawContentPointer() : NULL
); }
160 virtual unsigned long contentHash(const class ld::IndirectBindingTable
& ibt
) const
161 { return (_compiledAtom
? _compiledAtom
->contentHash(ibt
) : 0); }
162 virtual bool canCoalesceWith(const ld::Atom
& rhs
, const class ld::IndirectBindingTable
& ibt
) const
163 { return (_compiledAtom
? _compiledAtom
->canCoalesceWith(rhs
,ibt
) : false); }
164 virtual ld::Fixup::iterator
fixupsBegin() const
165 { return (_compiledAtom
? _compiledAtom
->fixupsBegin() : (ld::Fixup
*)&_file
._fixupToInternal
); }
166 virtual ld::Fixup::iterator
fixupsEnd() const
167 { return (_compiledAtom
? _compiledAtom
->fixupsEnd() : &((ld::Fixup
*)&_file
._fixupToInternal
)[1]); }
168 virtual ld::Atom::UnwindInfo::iterator
beginUnwind() const
169 { return (_compiledAtom
? _compiledAtom
->beginUnwind() : NULL
); }
170 virtual ld::Atom::UnwindInfo::iterator
endUnwind() const
171 { return (_compiledAtom
? _compiledAtom
->endUnwind() : NULL
); }
172 virtual ld::Atom::LineInfo::iterator
beginLineInfo() const
173 { return (_compiledAtom
? _compiledAtom
->beginLineInfo() : NULL
); }
174 virtual ld::Atom::LineInfo::iterator
endLineInfo() const
175 { return (_compiledAtom
? _compiledAtom
->endLineInfo() : NULL
); }
177 const ld::Atom
* compiledAtom() { return _compiledAtom
; }
178 void setCompiledAtom(const ld::Atom
& atom
);
184 const ld::Atom
* _compiledAtom
;
196 static bool validFile(const uint8_t* fileContent
, uint64_t fileLength
, cpu_type_t architecture
, cpu_subtype_t subarch
);
197 static const char* fileKind(const uint8_t* fileContent
, uint64_t fileLength
);
198 static File
* parse(const uint8_t* fileContent
, uint64_t fileLength
, const char* path
,
199 time_t modTime
, ld::File::Ordinal ordinal
, cpu_type_t architecture
, cpu_subtype_t subarch
, bool logAllFiles
);
200 static bool libLTOisLoaded() { return (::lto_get_version() != NULL
); }
201 static bool optimize( const std::vector
<const ld::Atom
*>& allAtoms
,
203 const OptimizeOptions
& options
,
204 ld::File::AtomHandler
& handler
,
205 std::vector
<const ld::Atom
*>& newAtoms
,
206 std::vector
<const char*>& additionalUndefines
);
208 static const char* ltoVersion() { return ::lto_get_version(); }
211 static const char* tripletPrefixForArch(cpu_type_t arch
);
212 static ld::relocatable::File
* parseMachOFile(const uint8_t* p
, size_t len
, const OptimizeOptions
& options
);
217 bool operator()(const char* left
, const char* right
) const { return (strcmp(left
, right
) == 0); }
219 typedef __gnu_cxx::hash_set
<const char*, __gnu_cxx::hash
<const char*>, CStringEquals
> CStringSet
;
220 typedef __gnu_cxx::hash_map
<const char*, Atom
*, __gnu_cxx::hash
<const char*>, CStringEquals
> CStringToAtom
;
222 class AtomSyncer
: public ld::File::AtomHandler
{
224 AtomSyncer(std::vector
<const char*>& a
, std::vector
<const ld::Atom
*>&na
,
225 CStringToAtom la
, CStringToAtom dla
, const OptimizeOptions
& options
) :
226 _options(options
), _additionalUndefines(a
), _newAtoms(na
), _llvmAtoms(la
), _deadllvmAtoms(dla
) { }
227 virtual void doAtom(const class ld::Atom
&);
228 virtual void doFile(const class ld::File
&) { }
230 const OptimizeOptions
& _options
;
231 std::vector
<const char*>& _additionalUndefines
;
232 std::vector
<const ld::Atom
*>& _newAtoms
;
233 CStringToAtom _llvmAtoms
;
234 CStringToAtom _deadllvmAtoms
;
237 static std::vector
<File
*> _s_files
;
240 std::vector
<File
*> Parser::_s_files
;
243 bool Parser::validFile(const uint8_t* fileContent
, uint64_t fileLength
, cpu_type_t architecture
, cpu_subtype_t subarch
)
245 for (const ArchInfo
* t
=archInfoArray
; t
->archName
!= NULL
; ++t
) {
246 if ( (architecture
== t
->cpuType
) && (!(t
->isSubType
) || (subarch
== t
->cpuSubType
)) ) {
247 bool result
= ::lto_module_is_object_file_in_memory_for_target(fileContent
, fileLength
, t
->llvmTriplePrefix
);
249 // <rdar://problem/8434487> LTO only supports thumbv7 not armv7
250 if ( t
->llvmTriplePrefixAlt
[0] != '\0' ) {
251 result
= ::lto_module_is_object_file_in_memory_for_target(fileContent
, fileLength
, t
->llvmTriplePrefixAlt
);
260 const char* Parser::fileKind(const uint8_t* p
, uint64_t fileLength
)
262 if ( (p
[0] == 0xDE) && (p
[1] == 0xC0) && (p
[2] == 0x17) && (p
[3] == 0x0B) ) {
263 cpu_type_t arch
= LittleEndian::get32(*((uint32_t*)(&p
[16])));
264 for (const ArchInfo
* t
=archInfoArray
; t
->archName
!= NULL
; ++t
) {
265 if ( arch
== t
->cpuType
) {
266 if ( t
->isSubType
) {
267 if ( ::lto_module_is_object_file_in_memory_for_target(p
, fileLength
, t
->llvmTriplePrefix
) )
275 return "unknown bitcode architecture";
280 File
* Parser::parse(const uint8_t* fileContent
, uint64_t fileLength
, const char* path
, time_t modTime
, ld::File::Ordinal ordinal
,
281 cpu_type_t architecture
, cpu_subtype_t subarch
, bool logAllFiles
)
283 File
* f
= new File(path
, modTime
, ordinal
, fileContent
, fileLength
, architecture
);
284 _s_files
.push_back(f
);
286 printf("%s\n", path
);
291 ld::relocatable::File
* Parser::parseMachOFile(const uint8_t* p
, size_t len
, const OptimizeOptions
& options
)
293 mach_o::relocatable::ParserOptions objOpts
;
294 objOpts
.architecture
= options
.arch
;
295 objOpts
.objSubtypeMustMatch
= false;
296 objOpts
.logAllFiles
= false;
297 objOpts
.convertUnwindInfo
= true;
300 // mach-o parsing is done in-memory, but need path for debug notes
301 const char* path
= "/tmp/lto.o";
303 if ( options
.tmpObjectFilePath
!= NULL
) {
304 path
= options
.tmpObjectFilePath
;
305 struct stat statBuffer
;
306 if ( stat(options
.tmpObjectFilePath
, &statBuffer
) == 0 )
307 modTime
= statBuffer
.st_mtime
;
310 ld::relocatable::File
* result
= mach_o::relocatable::parse(p
, len
, path
, modTime
, ld::File::Ordinal::LTOOrdinal(), objOpts
);
311 if ( result
!= NULL
)
313 throw "LLVM LTO, file is not of required architecture";
318 File::File(const char* pth
, time_t mTime
, ld::File::Ordinal ordinal
, const uint8_t* content
, uint32_t contentLength
, cpu_type_t arch
)
319 : ld::relocatable::File(pth
,mTime
,ordinal
), _architecture(arch
), _internalAtom(*this),
320 _atomArray(NULL
), _atomArrayCount(0), _module(NULL
), _debugInfoPath(pth
),
321 _section("__TEXT_", "__tmp_lto", ld::Section::typeTempLTO
),
322 _fixupToInternal(0, ld::Fixup::k1of1
, ld::Fixup::kindNone
, &_internalAtom
),
323 _debugInfo(ld::relocatable::File::kDebugInfoNone
), _cpuSubType(0)
325 const bool log
= false;
327 // create llvm module
328 _module
= ::lto_module_create_from_memory(content
, contentLength
);
329 if ( _module
== NULL
)
330 throwf("could not parse object file %s: %s", pth
, lto_get_error_message());
332 if ( log
) fprintf(stderr
, "bitcode file: %s\n", pth
);
334 // create atom for each global symbol in module
335 uint32_t count
= ::lto_module_get_num_symbols(_module
);
336 _atomArray
= (Atom
*)malloc(sizeof(Atom
)*count
);
337 for (uint32_t i
=0; i
< count
; ++i
) {
338 const char* name
= ::lto_module_get_symbol_name(_module
, i
);
339 lto_symbol_attributes attr
= lto_module_get_symbol_attribute(_module
, i
);
341 // <rdar://problem/6378110> LTO doesn't like dtrace symbols
342 // ignore dtrace static probes for now
343 // later when codegen is done and a mach-o file is produces the probes will be processed
344 if ( (strncmp(name
, "___dtrace_probe$", 16) == 0) || (strncmp(name
, "___dtrace_isenabled$", 20) == 0) )
347 ld::Atom::Definition def
;
348 ld::Atom::Combine combine
= ld::Atom::combineNever
;
349 switch ( attr
& LTO_SYMBOL_DEFINITION_MASK
) {
350 case LTO_SYMBOL_DEFINITION_REGULAR
:
351 def
= ld::Atom::definitionRegular
;
353 case LTO_SYMBOL_DEFINITION_TENTATIVE
:
354 def
= ld::Atom::definitionTentative
;
356 case LTO_SYMBOL_DEFINITION_WEAK
:
357 def
= ld::Atom::definitionRegular
;
358 combine
= ld::Atom::combineByName
;
360 case LTO_SYMBOL_DEFINITION_UNDEFINED
:
361 case LTO_SYMBOL_DEFINITION_WEAKUNDEF
:
362 def
= ld::Atom::definitionProxy
;
365 throwf("unknown definition kind for symbol %s in bitcode file %s", name
, pth
);
368 // make LLVM atoms for definitions and a reference for undefines
369 if ( def
!= ld::Atom::definitionProxy
) {
370 ld::Atom::Scope scope
;
371 bool autohide
= false;
372 switch ( attr
& LTO_SYMBOL_SCOPE_MASK
) {
373 case LTO_SYMBOL_SCOPE_INTERNAL
:
374 scope
= ld::Atom::scopeTranslationUnit
;
376 case LTO_SYMBOL_SCOPE_HIDDEN
:
377 scope
= ld::Atom::scopeLinkageUnit
;
379 case LTO_SYMBOL_SCOPE_DEFAULT
:
380 scope
= ld::Atom::scopeGlobal
;
382 #if LTO_API_VERSION >= 4
383 case LTO_SYMBOL_SCOPE_DEFAULT_CAN_BE_HIDDEN
:
384 scope
= ld::Atom::scopeGlobal
;
389 throwf("unknown scope for symbol %s in bitcode file %s", name
, pth
);
391 // only make atoms for non-internal symbols
392 if ( scope
== ld::Atom::scopeTranslationUnit
)
394 uint8_t alignment
= (attr
& LTO_SYMBOL_ALIGNMENT_MASK
);
395 // make Atom using placement new operator
396 new (&_atomArray
[_atomArrayCount
++]) Atom(*this, name
, scope
, def
, combine
, alignment
, autohide
);
397 if ( scope
!= ld::Atom::scopeTranslationUnit
)
398 _internalAtom
.addReference(name
);
399 if ( log
) fprintf(stderr
, "\t0x%08X %s\n", attr
, name
);
402 // add to list of external references
403 _internalAtom
.addReference(name
);
404 if ( log
) fprintf(stderr
, "\t%s (undefined)\n", name
);
411 if ( _module
!= NULL
)
412 ::lto_module_dispose(_module
);
415 bool File::forEachAtom(ld::File::AtomHandler
& handler
) const
417 handler
.doAtom(_internalAtom
);
418 for(uint32_t i
=0; i
< _atomArrayCount
; ++i
) {
419 handler
.doAtom(_atomArray
[i
]);
424 InternalAtom::InternalAtom(File
& f
)
425 : ld::Atom(f
._section
, ld::Atom::definitionRegular
, ld::Atom::combineNever
, ld::Atom::scopeTranslationUnit
,
426 ld::Atom::typeLTOtemporary
, ld::Atom::symbolTableNotIn
, true, false, false, ld::Atom::Alignment(0)),
431 Atom::Atom(File
& f
, const char* nm
, ld::Atom::Scope s
, ld::Atom::Definition d
, ld::Atom::Combine c
,
432 ld::Atom::Alignment a
, bool ah
)
433 : ld::Atom(f
._section
, d
, c
, s
, ld::Atom::typeLTOtemporary
,
434 ld::Atom::symbolTableIn
, false, false, false, a
),
435 _file(f
), _name(nm
), _compiledAtom(NULL
)
441 void Atom::setCompiledAtom(const ld::Atom
& atom
)
443 // set delegate so virtual methods go to it
444 _compiledAtom
= &atom
;
446 //fprintf(stderr, "setting lto atom %p to delegate to mach-o atom %p (%s)\n", this, &atom, atom.name());
448 // update fields in ld::Atom to match newly constructed mach-o atom
449 (const_cast<Atom
*>(this))->setAttributesFromAtom(atom
);
454 bool Parser::optimize( const std::vector
<const ld::Atom
*>& allAtoms
,
456 const OptimizeOptions
& options
,
457 ld::File::AtomHandler
& handler
,
458 std::vector
<const ld::Atom
*>& newAtoms
,
459 std::vector
<const char*>& additionalUndefines
)
461 const bool logMustPreserve
= false;
462 const bool logExtraOptions
= false;
463 const bool logBitcodeFiles
= false;
464 const bool logAtomsBeforeSync
= false;
466 // exit quickly if nothing to do
467 if ( _s_files
.size() == 0 )
470 // print out LTO version string if -v was used
471 if ( options
.verbose
)
472 fprintf(stderr
, "%s\n", lto_get_version());
474 // create optimizer and add each Reader
475 lto_code_gen_t generator
= ::lto_codegen_create();
476 for (std::vector
<File
*>::iterator it
=_s_files
.begin(); it
!= _s_files
.end(); ++it
) {
477 if ( logBitcodeFiles
) fprintf(stderr
, "lto_codegen_add_module(%s)\n", (*it
)->path());
478 if ( ::lto_codegen_add_module(generator
, (*it
)->module()) )
479 throwf("lto: could not merge in %s because %s", (*it
)->path(), ::lto_get_error_message());
482 // add any -mllvm command line options
483 for (std::vector
<const char*>::const_iterator it
=options
.llvmOptions
->begin(); it
!= options
.llvmOptions
->end(); ++it
) {
484 if ( logExtraOptions
) fprintf(stderr
, "passing option to llvm: %s\n", *it
);
485 ::lto_codegen_debug_options(generator
, *it
);
488 // The atom graph uses directed edges (references). Collect all references where
489 // originating atom is not part of any LTO Reader. This allows optimizer to optimize an
490 // external (i.e. not originated from same .o file) reference if all originating atoms are also
491 // defined in llvm bitcode file.
492 CStringSet nonLLVMRefs
;
493 CStringToAtom llvmAtoms
;
494 bool hasNonllvmAtoms
= false;
495 for (std::vector
<const ld::Atom
*>::const_iterator it
= allAtoms
.begin(); it
!= allAtoms
.end(); ++it
) {
496 const ld::Atom
* atom
= *it
;
497 // only look at references that come from an atom that is not an llvm atom
498 if ( atom
->contentType() != ld::Atom::typeLTOtemporary
) {
499 if ( (atom
->section().type() != ld::Section::typeMachHeader
) && (atom
->definition() != ld::Atom::definitionProxy
) ) {
500 hasNonllvmAtoms
= true;
502 const ld::Atom
* target
;
503 for (ld::Fixup::iterator fit
=atom
->fixupsBegin(); fit
!= atom
->fixupsEnd(); ++fit
) {
504 switch ( fit
->binding
) {
505 case ld::Fixup::bindingDirectlyBound
:
506 // that reference an llvm atom
507 if ( fit
->u
.target
->contentType() == ld::Atom::typeLTOtemporary
)
508 nonLLVMRefs
.insert(fit
->u
.target
->name());
510 case ld::Fixup::bindingsIndirectlyBound
:
511 target
= state
.indirectBindingTable
[fit
->u
.bindingIndex
];
512 if ( target
== NULL
)
513 throwf("'%s' in %s contains undefined reference", atom
->name(), atom
->file()->path());
514 assert(target
!= NULL
);
515 if ( target
->contentType() == ld::Atom::typeLTOtemporary
)
516 nonLLVMRefs
.insert(target
->name());
523 llvmAtoms
[atom
->name()] = (Atom
*)atom
;
526 // if entry point is in a llvm bitcode file, it must be preserved by LTO
527 if ( state
.entryPoint
!= NULL
) {
528 if ( state
.entryPoint
->contentType() == ld::Atom::typeLTOtemporary
)
529 nonLLVMRefs
.insert(state
.entryPoint
->name());
532 // deadAtoms are the atoms that the linker coalesced. For instance weak or tentative definitions
533 // overriden by another atom. If any of these deadAtoms are llvm atoms and they were replaced
534 // with a mach-o atom, we need to tell the lto engine to preserve (not optimize away) its dead
535 // atom so that the linker can replace it with the mach-o one later.
536 CStringToAtom deadllvmAtoms
;
537 for (std::vector
<const ld::Atom
*>::const_iterator it
= allAtoms
.begin(); it
!= allAtoms
.end(); ++it
) {
538 const ld::Atom
* atom
= *it
;
539 if ( atom
->coalescedAway() && (atom
->contentType() == ld::Atom::typeLTOtemporary
) ) {
540 const char* name
= atom
->name();
541 if ( logMustPreserve
) fprintf(stderr
, "lto_codegen_add_must_preserve_symbol(%s) because linker coalesce away and replace with a mach-o atom\n", name
);
542 ::lto_codegen_add_must_preserve_symbol(generator
, name
);
543 deadllvmAtoms
[name
] = (Atom
*)atom
;
546 for (std::vector
<File
*>::iterator it
=_s_files
.begin(); it
!= _s_files
.end(); ++it
) {
548 for(uint32_t i
=0; i
< file
->_atomArrayCount
; ++i
) {
549 Atom
* llvmAtom
= &file
->_atomArray
[i
];
550 if ( llvmAtom
->coalescedAway() ) {
551 const char* name
= llvmAtom
->name();
552 if ( deadllvmAtoms
.find(name
) == deadllvmAtoms
.end() ) {
553 if ( logMustPreserve
)
554 fprintf(stderr
, "lto_codegen_add_must_preserve_symbol(%s) because linker coalesce away and replace with a mach-o atom\n", name
);
555 ::lto_codegen_add_must_preserve_symbol(generator
, name
);
556 deadllvmAtoms
[name
] = (Atom
*)llvmAtom
;
559 else if ( options
.linkerDeadStripping
&& !llvmAtom
->live() ) {
560 const char* name
= llvmAtom
->name();
561 deadllvmAtoms
[name
] = (Atom
*)llvmAtom
;
566 // tell code generator about symbols that must be preserved
567 for (CStringToAtom::iterator it
= llvmAtoms
.begin(); it
!= llvmAtoms
.end(); ++it
) {
568 const char* name
= it
->first
;
569 Atom
* atom
= it
->second
;
570 // Include llvm Symbol in export list if it meets one of following two conditions
571 // 1 - atom scope is global (and not linkage unit).
572 // 2 - included in nonLLVMRefs set.
573 // If a symbol is not listed in exportList then LTO is free to optimize it away.
574 if ( (atom
->scope() == ld::Atom::scopeGlobal
) && options
.preserveAllGlobals
) {
575 if ( logMustPreserve
) fprintf(stderr
, "lto_codegen_add_must_preserve_symbol(%s) because global symbol\n", name
);
576 ::lto_codegen_add_must_preserve_symbol(generator
, name
);
578 else if ( nonLLVMRefs
.find(name
) != nonLLVMRefs
.end() ) {
579 if ( logMustPreserve
) fprintf(stderr
, "lto_codegen_add_must_preserve_symbol(%s) because referenced by a mach-o atom\n", name
);
580 ::lto_codegen_add_must_preserve_symbol(generator
, name
);
584 // special case running ld -r on all bitcode files to produce another bitcode file (instead of mach-o)
585 if ( options
.relocatable
&& !hasNonllvmAtoms
) {
586 if ( ! ::lto_codegen_write_merged_modules(generator
, options
.outputFilePath
) ) {
587 // HACK, no good way to tell linker we are all done, so just quit
590 warning("could not produce merged bitcode file");
593 // set code-gen model
594 lto_codegen_model model
= LTO_CODEGEN_PIC_MODEL_DYNAMIC
;
595 if ( options
.mainExecutable
) {
596 if ( options
.staticExecutable
) {
597 // darwin x86_64 "static" code model is really dynamic code model
598 if ( options
.arch
== CPU_TYPE_X86_64
)
599 model
= LTO_CODEGEN_PIC_MODEL_DYNAMIC
;
601 model
= LTO_CODEGEN_PIC_MODEL_STATIC
;
605 model
= LTO_CODEGEN_PIC_MODEL_DYNAMIC
;
607 model
= LTO_CODEGEN_PIC_MODEL_DYNAMIC_NO_PIC
;
611 if ( options
.allowTextRelocs
)
612 model
= LTO_CODEGEN_PIC_MODEL_DYNAMIC_NO_PIC
;
614 model
= LTO_CODEGEN_PIC_MODEL_DYNAMIC
;
616 if ( ::lto_codegen_set_pic_model(generator
, model
) )
617 throwf("could not create set codegen model: %s", lto_get_error_message());
619 // if requested, save off merged bitcode file
620 if ( options
.saveTemps
) {
621 char tempBitcodePath
[MAXPATHLEN
];
622 strcpy(tempBitcodePath
, options
.outputFilePath
);
623 strcat(tempBitcodePath
, ".lto.bc");
624 ::lto_codegen_write_merged_modules(generator
, tempBitcodePath
);
627 #if LTO_API_VERSION >= 3
628 // find assembler next to linker
630 uint32_t bufSize
= PATH_MAX
;
631 if ( _NSGetExecutablePath(path
, &bufSize
) != -1 ) {
632 char* lastSlash
= strrchr(path
, '/');
633 if ( lastSlash
!= NULL
) {
634 strcpy(lastSlash
+1, "as");
635 struct stat statInfo
;
636 if ( stat(path
, &statInfo
) == 0 )
637 ::lto_codegen_set_assembler_path(generator
, path
);
641 // run code generator
643 const uint8_t* machOFile
= (uint8_t*)::lto_codegen_compile(generator
, &machOFileLen
);
644 if ( machOFile
== NULL
)
645 throwf("could not do LTO codegen: %s", ::lto_get_error_message());
647 // if requested, save off temp mach-o file
648 if ( options
.saveTemps
) {
649 char tempMachoPath
[MAXPATHLEN
];
650 strcpy(tempMachoPath
, options
.outputFilePath
);
651 strcat(tempMachoPath
, ".lto.o");
652 int fd
= ::open(tempMachoPath
, O_CREAT
| O_WRONLY
| O_TRUNC
, 0666);
654 ::write(fd
, machOFile
, machOFileLen
);
657 // save off merged bitcode file
658 char tempOptBitcodePath
[MAXPATHLEN
];
659 strcpy(tempOptBitcodePath
, options
.outputFilePath
);
660 strcat(tempOptBitcodePath
, ".lto.opt.bc");
661 ::lto_codegen_write_merged_modules(generator
, tempOptBitcodePath
);
664 // if needed, save temp mach-o file to specific location
665 if ( options
.tmpObjectFilePath
!= NULL
) {
666 int fd
= ::open(options
.tmpObjectFilePath
, O_CREAT
| O_WRONLY
| O_TRUNC
, 0666);
668 ::write(fd
, machOFile
, machOFileLen
);
672 warning("could not write LTO temp file '%s', errno=%d", options
.tmpObjectFilePath
, errno
);
676 // parse generated mach-o file into a MachOReader
677 ld::relocatable::File
* machoFile
= parseMachOFile(machOFile
, machOFileLen
, options
);
679 // sync generated mach-o atoms with existing atoms ld knows about
680 if ( logAtomsBeforeSync
) {
681 fprintf(stderr
, "llvmAtoms:\n");
682 for (CStringToAtom::iterator it
= llvmAtoms
.begin(); it
!= llvmAtoms
.end(); ++it
) {
683 const char* name
= it
->first
;
684 //Atom* atom = it->second;
685 fprintf(stderr
, "\t%s\n", name
);
687 fprintf(stderr
, "deadllvmAtoms:\n");
688 for (CStringToAtom::iterator it
= deadllvmAtoms
.begin(); it
!= deadllvmAtoms
.end(); ++it
) {
689 const char* name
= it
->first
;
690 //Atom* atom = it->second;
691 fprintf(stderr
, "\t%s\n", name
);
694 AtomSyncer
syncer(additionalUndefines
, newAtoms
, llvmAtoms
, deadllvmAtoms
, options
);
695 machoFile
->forEachAtom(syncer
);
697 // Remove InternalAtoms from ld
698 for (std::vector
<File
*>::iterator it
=_s_files
.begin(); it
!= _s_files
.end(); ++it
) {
699 (*it
)->internalAtom().setCoalescedAway();
701 // Remove Atoms from ld if code generator optimized them away
702 for (CStringToAtom::iterator li
= llvmAtoms
.begin(), le
= llvmAtoms
.end(); li
!= le
; ++li
) {
703 // check if setRealAtom() called on this Atom
704 if ( li
->second
->compiledAtom() == NULL
) {
705 //fprintf(stderr, "llvm optimized away %p %s\n", li->second, li->second->name());
706 li
->second
->setCoalescedAway();
710 // notify about file level attributes
711 handler
.doFile(*machoFile
);
713 // if final mach-o file has debug info, update original bitcode files to match
714 for (std::vector
<File
*>::iterator it
=_s_files
.begin(); it
!= _s_files
.end(); ++it
) {
715 (*it
)->setDebugInfo(machoFile
->debugInfo(), machoFile
->path(),
716 machoFile
->modificationTime(), machoFile
->cpuSubType());
723 void Parser::AtomSyncer::doAtom(const ld::Atom
& machoAtom
)
725 // update proxy atoms to point to real atoms and find new atoms
726 const char* name
= machoAtom
.name();
727 if ( machoAtom
.scope() >= ld::Atom::scopeLinkageUnit
) {
728 CStringToAtom::iterator pos
= _llvmAtoms
.find(name
);
729 if ( pos
!= _llvmAtoms
.end() ) {
730 // turn Atom into a proxy for this mach-o atom
731 pos
->second
->setCompiledAtom(machoAtom
);
734 // an atom of this name was not in the allAtoms list the linker gave us
735 if ( _deadllvmAtoms
.find(name
) != _deadllvmAtoms
.end() ) {
736 // this corresponding to an atom that the linker coalesced away or marked not-live
737 if ( _options
.linkerDeadStripping
) {
738 // llvm seems to want this atom and -dead_strip is enabled, so it will be deleted if not needed, so add back
739 Atom
* llvmAtom
= _deadllvmAtoms
[name
];
740 llvmAtom
->setCompiledAtom(machoAtom
);
741 _newAtoms
.push_back(&machoAtom
);
744 // Don't pass it back as a new atom
749 // this is something new that lto conjured up, tell ld its new
750 _newAtoms
.push_back(&machoAtom
);
755 // ld only knew about non-static atoms, so this one must be new
756 _newAtoms
.push_back(&machoAtom
);
759 // adjust fixups to go through proxy atoms
760 //fprintf(stderr, "adjusting fixups in atom: %s\n", machoAtom.name());
761 for (ld::Fixup::iterator fit
=machoAtom
.fixupsBegin(); fit
!= machoAtom
.fixupsEnd(); ++fit
) {
762 switch ( fit
->binding
) {
763 case ld::Fixup::bindingNone
:
765 case ld::Fixup::bindingByNameUnbound
:
766 // don't know if this target has been seen by linker before or if it is new
767 // be conservative and tell linker it is new
768 _additionalUndefines
.push_back(fit
->u
.name
);
769 //fprintf(stderr, " by name ref to: %s\n", fit->u.name);
771 case ld::Fixup::bindingDirectlyBound
:
772 // If mach-o atom is referencing another mach-o atom then
773 // reference is not going through Atom proxy. Fix it here to ensure that all
774 // llvm symbol references always go through Atom proxy.
775 if ( fit
->u
.target
->scope() != ld::Atom::scopeTranslationUnit
) {
776 const char* targetName
= fit
->u
.target
->name();
777 CStringToAtom::iterator pos
= _llvmAtoms
.find(targetName
);
778 if ( pos
!= _llvmAtoms
.end() ) {
779 fit
->u
.target
= pos
->second
;
782 if ( _deadllvmAtoms
.find(targetName
) != _deadllvmAtoms
.end() ) {
783 // target was coalesed away and replace by mach-o atom from a non llvm .o file
784 fit
->binding
= ld::Fixup::bindingByNameUnbound
;
785 fit
->u
.name
= targetName
;
789 //fprintf(stderr, " direct ref to: %s (scope=%d)\n", fit->u.target->name(), fit->u.target->scope());
791 case ld::Fixup::bindingByContentBound
:
792 //fprintf(stderr, " direct by content to: %s\n", fit->u.target->name());
794 case ld::Fixup::bindingsIndirectlyBound
:
795 assert(0 && "indirect binding found in initial mach-o file?");
796 //fprintf(stderr, " indirect by content to: %u\n", fit->u.bindingIndex);
804 static pthread_mutex_t lto_lock
;
806 Mutex() { pthread_mutex_lock(<o_lock
); }
807 ~Mutex() { pthread_mutex_unlock(<o_lock
); }
809 pthread_mutex_t
Mutex::lto_lock
= PTHREAD_MUTEX_INITIALIZER
;
812 // Used by archive reader to see if member is an llvm bitcode file
814 bool isObjectFile(const uint8_t* fileContent
, uint64_t fileLength
, cpu_type_t architecture
, cpu_subtype_t subarch
)
817 return Parser::validFile(fileContent
, fileLength
, architecture
, subarch
);
822 // main function used by linker to instantiate ld::Files
824 ld::relocatable::File
* parse(const uint8_t* fileContent
, uint64_t fileLength
,
825 const char* path
, time_t modTime
, ld::File::Ordinal ordinal
,
826 cpu_type_t architecture
, cpu_subtype_t subarch
, bool logAllFiles
)
829 if ( Parser::validFile(fileContent
, fileLength
, architecture
, subarch
) )
830 return Parser::parse(fileContent
, fileLength
, path
, modTime
, ordinal
, architecture
, subarch
, logAllFiles
);
836 // used by "ld -v" to report version of libLTO.dylib being used
838 const char* version()
841 return ::lto_get_version();
846 // used by ld for error reporting
848 bool libLTOisLoaded()
851 return (::lto_get_version() != NULL
);
855 // used by ld for error reporting
857 const char* archName(const uint8_t* fileContent
, uint64_t fileLength
)
860 return Parser::fileKind(fileContent
, fileLength
);
864 // used by ld for doing link time optimization
866 bool optimize( const std::vector
<const ld::Atom
*>& allAtoms
,
868 const OptimizeOptions
& options
,
869 ld::File::AtomHandler
& handler
,
870 std::vector
<const ld::Atom
*>& newAtoms
,
871 std::vector
<const char*>& additionalUndefines
)
874 return Parser::optimize(allAtoms
, state
, options
, handler
, newAtoms
, additionalUndefines
);