1 /* -*- mode: C++; c-basic-offset: 4; tab-width: 4 -*-
3 * Copyright (c) 2015 Apple Inc. All rights reserved.
5 * @APPLE_LICENSE_HEADER_START@
7 * This file contains Original Code and/or Modifications of Original Code
8 * as defined in and that are subject to the Apple Public Source License
9 * Version 2.0 (the 'License'). You may not use this file except in
10 * compliance with the License. Please obtain a copy of the License at
11 * http://www.opensource.apple.com/apsl/ and read it before using this
14 * The Original Code and all software distributed under the License are
15 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
16 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
17 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
19 * Please see the License for the specific language governing rights and
20 * limitations under the License.
22 * @APPLE_LICENSE_HEADER_END@
30 #include <mach/machine.h>
35 #include <unordered_map>
38 #include "code_dedup.h"
46 class DeDupAliasAtom
: public ld::Atom
49 DeDupAliasAtom(const ld::Atom
* dupOf
, const ld::Atom
* replacement
) :
50 ld::Atom(dupOf
->section(), ld::Atom::definitionRegular
, ld::Atom::combineNever
,
51 dupOf
->scope(), dupOf
->contentType(), ld::Atom::symbolTableIn
,
52 false, false, true, dupOf
->alignment()),
54 _fixup(0, ld::Fixup::k1of1
, ld::Fixup::kindNoneFollowOn
, ld::Fixup::bindingDirectlyBound
, replacement
) {
55 if ( dupOf
->autoHide() )
59 virtual const ld::File
* file() const { return _dedupOf
->file(); }
60 virtual const char* translationUnitSource() const
62 virtual const char* name() const { return _dedupOf
->name(); }
63 virtual uint64_t size() const { return 0; }
64 virtual uint64_t objectAddress() const { return 0; }
65 virtual void copyRawContent(uint8_t buffer
[]) const { }
66 virtual ld::Fixup::iterator
fixupsBegin() const { return &((ld::Fixup
*)&_fixup
)[0]; }
67 virtual ld::Fixup::iterator
fixupsEnd() const { return &((ld::Fixup
*)&_fixup
)[1]; }
70 const ld::Atom
* _dedupOf
;
76 typedef std::unordered_map
<const ld::Atom
*, unsigned long> CachedHashes
;
78 ld::Internal
* sState
= nullptr;
79 CachedHashes sSavedHashes
;
80 unsigned long sHashCount
= 0;
81 unsigned long sFixupCompareCount
= 0;
85 // A helper for std::unordered_map<> that hashes the instructions of a function
88 static unsigned long hash(const ld::Atom
* atom
) {
89 auto pos
= sSavedHashes
.find(atom
);
90 if ( pos
!= sSavedHashes
.end() )
93 const unsigned instructionBytes
= atom
->size();
94 const uint8_t* instructions
= atom
->rawContentPointer();
95 unsigned long hash
= instructionBytes
;
96 for (unsigned i
=0; i
< instructionBytes
; ++i
) {
97 hash
= (hash
* 33) + instructions
[i
];
99 for (ld::Fixup::iterator fit
= atom
->fixupsBegin(), end
=atom
->fixupsEnd(); fit
!= end
; ++fit
) {
100 const Atom
* target
= NULL
;
101 switch ( fit
->binding
) {
102 case ld::Fixup::bindingDirectlyBound
:
103 target
= fit
->u
.target
;
105 case ld::Fixup::bindingsIndirectlyBound
:
106 target
= sState
->indirectBindingTable
[fit
->u
.bindingIndex
];
111 // don't include calls to auto-hide functions in hash because they might be de-dup'ed
112 switch ( fit
->kind
) {
113 #if SUPPORT_ARCH_arm64
114 case ld::Fixup::kindStoreTargetAddressARM64Branch26
:
116 case ld::Fixup::kindStoreTargetAddressX86BranchPCRel32
:
117 if ( target
&& target
->autoHide() )
118 continue; // don't include
123 if ( target
!= NULL
) {
124 const char* name
= target
->name();
125 if ( target
->contentType() == ld::Atom::typeCString
)
126 name
= (const char*)target
->rawContentPointer();
127 for (const char* s
= name
; *s
!= '\0'; ++s
)
128 hash
= (hash
* 33) + *s
;
132 sSavedHashes
[atom
] = hash
;
136 unsigned long operator()(const ld::Atom
* atom
) const {
142 // A helper for std::unordered_map<> that compares functions
147 const Atom
* inCallChain1
;
148 const Atom
* inCallChain2
;
150 bool inCallChain(const Atom
* target
) {
151 for (BackChain
* p
= this; p
->prev
!= NULL
; p
= p
->prev
) {
152 if ( (p
->inCallChain1
== target
) || (p
->inCallChain2
== target
) )
159 static bool sameFixups(const ld::Atom
* atom1
, const ld::Atom
* atom2
, BackChain
& backChain
) {
160 ++sFixupCompareCount
;
161 //fprintf(stderr, "sameFixups(%s,%s)\n", atom1->name(), atom2->name());
162 Fixup::iterator f1
= atom1
->fixupsBegin();
163 Fixup::iterator end1
= atom1
->fixupsEnd();
164 Fixup::iterator f2
= atom2
->fixupsBegin();
165 Fixup::iterator end2
= atom2
->fixupsEnd();
166 // two atoms must have same number of fixups
167 if ( (end1
- f1
) != (end2
- f2
) )
169 // if no fixups, fixups are equal
172 // all fixups must be the same
174 if ( f1
->offsetInAtom
!= f2
->offsetInAtom
)
176 if ( f1
->kind
!= f2
->kind
)
178 if ( f1
->clusterSize
!= f2
->clusterSize
)
180 if ( f1
->binding
!= f2
->binding
)
182 const Atom
* target1
= NULL
;
183 const Atom
* target2
= NULL
;
184 switch ( f1
->binding
) {
185 case ld::Fixup::bindingDirectlyBound
:
186 target1
= f1
->u
.target
;
187 target2
= f2
->u
.target
;
189 case ld::Fixup::bindingsIndirectlyBound
:
190 target1
= sState
->indirectBindingTable
[f1
->u
.bindingIndex
];
191 target2
= sState
->indirectBindingTable
[f2
->u
.bindingIndex
];
193 case ld::Fixup::bindingNone
:
198 if ( target1
!= target2
) {
199 // targets must match unless they are both calls to functions that will de-dup together
200 #if SUPPORT_ARCH_arm64
201 if ( (f1
->kind
!= ld::Fixup::kindStoreTargetAddressARM64Branch26
) && (f1
->kind
!= ld::Fixup::kindStoreTargetAddressX86BranchPCRel32
) )
203 if ( f1
->kind
!= ld::Fixup::kindStoreTargetAddressX86BranchPCRel32
)
206 if ( target1
->section().type() != target2
->section().type() )
208 if ( target1
->section().type() != ld::Section::typeCode
)
210 // to support co-recursive functions, don't recurse into equals() for targets already in the back chain
211 if ( !backChain
.inCallChain(target1
) || !backChain
.inCallChain(target2
) ) {
212 BackChain nextBackChain
;
213 nextBackChain
.prev
= &backChain
;
214 nextBackChain
.inCallChain1
= target1
;
215 nextBackChain
.inCallChain2
= target2
;
216 if ( !equal(target1
, target2
, nextBackChain
) )
223 } while (f1
!= end1
);
228 static bool equal(const ld::Atom
* atom1
, const ld::Atom
* atom2
, BackChain
& backChain
) {
229 if ( atom1
->size() != atom2
->size() )
231 if ( atom_hashing::hash(atom1
) != atom_hashing::hash(atom2
) )
233 if ( memcmp(atom1
->rawContentPointer(), atom2
->rawContentPointer(), atom1
->size()) != 0 )
235 bool result
= sameFixups(atom1
, atom2
, backChain
);
236 //fprintf(stderr, "sameFixups(%s,%s) = %d\n", atom1->name(), atom2->name(), result);
240 bool operator()(const ld::Atom
* atom1
, const ld::Atom
* atom2
) const {
241 BackChain backChain
= { NULL
, atom1
, atom2
};
242 return equal(atom1
, atom2
, backChain
);
248 void doPass(const Options
& opts
, ld::Internal
& state
)
250 const bool log
= false;
252 // only de-duplicate in final linked images
253 if ( opts
.outputKind() == Options::kObjectFile
)
256 // only de-duplicate for architectures that use relocations that don't store bits in instructions
257 if ( (opts
.architecture() != CPU_TYPE_ARM64
) && (opts
.architecture() != CPU_TYPE_X86_64
) )
260 // support -no_deduplicate to suppress this pass
261 if ( ! opts
.deduplicateFunctions() )
264 const bool verbose
= opts
.verboseDeduplicate();
266 // find __text section
267 ld::Internal::FinalSection
* textSection
= NULL
;
268 for (ld::Internal::FinalSection
* sect
: state
.sections
) {
269 if ( (sect
->type() == ld::Section::typeCode
) && (strcmp(sect
->sectionName(), "__text") == 0) ) {
274 if ( textSection
== NULL
)
277 // build map of auto-hide functions and their duplicates
278 // the key for the map is always the first element in the value vector
279 // the key is always earlier in the atoms list then matching other atoms
281 std::unordered_map
<const ld::Atom
*, std::vector
<const ld::Atom
*>, atom_hashing
, atom_equal
> map
;
282 std::unordered_set
<const ld::Atom
*> masterAtoms
;
283 for (const ld::Atom
* atom
: textSection
->atoms
) {
284 // ignore empty (alias) atoms
285 if ( atom
->size() == 0 )
287 if ( atom
->autoHide() )
288 map
[atom
].push_back(atom
);
292 for (auto& entry
: map
) {
293 if ( entry
.second
.size() > 1 ) {
294 printf("Found following matching functions:\n");
295 for (const ld::Atom
* atom
: entry
.second
) {
296 printf(" %p %s\n", atom
, atom
->name());
300 fprintf(stderr
, "duplicate sets count:\n");
301 for (auto& entry
: map
)
302 fprintf(stderr
, " %p -> %lu\n", entry
.first
, entry
.second
.size());
305 // construct alias atoms to replace atoms found to be duplicates
306 unsigned atomsBeingComparedCount
= 0;
307 uint64_t dedupSavings
= 0;
308 std::vector
<const ld::Atom
*>& textAtoms
= textSection
->atoms
;
309 std::unordered_map
<const ld::Atom
*, const ld::Atom
*> replacementMap
;
310 for (auto& entry
: map
) {
311 const ld::Atom
* masterAtom
= entry
.first
;
312 std::vector
<const ld::Atom
*>& dups
= entry
.second
;
313 atomsBeingComparedCount
+= dups
.size();
314 if ( dups
.size() == 1 )
317 dedupSavings
+= ((dups
.size() - 1) * masterAtom
->size());
318 fprintf(stderr
, "deduplicate the following %lu functions (%llu bytes apiece):\n", dups
.size(), masterAtom
->size());
320 for (const ld::Atom
* dupAtom
: dups
) {
322 fprintf(stderr
, " %s\n", dupAtom
->name());
323 if ( dupAtom
== masterAtom
)
325 const ld::Atom
* aliasAtom
= new DeDupAliasAtom(dupAtom
, masterAtom
);
326 auto pos
= std::find(textAtoms
.begin(), textAtoms
.end(), masterAtom
);
327 if ( pos
!= textAtoms
.end() ) {
328 textAtoms
.insert(pos
, aliasAtom
);
329 state
.atomToSection
[aliasAtom
] = textSection
;
330 replacementMap
[dupAtom
] = aliasAtom
;
331 (const_cast<ld::Atom
*>(dupAtom
))->setCoalescedAway();
336 fprintf(stderr
, "deduplication saved %llu bytes of __text\n", dedupSavings
);
340 fprintf(stderr
, "replacement map:\n");
341 for (auto& entry
: replacementMap
)
342 fprintf(stderr
, " %p -> %p\n", entry
.first
, entry
.second
);
345 // walk all atoms and replace references to dups with references to alias
346 for (ld::Internal::FinalSection
* sect
: state
.sections
) {
347 for (const ld::Atom
* atom
: sect
->atoms
) {
348 for (ld::Fixup::iterator fit
= atom
->fixupsBegin(), end
=atom
->fixupsEnd(); fit
!= end
; ++fit
) {
349 std::unordered_map
<const ld::Atom
*, const ld::Atom
*>::iterator pos
;
350 switch ( fit
->binding
) {
351 case ld::Fixup::bindingsIndirectlyBound
:
352 pos
= replacementMap
.find(state
.indirectBindingTable
[fit
->u
.bindingIndex
]);
353 if ( pos
!= replacementMap
.end() )
354 state
.indirectBindingTable
[fit
->u
.bindingIndex
] = pos
->second
;
356 case ld::Fixup::bindingDirectlyBound
:
357 pos
= replacementMap
.find(fit
->u
.target
);
358 if ( pos
!= replacementMap
.end() )
359 fit
->u
.target
= pos
->second
;
369 fprintf(stderr
, "atoms before pruning:\n");
370 for (const ld::Atom
* atom
: textSection
->atoms
)
371 fprintf(stderr
, " %p (size=%llu) %s\n", atom
, atom
->size(), atom
->name());
373 // remove replaced atoms from section
374 textSection
->atoms
.erase(std::remove_if(textSection
->atoms
.begin(), textSection
->atoms
.end(),
375 [&](const ld::Atom
* atom
) {
376 return (replacementMap
.count(atom
) != 0);
378 textSection
->atoms
.end());
380 for (auto& entry
: replacementMap
)
381 state
.atomToSection
.erase(entry
.first
);
384 fprintf(stderr
, "atoms after pruning:\n");
385 for (const ld::Atom
* atom
: textSection
->atoms
)
386 fprintf(stderr
, " %p (size=%llu) %s\n", atom
, atom
->size(), atom
->name());
389 //fprintf(stderr, "hash-count=%lu, fixup-compares=%lu, atom-count=%u\n", sHashCount, sFixupCompareCount, atomsBeingComparedCount);
394 } // namespace passes