git.saurik.com Git - apple/ld64.git/blob - src/ld/parsers/macho_relocatable

1 /* -*- mode: C++; c-basic-offset: 4; tab-width: 4 -*-

2 *

4 *

5 * @APPLE_LICENSE_HEADER_START@

6 *

7 * This file contains Original Code and/or Modifications of Original Code

8 * as defined in and that are subject to the Apple Public Source License

9 * Version 2.0 (the 'License'). You may not use this file except in

10 * compliance with the License. Please obtain a copy of the License at

11 * http://www.opensource.apple.com/apsl/ and read it before using this

12 * file.

13 *

14 * The Original Code and all software distributed under the License are

15 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER

16 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,

17 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,

18 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.

19 * Please see the License for the specific language governing rights and

20 * limitations under the License.

21 *

22 * @APPLE_LICENSE_HEADER_END@

23 */

26 #include <stdint.h>

27 #include <stdlib.h>

28 #include <math.h>

29 #include <unistd.h>

30 #include <fcntl.h>

31 #include <sys/param.h>

32 #include <sys/stat.h>

33 #include <sys/mman.h>

35 #include "MachOFileAbstraction.hpp"

37 #include "libunwind/DwarfInstructions.hpp"

38 #include "libunwind/AddressSpace.hpp"

39 #include "libunwind/Registers.hpp"

41 #include <vector>

42 #include <set>

43 #include <map>

44 #include <algorithm>

45 #include <type_traits>

47 #include "dwarf2.h"

48 #include "debugline.h"

50 #include "Architectures.hpp"

51 #include "Bitcode.hpp"

52 #include "ld.hpp"

53 #include "macho_relocatable_file.h"

 // Error-reporting helper defined outside this file.  Declared noreturn, and
 // the format attribute lets the compiler check the printf-style arguments
 // (format string is argument 1, variadic arguments start at 2).
 extern void throwf(const char* format, ...) __attribute__ ((noreturn,format(printf, 1, 2)));

 // Diagnostic helper defined outside this file.  Same printf-style argument
 // checking as throwf, but it is not declared noreturn.
 extern void warning(const char* format, ...) __attribute__((format(printf, 1, 2)));

60 namespace mach_o {

61 namespace relocatable {

// forward declarations of class templates that are referenced before they are defined

 // Parser<A> and Atom<A> are named by the classes below (as friends, as
 // parameter types and as pointer members) before any definition is visible.
 template <typename A> class Parser;

 template <typename A> class Atom;

 // Section<A>, CFISection<A> and CUSection<A> are named as friends of File<A>
 // or as member types before their own definitions appear.
 template <typename A> class Section;

 template <typename A> class CFISection;

 template <typename A> class CUSection;

71 template <typename A>

 class File : public ld::relocatable::File

73 {

74 public:

                                                                                         File(const char* p, time_t mTime, const uint8_t* content, ld::File::Ordinal ord) :

                                                                                                 ld::relocatable::File(p,mTime,ord), _fileContent(content),

                                                                                                 _sectionsArray(NULL), _atomsArray(NULL),

                                                                                                 _sectionsArrayCount(0), _atomsArrayCount(0), _aliasAtomsArrayCount(0),

                                                                                                 _debugInfoKind(ld::relocatable::File::kDebugInfoNone),

80 _dwarfTranslationUnitPath(NULL),

                                                                                                 _dwarfDebugInfoSect(NULL), _dwarfDebugAbbrevSect(NULL), 

                                                                                                 _dwarfDebugLineSect(NULL), _dwarfDebugStringSect(NULL), 

83 _hasObjC(false),

84 _swiftVersion(0),

85 _cpuSubType(0),

86 _minOSVersion(0),

87 _canScatterAtoms(false),

88 _hasllvmProfiling(false),

89 _objcHasCategoryClassPropertiesField(false),

90 _srcKind(kSourceUnknown) { }

91 virtual ~File();

93 // overrides of ld::File

         virtual bool                                                                            forEachAtom(ld::File::AtomHandler&) const;

         virtual bool                                                                            justInTimeforEachAtom(const char* name, ld::File::AtomHandler&) const

96 { return false; }

         virtual const ld::VersionSet&                                           platforms()     const                   { return _platforms; }

99 // overrides of ld::relocatable::File

         virtual bool                                                                            hasObjC() const                                 { return _hasObjC; }

         virtual bool                                                                            objcHasCategoryClassPropertiesField() const 

102 { return _objcHasCategoryClassPropertiesField; }

         virtual uint32_t                                                                        cpuSubType() const                              { return _cpuSubType; }

         virtual DebugInfoKind                                                           debugInfo() const                               { return _debugInfoKind; }

         virtual const std::vector<ld::relocatable::File::Stab>* stabs() const                           { return &_stabs; }

         virtual bool                                                                            canScatterAtoms() const                 { return _canScatterAtoms; }

         virtual bool                                                                            hasllvmProfiling() const        { return _hasllvmProfiling; }

         virtual const char*                                                                     translationUnitSource() const;

         virtual LinkerOptionsList*                                                      linkerOptions() const                   { return &_linkerOptions; }

         virtual const ToolVersionList&                                          toolVersions() const                    { return _toolVersions; }

         virtual uint8_t                                                                         swiftVersion() const                    { return _swiftVersion; }

         virtual ld::Bitcode*                                                            getBitcode() const                              { return _bitcode.get(); }

         virtual SourceKind                                                                      sourceKind() const                              { return _srcKind; }

114

         virtual const uint8_t*                                                          fileContent() const                             { return _fileContent; }

         virtual const std::vector<AstTimeAndPath>*                      astFiles() const                                { return &_astFiles; }

117

         void                                                                                    setHasllvmProfiling()                   { _hasllvmProfiling = true; }

119 private:

120 friend class Atom<A>;

121 friend class Section<A>;

122 friend class Parser<A>;

123 friend class CFISection<A>::OAS;

124

125 typedef typename A::P P;

126

127 const uint8_t* _fileContent;

128 Section<A>** _sectionsArray;

129 uint8_t* _atomsArray;

130 uint8_t* _aliasAtomsArray;

131 uint32_t _sectionsArrayCount;

132 uint32_t _atomsArrayCount;

133 uint32_t _aliasAtomsArrayCount;

         std::vector<ld::Fixup>                                  _fixups;

         std::vector<ld::Atom::UnwindInfo>               _unwindInfos;

         std::vector<ld::Atom::LineInfo>                 _lineInfos;

         std::vector<ld::relocatable::File::Stab>_stabs;

         std::vector<AstTimeAndPath>                             _astFiles;

         ld::relocatable::File::DebugInfoKind    _debugInfoKind;

140 const char* _dwarfTranslationUnitPath;

141 const macho_section* _dwarfDebugInfoSect;

142 const macho_section* _dwarfDebugAbbrevSect;

143 const macho_section* _dwarfDebugLineSect;

144 const macho_section* _dwarfDebugStringSect;

145 bool _hasObjC;

146 uint8_t _swiftVersion;

147 uint32_t _cpuSubType;

148 uint32_t _minOSVersion;

149 ld::VersionSet _platforms;

150 bool _canScatterAtoms;

151 bool _hasllvmProfiling;

152 bool _objcHasCategoryClassPropertiesField;

         std::vector<std::vector<const char*> >  _linkerOptions;

         std::unique_ptr<ld::Bitcode>                    _bitcode;

155 SourceKind _srcKind;

156 ToolVersionList _toolVersions;

157 };

158

159

160 template <typename A>

 class Section : public ld::Section

162 {

163 public:

         typedef typename A::P::uint_t   pint_t;

165 typedef typename A::P P;

         typedef typename A::P::E                E;

167

168 virtual ~Section() { }

         class File<A>&                                  file() const                            { return _file; }

         const macho_section<P>*                 machoSection() const            { return _machOSection; }

         uint32_t                                                sectionNum(class Parser<A>&) const;

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr);

         virtual ld::Atom::ContentType   contentType()                           { return ld::Atom::typeUnclassified; }

         virtual bool                                    dontDeadStrip()                         { return (this->_machOSection->flags() & S_ATTR_NO_DEAD_STRIP); }

         virtual bool                                    dontDeadStripIfReferencesLive() { return ( (this->_machOSection != NULL) && (this->_machOSection->flags() & S_ATTR_LIVE_SUPPORT) );  }

         virtual Atom<A>*                                findAtomByAddress(pint_t addr) { return this->findContentAtomByAddress(addr, this->_beginAtoms, this->_endAtoms); }

         virtual bool                                    addFollowOnFixups() const       { return ! _file.canScatterAtoms(); }

         virtual uint32_t                                appendAtoms(class Parser<A>& parser, uint8_t* buffer, 

                                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, 

                                                                                                 const struct Parser<A>::CFI_CU_InfoArrays&) = 0;

         virtual uint32_t                                computeAtomCount(class Parser<A>& parser, 

                                                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, 

                                                                                                                 const struct Parser<A>::CFI_CU_InfoArrays&) = 0;

         virtual void                                    makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual bool                                    addRelocFixup(class Parser<A>& parser, const macho_relocation_info<P>*);

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const { return 0; }

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const { return false; }

         virtual bool                                    ignoreLabel(const char* label) const { return false; }

         static const char*                              makeSectionName(const macho_section<typename A::P>* s);

191

192 protected:

                                                 Section(File<A>& f, const macho_section<typename A::P>* s)

                                                         : ld::Section(makeSegmentName(s), makeSectionName(s), sectionType(s)),

                                                                 _file(f), _machOSection(s), _beginAtoms(NULL), _endAtoms(NULL), _hasAliases(false) { }

                                                 Section(File<A>& f, const char* segName, const char* sectName, ld::Section::Type t, bool hidden=false)

                                                         : ld::Section(segName, sectName, t, hidden), _file(f), _machOSection(NULL), 

                                                                 _beginAtoms(NULL), _endAtoms(NULL), _hasAliases(false) { }

199

200

         Atom<A>*                                                findContentAtomByAddress(pint_t addr, class Atom<A>* start, class Atom<A>* end);

         uint32_t                                                x86_64PcRelOffset(uint8_t r_type);

         void                                                    addLOH(class Parser<A>& parser, int kind, int count, const uint64_t addrs[]);

         static const char*                              makeSegmentName(const macho_section<typename A::P>* s);

         static bool                                             readable(const macho_section<typename A::P>* s);

         static bool                                             writable(const macho_section<typename A::P>* s);

         static bool                                             exectuable(const macho_section<typename A::P>* s);

         static ld::Section::Type                sectionType(const macho_section<typename A::P>* s);

209

210 File<A>& _file;

211 const macho_section* _machOSection;

212 class Atom<A>* _beginAtoms;

213 class Atom<A>* _endAtoms;

214 bool _hasAliases;

         std::set<const class Atom<A>*>  _altEntries;

216 };

217

218

219 template <typename A>

 class CFISection : public Section<A>

221 {

222 public:

                                                 CFISection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : Section<A>(f, s) { }

         uint32_t                        cfiCount(Parser<A>& parser);

226

         virtual ld::Atom::ContentType   contentType()           { return ld::Atom::typeCFI; }

         virtual uint32_t        computeAtomCount(class Parser<A>& parser, struct Parser<A>::LabelAndCFIBreakIterator& it, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual uint32_t        appendAtoms(class Parser<A>& parser, uint8_t* buffer, struct Parser<A>::LabelAndCFIBreakIterator& it, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual void            makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual bool            addFollowOnFixups() const       { return false; }

232

233

234 ///

235 /// ObjectFileAddressSpace is used as a template parameter to UnwindCursor for parsing

236 /// dwarf CFI information in an object file.

237 ///

238 class OAS

239 {

240 public:

                         typedef typename A::P::uint_t   pint_t;

242 typedef typename A::P P;

                         typedef typename A::P::E                E;

                         typedef typename A::P::uint_t   sint_t;

245

                                                         OAS(CFISection<A>& ehFrameSection, const uint8_t* ehFrameBuffer) : 

247 _ehFrameSection(ehFrameSection),

248 _ehFrameContent(ehFrameBuffer),

                                                                 _ehFrameStartAddr(ehFrameSection.machoSection()->addr()), 

                                                                 _ehFrameEndAddr(ehFrameSection.machoSection()->addr()+ehFrameSection.machoSection()->size()) {}

251

                         uint8_t                 get8(pint_t addr) { return *((uint8_t*)mappedAddress(addr)); }

                         uint16_t                get16(pint_t addr)      { return E::get16(*((uint16_t*)mappedAddress(addr))); }

                         uint32_t                get32(pint_t addr)      { return E::get32(*((uint32_t*)mappedAddress(addr))); }

                         uint64_t                get64(pint_t addr)      { return E::get64(*((uint64_t*)mappedAddress(addr))); }

                         pint_t                  getP(pint_t addr)       { return P::getP(*((pint_t*)mappedAddress(addr))); }

                         uint64_t                getULEB128(pint_t& addr, pint_t end);

                         int64_t                 getSLEB128(pint_t& addr, pint_t end);

                         pint_t                  getEncodedP(pint_t& addr, pint_t end, uint8_t encoding);

260 private:

                 const void*                     mappedAddress(pint_t addr);

262

263 CFISection<A>& _ehFrameSection;

264 const uint8_t* _ehFrameContent;

265 pint_t _ehFrameStartAddr;

266 pint_t _ehFrameEndAddr;

267 };

268

269

         typedef typename A::P::uint_t                   pint_t;

         typedef libunwind::CFI_Atom_Info<OAS>   CFI_Atom_Info;

272

         void                            cfiParse(class Parser<A>& parser, uint8_t* buffer, CFI_Atom_Info cfiArray[], uint32_t& cfiCount, const pint_t cuStarts[], uint32_t cuCount);

274 bool needsRelocating();

275

276 static bool bigEndian();

277 private:

         void                            addCiePersonalityFixups(class Parser<A>& parser, const CFI_Atom_Info* cieInfo);

         static void                     warnFunc(void* ref, uint64_t funcAddr, const char* msg);

280 };

281

282

283 template <typename A>

 class CUSection : public Section<A>

285 {

286 public:

                                                 CUSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : Section<A>(f, s) { }

289

         typedef typename A::P::uint_t   pint_t;

291 typedef typename A::P P;

         typedef typename A::P::E                E;

293

         virtual uint32_t                computeAtomCount(class Parser<A>& parser, struct Parser<A>::LabelAndCFIBreakIterator& it, const struct Parser<A>::CFI_CU_InfoArrays&) { return 0; }

         virtual uint32_t                appendAtoms(class Parser<A>& parser, uint8_t* buffer, struct Parser<A>::LabelAndCFIBreakIterator& it, const struct Parser<A>::CFI_CU_InfoArrays&) { return 0; }

         virtual void                    makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual bool                    addFollowOnFixups() const       { return false; }

298

299 struct Info {

300 pint_t functionStartAddress;

301 uint32_t functionSymbolIndex;

302 uint32_t rangeLength;

303 uint32_t compactUnwindInfo;

304 const char* personality;

305 pint_t lsdaAddress;

306 Atom<A>* function;

307 Atom<A>* lsda;

308 };

309

310 uint32_t count();

         void                                    parse(class Parser<A>& parser, uint32_t cnt, Info array[]);

312 static bool encodingMeansUseDwarf(compact_unwind_encoding_t enc);

313

314

315 private:

316

         const char*                             personalityName(class Parser<A>& parser, const macho_relocation_info<P>* reloc);

318

         static int                              infoSorter(const void* l, const void* r);

320

321 };

322

323

324 template <typename A>

 class TentativeDefinitionSection : public Section<A>

326 {

327 public:

                                                 TentativeDefinitionSection(Parser<A>& parser, File<A>& f)

                                                         : Section<A>(f, "__DATA", "__comm/tent", ld::Section::typeTentativeDefs)  {}

330

         virtual ld::Atom::ContentType   contentType()           { return ld::Atom::typeZeroFill; }

         virtual bool            addFollowOnFixups() const       { return false; }

         virtual Atom<A>*        findAtomByAddress(typename A::P::uint_t addr) { throw "TentativeDefinitionSection::findAtomByAddress() should never be called"; }

         virtual uint32_t        computeAtomCount(class Parser<A>& parser, struct Parser<A>::LabelAndCFIBreakIterator& it, 

335 const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual uint32_t        appendAtoms(class Parser<A>& parser, uint8_t* buffer, 

                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, 

338 const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual void            makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&) {}

340 private:

         typedef typename A::P::uint_t   pint_t;

342 typedef typename A::P P;

343 };

344

345

346 template <typename A>

 class AbsoluteSymbolSection : public Section<A>

348 {

349 public:

                                                 AbsoluteSymbolSection(Parser<A>& parser, File<A>& f)

                                                         : Section<A>(f, "__DATA", "__abs", ld::Section::typeAbsoluteSymbols, true)  {}

352

         virtual ld::Atom::ContentType   contentType()           { return ld::Atom::typeUnclassified; }

         virtual bool                                    dontDeadStrip()         { return false; }

         virtual ld::Atom::Alignment             alignmentForAddress(typename A::P::uint_t addr) { return ld::Atom::Alignment(0); }

         virtual bool            addFollowOnFixups() const       { return false; }

         virtual Atom<A>*        findAtomByAddress(typename A::P::uint_t addr) { throw "AbsoluteSymbolSection::findAtomByAddress() should never be called"; }

         virtual uint32_t        computeAtomCount(class Parser<A>& parser, struct Parser<A>::LabelAndCFIBreakIterator& it, 

359 const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual uint32_t        appendAtoms(class Parser<A>& parser, uint8_t* buffer, 

                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, 

362 const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual void            makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&) {}

         virtual Atom<A>*        findAbsAtomForValue(typename A::P::uint_t);

365

366 private:

         typedef typename A::P::uint_t   pint_t;

368 typedef typename A::P P;

369 };

370

371

372 template <typename A>

 class SymboledSection : public Section<A>

374 {

375 public:

                                                 SymboledSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s);

         virtual ld::Atom::ContentType   contentType() { return _type; }

378 virtual bool dontDeadStrip();

         virtual uint32_t        computeAtomCount(class Parser<A>& parser, struct Parser<A>::LabelAndCFIBreakIterator& it, 

380 const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual uint32_t        appendAtoms(class Parser<A>& parser, uint8_t* buffer, 

                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it, 

383 const struct Parser<A>::CFI_CU_InfoArrays&);

384 protected:

         typedef typename A::P::uint_t   pint_t;

386 typedef typename A::P P;

387

         ld::Atom::ContentType                   _type;

389 };

390

391

392 template <typename A>

 class TLVDefsSection : public SymboledSection<A>

394 {

395 public:

                                                 TLVDefsSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s) :

                                                         SymboledSection<A>(parser, f, s) { }

398

         typedef typename A::P::uint_t   pint_t;

400

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(log2(sizeof(pint_t))); }

403 private:

405 };

408 template <typename A>

 class ImplicitSizeSection : public Section<A>

410 {

411 public:

                                                 ImplicitSizeSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : Section<A>(f, s) { }

         virtual uint32_t        computeAtomCount(class Parser<A>& parser, struct Parser<A>::LabelAndCFIBreakIterator& it, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual uint32_t        appendAtoms(class Parser<A>& parser, uint8_t* buffer, struct Parser<A>::LabelAndCFIBreakIterator& it, const struct Parser<A>::CFI_CU_InfoArrays&);

416 protected:

         typedef typename A::P::uint_t   pint_t;

418 typedef typename A::P P;

419

         virtual bool                                            addFollowOnFixups() const               { return false; }

         virtual const char*                                     unlabeledAtomName(Parser<A>& parser, pint_t addr) = 0;

         virtual ld::Atom::SymbolTableInclusion  symbolTableInclusion();

         virtual pint_t                                          elementSizeAtAddress(pint_t addr) = 0;

         virtual ld::Atom::Scope                         scopeAtAddress(Parser<A>& parser, pint_t addr) { return ld::Atom::scopeLinkageUnit; }

         virtual bool                                            useElementAt(Parser<A>& parser, 

                                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, pint_t addr) = 0;

         virtual ld::Atom::Definition            definition()                                    { return ld::Atom::definitionRegular; }

         virtual ld::Atom::Combine                       combine(Parser<A>& parser, pint_t addr) = 0;

         virtual bool                                            ignoreLabel(const char* label) const { return (label[0] == 'L'); }

430 };

431

432

433 template <typename A>

 class FixedSizeSection : public ImplicitSizeSection<A>

435 {

436 public:

                                                 FixedSizeSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : ImplicitSizeSection<A>(parser, f, s) { }

439 protected:

         typedef typename A::P::uint_t   pint_t;

441 typedef typename A::P P;

         typedef typename A::P::E                E;

443

         virtual bool                                    useElementAt(Parser<A>& parser, 

                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, pint_t addr) 

446 { return true; }

447 };

448

449

450 template <typename A>

 class Literal4Section : public FixedSizeSection<A>

452 {

453 public:

                                                 Literal4Section(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

456 protected:

         typedef typename A::P::uint_t   pint_t;

458 typedef typename A::P P;

459

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(2); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "4-byte-literal"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return 4; }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndContent; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

         virtual bool                                    ignoreLabel(const char* label) const;

468 };

469

470 template <typename A>

 class Literal8Section : public FixedSizeSection<A>

472 {

473 public:

                                                 Literal8Section(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

476 protected:

         typedef typename A::P::uint_t   pint_t;

478 typedef typename A::P P;

479

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(3); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "8-byte-literal"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return 8; }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndContent; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

         virtual bool                                    ignoreLabel(const char* label) const;

488 };

489

490 template <typename A>

 class Literal16Section : public FixedSizeSection<A>

492 {

493 public:

                                                 Literal16Section(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

496 protected:

         typedef typename A::P::uint_t   pint_t;

498 typedef typename A::P P;

499

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(4); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "16-byte-literal"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return 16; }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndContent; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

         virtual bool                                    ignoreLabel(const char* label) const;

508 };

509

510

511 template <typename A>

 class NonLazyPointerSection : public FixedSizeSection<A>

513 {

514 public:

                                                 NonLazyPointerSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

517 protected:

         typedef typename A::P::uint_t   pint_t;

519 typedef typename A::P P;

520

         virtual void                                    makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual ld::Atom::ContentType   contentType()                                                   { return ld::Atom::typeNonLazyPointer; }

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(log2(sizeof(pint_t))); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "non_lazy_ptr"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return sizeof(pint_t); }

         virtual ld::Atom::Scope                 scopeAtAddress(Parser<A>& parser, pint_t addr);

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t);

         virtual bool                                    ignoreLabel(const char* label) const    { return true; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

532

533 private:

         static const char*                              targetName(const class Atom<A>* atom, const ld::IndirectBindingTable& ind);

         static ld::Fixup::Kind                  fixupKind();

536 };

537

538 template <typename A>

 class TLVPointerSection : public FixedSizeSection<A>

540 {

541 public:

                                                 TLVPointerSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

544 protected:

         typedef typename A::P::uint_t   pint_t;

546 typedef typename A::P P;

547

         virtual void                                    makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&);

         virtual ld::Atom::ContentType   contentType()                                                   { return ld::Atom::typeTLVPointer; }

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(log2(sizeof(pint_t))); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "tlv_lazy_ptr"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return sizeof(pint_t); }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t);

         virtual bool                                    ignoreLabel(const char* label) const    { return true; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

558

559 private:

         static const char*                              targetName(const class Atom<A>* atom, const ld::IndirectBindingTable& ind, bool* isStatic);

561 };

562

563

564 template <typename A>

 class CFStringSection : public FixedSizeSection<A>

566 {

567 public:

                                                 CFStringSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

570 protected:

         typedef typename A::P::uint_t   pint_t;

572

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(log2(sizeof(pint_t))); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "CFString"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return 4*sizeof(pint_t); }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndReferences; }

         virtual bool                                    ignoreLabel(const char* label) const    { return true; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

581 private:

         enum ContentType { contentUTF8, contentUTF16, contentUnknown };

         static const uint8_t*                   targetContent(const class Atom<A>* atom, const ld::IndirectBindingTable& ind,

                                                                                                 ContentType* ct, unsigned int* count);

585 };

586

587

588 template <typename A>

 class ObjC1ClassSection : public FixedSizeSection<A>

590 {

591 public:

                                                 ObjC1ClassSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

594 protected:

         typedef typename A::P::uint_t   pint_t;

596 typedef typename A::P P;

         typedef typename A::P::E                E;

598

         virtual ld::Atom::Scope                 scopeAtAddress(Parser<A>& , pint_t )    { return ld::Atom::scopeGlobal; }

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(2); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t);

         virtual ld::Atom::SymbolTableInclusion  symbolTableInclusion()                  { return ld::Atom::symbolTableIn; }

603 virtual pint_t elementSizeAtAddress(pint_t addr);

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineNever; }

         virtual bool                                    ignoreLabel(const char* label) const    { return true; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

607 { return 0; }

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const { return false; }

         virtual bool                                    addRelocFixup(class Parser<A>& parser, const macho_relocation_info<P>*);

611 };

612

613

614 template <typename A>

 class ObjC2ClassRefsSection : public FixedSizeSection<A>

616 {

617 public:

                                                 ObjC2ClassRefsSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

620 protected:

         typedef typename A::P::uint_t   pint_t;

622

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(log2(sizeof(pint_t))); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "objc-class-ref"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return sizeof(pint_t); }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndReferences; }

         virtual bool                                    ignoreLabel(const char* label) const    { return true; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

631 private:

         const char*                                             targetClassName(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

633 };

634

635

636 template <typename A>

 class ObjC2CategoryListSection : public FixedSizeSection<A>

638 {

639 public:

                                                 ObjC2CategoryListSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

642 protected:

         typedef typename A::P::uint_t   pint_t;

644

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(log2(sizeof(pint_t))); }

         virtual ld::Atom::Scope                 scopeAtAddress(Parser<A>& parser, pint_t addr) { return ld::Atom::scopeTranslationUnit; }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "objc-cat-list"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return sizeof(pint_t); }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineNever; }

         virtual bool                                    ignoreLabel(const char* label) const    { return true; }

651 private:

         const char*                                             targetClassName(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

653 };

654

655

656 template <typename A>

 class PointerToCStringSection : public FixedSizeSection<A>

658 {

659 public:

                                                 PointerToCStringSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : FixedSizeSection<A>(parser, f, s) {}

662 protected:

         typedef typename A::P::uint_t   pint_t;

664

         virtual ld::Atom::Alignment             alignmentForAddress(pint_t addr)                { return ld::Atom::Alignment(log2(sizeof(pint_t))); }

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "pointer-to-literal-cstring"; }

         virtual pint_t                                  elementSizeAtAddress(pint_t addr)               { return sizeof(pint_t); }

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndReferences; }

         virtual bool                                    ignoreLabel(const char* label) const    { return true; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

         virtual const char*                             targetCString(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

674 };

675

676

677 template <typename A>

 class Objc1ClassReferences : public PointerToCStringSection<A>

679 {

680 public:

                                                 Objc1ClassReferences(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : PointerToCStringSection<A>(parser, f, s) {}

683

         typedef typename A::P::uint_t   pint_t;

685 typedef typename A::P P;

686

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "pointer-to-literal-objc-class-name"; }

         virtual bool                                    addRelocFixup(class Parser<A>& parser, const macho_relocation_info<P>*);

         virtual const char*                             targetCString(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

690 };

691

692

693 template <typename A>

 class CStringSection : public ImplicitSizeSection<A>

695 {

696 public:

                                                 CStringSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : ImplicitSizeSection<A>(parser, f, s) {}

699 protected:

         typedef typename A::P::uint_t   pint_t;

701 typedef typename A::P P;

702

         virtual ld::Atom::ContentType   contentType()                                                   { return ld::Atom::typeCString; }

         virtual Atom<A>*                                findAtomByAddress(pint_t addr);

         virtual const char*                             unlabeledAtomName(Parser<A>&, pint_t)   { return "cstring"; }

706 virtual pint_t elementSizeAtAddress(pint_t addr);

         virtual bool                                    ignoreLabel(const char* label) const;

         virtual bool                                    useElementAt(Parser<A>& parser, 

                                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, pint_t addr);

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndContent; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

714

715 };

716

717

718 template <typename A>

 class UTF16StringSection : public SymboledSection<A>

720 {

721 public:

                                                 UTF16StringSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

                                                         : SymboledSection<A>(parser, f, s) {}

724 protected:

         typedef typename A::P::uint_t   pint_t;

726 typedef typename A::P P;

727

         virtual ld::Atom::Combine               combine(Parser<A>&, pint_t)                             { return ld::Atom::combineByNameAndContent; }

         virtual unsigned long                   contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const;

         virtual bool                                    canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const;

732 };

733

734

735 //

736 // Atoms in mach-o files

737 //

738 template <typename A>

 class Atom : public ld::Atom

740 {

741 public:

742 // overrides of ld::Atom

         virtual const ld::File*                                         file() const;

         virtual const char*                                                     translationUnitSource() const

                                                                                                                                         { return sect().file().translationUnitSource(); }

         virtual const char*                                                     name() const            { return _name; }

         virtual uint64_t                                                        size() const            { return _size; }

         virtual uint64_t                                                        objectAddress() const { return _objAddress; }

         virtual void                                                            copyRawContent(uint8_t buffer[]) const;

         virtual const uint8_t*                                          rawContentPointer() const { return contentPointer(); }

         virtual unsigned long                                           contentHash(const ld::IndirectBindingTable& ind) const 

                                                                                                                         { if ( _hash == 0 ) _hash = sect().contentHash(this, ind); return _hash; }

         virtual bool                                                            canCoalesceWith(const ld::Atom& rhs, const ld::IndirectBindingTable& ind) const 

                                                                                                                         { return sect().canCoalesceWith(this, rhs, ind); }

         virtual ld::Fixup::iterator                                     fixupsBegin() const     { return &machofile()._fixups[_fixupsStartIndex]; }

         virtual ld::Fixup::iterator                                     fixupsEnd()     const   { return &machofile()._fixups[_fixupsStartIndex+_fixupsCount]; }

         virtual ld::Atom::UnwindInfo::iterator          beginUnwind() const     { return &machofile()._unwindInfos[_unwindInfoStartIndex]; }

         virtual ld::Atom::UnwindInfo::iterator          endUnwind()     const   { return &machofile()._unwindInfos[_unwindInfoStartIndex+_unwindInfoCount];  }

         virtual ld::Atom::LineInfo::iterator            beginLineInfo() const{ return &machofile()._lineInfos[_lineInfoStartIndex]; }

         virtual ld::Atom::LineInfo::iterator            endLineInfo() const { return &machofile()._lineInfos[_lineInfoStartIndex+_lineInfoCount];  }

         virtual void                                                            setFile(const ld::File* f);

762

763 private:

764

         enum {  kFixupStartIndexBits = 32,

766 kLineInfoStartIndexBits = 32,

767 kUnwindInfoStartIndexBits = 24,

768 kFixupCountBits = 24,

769 kLineInfoCountBits = 12,

770 kUnwindInfoCountBits = 4

771 }; // must sum to 128

772

773 public:

774 // methods for all atoms from mach-o object file

                         Section<A>&                                                     sect() const                    { return (Section<A>&)section(); }

                         File<A>&                                                        machofile() const                       { return ((Section<A>*)(this->_section))->file(); }

                         void                                                            setFixupsRange(uint32_t s, uint32_t c);

                         void                                                            setUnwindInfoRange(uint32_t s, uint32_t c);

779 void extendUnwindInfoRange();

                         void                                                            setLineInfoRange(uint32_t s, uint32_t c);

                         bool                                                            roomForMoreLineInfoCount() { return (_lineInfoCount < ((1<<kLineInfoCountBits)-1)); }

                         void                                                            incrementLineInfoCount() { assert(roomForMoreLineInfoCount()); ++_lineInfoCount; }

                         void                                                            incrementFixupCount() { if (_fixupsCount == ((1 << kFixupCountBits)-1)) 

                                                                                                                                                         throwf("too may fixups in %s", name()); ++_fixupsCount; }

                         const uint8_t*                                          contentPointer() const;

                         uint32_t                                                        fixupCount() const { return _fixupsCount; }

                         void                                                            verifyAlignment(const macho_section<typename A::P>&) const;

788

789 typedef typename A::P P;

         typedef typename A::P::E                                        E;

         typedef typename A::P::uint_t                           pint_t;

792 // constuct via all attributes

                                                                                                 Atom(Section<A>& sct, const char* nm, pint_t addr, uint64_t sz, 

                                                                                                         ld::Atom::Definition d, ld::Atom::Combine c, ld::Atom::Scope s, 

                                                                                                         ld::Atom::ContentType ct, ld::Atom::SymbolTableInclusion i, 

                                                                                                         bool dds, bool thumb, bool al, ld::Atom::Alignment a) 

                                                                                                                 : ld::Atom((ld::Section&)sct, d, c, s, ct, i, dds, thumb, al, a), 

                                                                                                                         _size(sz), _objAddress(addr), _name(nm), _hash(0), 

                                                                                                                         _fixupsStartIndex(0), _lineInfoStartIndex(0),

                                                                                                                         _unwindInfoStartIndex(0), _fixupsCount(0),  

                                                                                                                         _lineInfoCount(0), _unwindInfoCount(0) { }

802 // construct via symbol table entry

                                                                                                 Atom(Section<A>& sct, Parser<A>& parser, const macho_nlist<P>& sym, 

                                                                                                                                 uint64_t sz, bool alias=false)

                                                                                                                 : ld::Atom((ld::Section&)sct, parser.definitionFromSymbol(sym), 

                                                                                                                                 parser.combineFromSymbol(sym), parser.scopeFromSymbol(sym),

                                                                                                                                 parser.resolverFromSymbol(sym) ? ld::Atom::typeResolver : sct.contentType(), 

808 parser.inclusionFromSymbol(sym),

                                                                                                                                 (parser.dontDeadStripFromSymbol(sym) && !sct.dontDeadStripIfReferencesLive()) || sct.dontDeadStrip(),

                                                                                                                                 parser.isThumbFromSymbol(sym), alias, 

                                                                                                                                 sct.alignmentForAddress(sym.n_value())),

                                                                                                                         _size(sz), _objAddress(sym.n_value()), 

                                                                                                                         _name(parser.nameFromSymbol(sym)), _hash(0), 

                                                                                                                         _fixupsStartIndex(0), _lineInfoStartIndex(0),

                                                                                                                         _unwindInfoStartIndex(0), _fixupsCount(0),  

                                                                                                                         _lineInfoCount(0), _unwindInfoCount(0) { 

817 // <rdar://problem/6783167> support auto-hidden weak symbols

                                                                                                                                 if ( _scope == ld::Atom::scopeGlobal && 

                                                                                                                                                 (sym.n_desc() & (N_WEAK_DEF|N_WEAK_REF)) == (N_WEAK_DEF|N_WEAK_REF) )

820 this->setAutoHide();

                                                                                                                                 this->verifyAlignment(*sct.machoSection());

                                                                                                                                 if ( sct.dontDeadStripIfReferencesLive() )

823 this->setDontDeadStripIfReferencesLive();

824 }

825

826 private:

827 friend class Parser<A>;

828 friend class Section<A>;

829 friend class CStringSection<A>;

830 friend class AbsoluteSymbolSection<A>;

831

832 pint_t _size;

833 pint_t _objAddress;

834 const char* _name;

835 mutable unsigned long _hash;

836

837 uint64_t _fixupsStartIndex : kFixupStartIndexBits,

838 _lineInfoStartIndex : kLineInfoStartIndexBits,

839 _unwindInfoStartIndex : kUnwindInfoStartIndexBits,

840 _fixupsCount : kFixupCountBits,

841 _lineInfoCount : kLineInfoCountBits,

842 _unwindInfoCount : kUnwindInfoCountBits;

843

         static std::map<const ld::Atom*, const ld::File*> _s_fileOverride;

845 };

846

847 template <typename A>

 std::map<const ld::Atom*, const ld::File*> Atom<A>::_s_fileOverride;

849

850 template <typename A>

 void Atom<A>::setFile(const ld::File* f) {

852 _s_fileOverride[this] = f;

853 }

854

855 template <typename A>

 const ld::File* Atom<A>::file() const

857 {

         std::map<const ld::Atom*, const ld::File*>::iterator pos = _s_fileOverride.find(this);

         if ( pos != _s_fileOverride.end() )

860 return pos->second;

861

         return &sect().file();

863 }

864

865 template <typename A>

 void Atom<A>::setFixupsRange(uint32_t startIndex, uint32_t count)

867 {

         if ( count >= (1 << kFixupCountBits) ) 

                 throwf("too many fixups in function %s", this->name());

         if ( startIndex >= (1 << kFixupStartIndexBits) ) 

871 throwf("too many fixups in file");

         assert(((startIndex+count) <= sect().file()._fixups.size()) && "fixup index out of range");

873 _fixupsStartIndex = startIndex;

874 _fixupsCount = count;

875 }

876

877 template <typename A>

 void Atom<A>::setUnwindInfoRange(uint32_t startIndex, uint32_t count)

879 {

         if ( count >= (1 << kUnwindInfoCountBits) ) 

                 throwf("too many compact unwind infos in function %s", this->name());

         if ( startIndex >= (1 << kUnwindInfoStartIndexBits) ) 

                 throwf("too many compact unwind infos (%d) in file", startIndex);

         assert((startIndex+count) <= sect().file()._unwindInfos.size() && "unwindinfo index out of range");

885 _unwindInfoStartIndex = startIndex;

886 _unwindInfoCount = count;

887 }

888

889 template <typename A>

 void Atom<A>::extendUnwindInfoRange()

891 {

         if ( _unwindInfoCount+1 >= (1 << kUnwindInfoCountBits) ) 

                 throwf("too many compact unwind infos in function %s", this->name());

894 _unwindInfoCount += 1;

895 }

896

897 template <typename A>

 void Atom<A>::setLineInfoRange(uint32_t startIndex, uint32_t count)

899 {

         assert((count < (1 << kLineInfoCountBits)) && "too many line infos");

         assert((startIndex+count) < sect().file()._lineInfos.size() && "line info index out of range");

902 _lineInfoStartIndex = startIndex;

903 _lineInfoCount = count;

904 }

905

906 template <typename A>

 const uint8_t* Atom<A>::contentPointer() const

908 {

         const macho_section<P>* sct = this->sect().machoSection();

         if ( this->_objAddress > sct->addr() + sct->size() )

                 throwf("malformed .o file, symbol has address 0x%0llX which is outside range of its section", (uint64_t)this->_objAddress);

         uint32_t fileOffset = sct->offset() - sct->addr() + this->_objAddress;

         return this->sect().file().fileContent()+fileOffset;

914 }

915

916

917 template <typename A>

 void Atom<A>::copyRawContent(uint8_t buffer[]) const

919 {

920 // copy base bytes

         if ( this->contentType() == ld::Atom::typeZeroFill ) {

922 bzero(buffer, _size);

923 }

         else if ( _size != 0 ) {

                 memcpy(buffer, this->contentPointer(), _size);

926 }

927 }

928

929 template <>

 void Atom<arm>::verifyAlignment(const macho_section<P>&) const

931 {

         if ( (this->section().type() == ld::Section::typeCode) && ! isThumb() ) {

                 if ( ((_objAddress % 4) != 0) || (this->alignment().powerOf2 < 2) )

                         warning("ARM function not 4-byte aligned: %s from %s", this->name(), this->file()->path());

935 }

936 }

937

#if SUPPORT_ARCH_arm64
// arm64 specialization: for atoms in a non-empty code section, warns when
// the atom is not 4-byte aligned, either by address or by declared alignment.
template <>
void Atom<arm64>::verifyAlignment(const macho_section<P>& sect) const
{
	// only code in a non-empty section is checked
	if ( this->section().type() != ld::Section::typeCode )
		return;
	if ( sect.size() == 0 )
		return;

	if ( ((_objAddress % 4) == 0) && (this->alignment().powerOf2 >= 2) )
		return;

	warning("arm64 function not 4-byte aligned: %s from %s", this->name(), this->file()->path());
}
#endif

948

949

950 template <typename A>

 void Atom<A>::verifyAlignment(const macho_section<P>&) const

952 {

953 }

954

955

 class AliasAtom : public ld::Atom

957 {

958 public:

                                                                                 AliasAtom(const char* name, bool hidden, const ld::File* file, const char* aliasOfName) : 

                                                                                         ld::Atom(_s_section, ld::Atom::definitionRegular, ld::Atom::combineNever,

                                                                                                         (hidden ? ld::Atom::scopeLinkageUnit : ld::Atom::scopeGlobal), 

                                                                                                         ld::Atom::typeUnclassified, ld::Atom::symbolTableIn, 

                                                                                                         false, false, true, 0),

964 _file(file),

965 _name(name),

                                                                                         _fixup(0, ld::Fixup::k1of1, ld::Fixup::kindNoneFollowOn, ld::Fixup::bindingByNameUnbound, aliasOfName) { }

967

         virtual const ld::File*                         file() const            { return _file; }

         virtual const char*                                     translationUnitSource() const

970 { return NULL; }

         virtual const char*                                     name() const            { return _name; }

         virtual uint64_t                                        size() const            { return 0; }

         virtual uint64_t                                        objectAddress() const { return 0; }

         virtual void                                            copyRawContent(uint8_t buffer[]) const { }

         virtual ld::Fixup::iterator                     fixupsBegin() const     { return &((ld::Fixup*)&_fixup)[0]; }

         virtual ld::Fixup::iterator                     fixupsEnd()     const   { return &((ld::Fixup*)&_fixup)[1]; }

977

978 private:

979 static ld::Section _s_section;

980

         const ld::File*                                         _file;

982 const char* _name;

983 ld::Fixup _fixup;

984 };

985

 // Definition of the static section object that every AliasAtom passes to the
 // ld::Atom constructor: segment "__LD", section "__aliases", type typeTempAlias.
 // NOTE(review): the trailing 'true' is presumably the section's "hidden" flag —
 // confirm against the ld::Section constructor.
 ld::Section AliasAtom::_s_section("__LD", "__aliases", ld::Section::typeTempAlias, true);

987

988

989 template <typename A>

990 class Parser

991 {

992 public:

         static bool                                                                             validFile(const uint8_t* fileContent, bool subtypeMustMatch=false, 

994 cpu_subtype_t subtype=0);

         static const char*                                                              fileKind(const uint8_t* fileContent);

         static ld::Platform                                                             findPlatform(const macho_header<typename A::P>* header, uint32_t* minOsVers);

         static bool                                                                             hasObjC2Categories(const uint8_t* fileContent);

         static bool                                                                             hasObjC1Categories(const uint8_t* fileContent);

         static bool                                                                             getNonLocalSymbols(const uint8_t* fileContnet, std::vector<const char*> &syms);

         static ld::relocatable::File*                                   parse(const uint8_t* fileContent, uint64_t fileLength, 

                                                                                                                         const char* path, time_t modTime, ld::File::Ordinal ordinal,

1002 const ParserOptions& opts) {

                                                                                                                                 Parser p(fileContent, fileLength, path, modTime, 

1004 ordinal, opts.warnUnwindConversionProblems,

1005 opts.keepDwarfUnwind, opts.forceDwarfConversion,

1006 opts.neverConvertDwarf, opts.verboseOptimizationHints,

1007 opts.ignoreMismatchPlatform);

                                                                                                                                 return p.parse(opts);

1009 }

1010

1011 typedef typename A::P P;

         typedef typename A::P::E                                        E;

         typedef typename A::P::uint_t                           pint_t;

1014

1015 struct SourceLocation {

1016 SourceLocation() {}

                                                                 SourceLocation(Atom<A>* a, uint32_t o) : atom(a), offsetInAtom(o) {}

1018 Atom<A>* atom;

1019 uint32_t offsetInAtom;

1020 };

1021

1022 struct TargetDesc {

1023 Atom<A>* atom;

1024 const char* name; // only used if targetAtom is NULL

1025 int64_t addend;

1026 bool weakImport; // only used if targetAtom is NULL

1027 #if SUPPORT_ARCH_arm64e

                 ld::Fixup::AuthData authData; // only used for authenticated pointers

1029 #endif

1030 };

1031

1032 struct FixupInAtom {

                 FixupInAtom(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, Atom<A>* target) :

                         fixup(src.offsetInAtom, c, k, target), atom(src.atom) { src.atom->incrementFixupCount(); }

1035

                 FixupInAtom(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, ld::Fixup::TargetBinding b, Atom<A>* target) :

                         fixup(src.offsetInAtom, c, k, b, target), atom(src.atom) { src.atom->incrementFixupCount(); }

1038

                 FixupInAtom(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, bool wi, const char* name) :

                         fixup(src.offsetInAtom, c, k, wi, name), atom(src.atom) { src.atom->incrementFixupCount(); }

1041

                 FixupInAtom(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, ld::Fixup::TargetBinding b, const char* name) :

                         fixup(src.offsetInAtom, c, k, b, name), atom(src.atom) { src.atom->incrementFixupCount(); }

1044

                 FixupInAtom(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, uint64_t addend) :

                         fixup(src.offsetInAtom, c, k, addend), atom(src.atom) { src.atom->incrementFixupCount(); }

1047

1048 #if SUPPORT_ARCH_arm64e

                 FixupInAtom(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, ld::Fixup::AuthData authData) :

                         fixup(src.offsetInAtom, c, k, authData), atom(src.atom) { src.atom->incrementFixupCount(); }

1051 #endif

1052

                 FixupInAtom(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k) :

                         fixup(src.offsetInAtom, c, k, (uint64_t)0), atom(src.atom) { src.atom->incrementFixupCount(); }

1055

1056 ld::Fixup fixup;

1057 Atom<A>* atom;

1058 };

1059

         void addFixup(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, Atom<A>* target) { 

                 _allFixups.push_back(FixupInAtom(src, c, k, target)); 

1062 }

1063

         void addFixup(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, ld::Fixup::TargetBinding b, Atom<A>* target) { 

                 _allFixups.push_back(FixupInAtom(src, c, k, b, target)); 

1066 }

1067

         void addFixup(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, bool wi, const char* name) { 

                 _allFixups.push_back(FixupInAtom(src, c, k, wi, name)); 

1070 }

1071

         void addFixup(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, ld::Fixup::TargetBinding b, const char* name) { 

                 _allFixups.push_back(FixupInAtom(src, c, k, b, name)); 

1074 }

1075

         void addFixup(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, uint64_t addend) { 

                 _allFixups.push_back(FixupInAtom(src, c, k, addend)); 

1078 }

1079

1080 #if SUPPORT_ARCH_arm64e

         void addFixup(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k, ld::Fixup::AuthData authData) {

                 _allFixups.push_back(FixupInAtom(src, c, k, authData));

1083 }

1084 #endif

1085

         void addFixup(const SourceLocation& src, ld::Fixup::Cluster c, ld::Fixup::Kind k) { 

                 _allFixups.push_back(FixupInAtom(src, c, k)); 

1088 }

1089

         const char*                                                                             path() { return _path; }

         uint32_t                                                                                symbolCount() { return _symbolCount; }

         uint32_t                                                                                indirectSymbol(uint32_t indirectIndex);

         const macho_nlist<P>&                                                   symbolFromIndex(uint32_t index);

         const char*                                                                             nameFromSymbol(const macho_nlist<P>& sym);

         ld::Atom::Scope                                                                 scopeFromSymbol(const macho_nlist<P>& sym);

         static ld::Atom::Definition                                             definitionFromSymbol(const macho_nlist<P>& sym);

         static ld::Atom::Combine                                                combineFromSymbol(const macho_nlist<P>& sym);

                         ld::Atom::SymbolTableInclusion                  inclusionFromSymbol(const macho_nlist<P>& sym);

         static bool                                                                             dontDeadStripFromSymbol(const macho_nlist<P>& sym);

         static bool                                                                             isThumbFromSymbol(const macho_nlist<P>& sym);

         static bool                                                                             weakImportFromSymbol(const macho_nlist<P>& sym);

         static bool                                                                             resolverFromSymbol(const macho_nlist<P>& sym);

         static bool                                                                             altEntryFromSymbol(const macho_nlist<P>& sym);

         uint32_t                                                                                symbolIndexFromIndirectSectionAddress(pint_t,const macho_section<P>*);

         const macho_section<P>*                                                 firstMachOSection() { return _sectionsStart; }

         const macho_section<P>*                                                 machOSectionFromSectionIndex(uint32_t index);

         uint32_t                                                                                machOSectionCount() { return _machOSectionsCount; }

         uint32_t                                                                                undefinedStartIndex() { return _undefinedStartIndex; }

         uint32_t                                                                                undefinedEndIndex() { return _undefinedEndIndex; }

         void                                                                                    addFixup(FixupInAtom f) { _allFixups.push_back(f); }

         Section<A>*                                                                             sectionForNum(unsigned int sectNum);

         Section<A>*                                                                             sectionForAddress(pint_t addr);

         Atom<A>*                                                                                findAtomByAddress(pint_t addr);

         Atom<A>*                                                                                findAtomByAddressOrNullIfStub(pint_t addr);

         Atom<A>*                                                                                findAtomByAddressOrLocalTargetOfStub(pint_t addr, uint32_t* offsetInAtom);

         Atom<A>*                                                                                findAtomByName(const char* name);       // slow!

         void                                                                                    findTargetFromAddress(pint_t addr, TargetDesc& target);

         void                                                                                    findTargetFromAddress(pint_t baseAddr, pint_t addr, TargetDesc& target);

         void                                                                                    findTargetFromAddressAndSectionNum(pint_t addr, unsigned int sectNum,

1120 TargetDesc& target);

         uint32_t                                                                                tentativeDefinitionCount() { return _tentativeDefinitionCount; }

         uint32_t                                                                                absoluteSymbolCount() { return _absoluteSymbolCount; }

1123

         uint32_t                                                                                fileLength() const { return _fileLength; }

         bool                                                                                    hasStubsSection() { return (_stubsSectionNum != 0); }

         unsigned int                                                                    stubsSectionNum() { return _stubsSectionNum; }

         void                                                                                    addDtraceExtraInfos(const SourceLocation& src, const char* provider);

         const char*                                                                             scanSymbolTableForAddress(uint64_t addr);

         bool                                                                                    warnUnwindConversionProblems() { return _warnUnwindConversionProblems; }

         bool                                                                                    hasDataInCodeLabels() { return _hasDataInCodeLabels; }

         bool                                                                                    keepDwarfUnwind() { return _keepDwarfUnwind; }

         bool                                                                                    forceDwarfConversion() { return _forceDwarfConversion; }

         bool                                                                                    verboseOptimizationHints() { return _verboseOptimizationHints; }

         bool                                                                                    neverConvertDwarf() { return _neverConvertDwarf; }

         bool                                                                                    armUsesZeroCostExceptions() { return _armUsesZeroCostExceptions; }

         uint8_t                                                                                 maxDefaultCommonAlignment() { return _maxDefaultCommonAlignment; }

1137

1138

         macho_data_in_code_entry<P>*                                    dataInCodeStart() { return _dataInCodeStart; }

         macho_data_in_code_entry<P>*                                    dataInCodeEnd()   { return _dataInCodeEnd; }

         const uint8_t*                                                                  optimizationHintsStart() { return _lohStart; }

         const uint8_t*                                                                  optimizationHintsEnd() { return _lohEnd; }

         bool                                                                                    hasOptimizationHints() { return _lohStart != _lohEnd; }

1144

1145

         void                                                    addFixups(const SourceLocation& src, ld::Fixup::Kind kind, const TargetDesc& target);

         void                                                    addFixups(const SourceLocation& src, ld::Fixup::Kind kind, const TargetDesc& target, const TargetDesc& picBase);

1148

1149

1150

1151 struct LabelAndCFIBreakIterator {

1152 typedef typename CFISection<A>::CFI_Atom_Info CFI_Atom_Info;

                                                                 LabelAndCFIBreakIterator(const uint32_t* ssa, uint32_t ssc, const pint_t* cfisa, 

1154 uint32_t cfisc, bool ols)

                                                                         : sortedSymbolIndexes(ssa), sortedSymbolCount(ssc), cfiStartsArray(cfisa), 

                                                                                 cfiStartsCount(cfisc), fileHasOverlappingSymbols(ols),

                                                                                 newSection(false), cfiIndex(0), symIndex(0) {}

                 bool                                    next(Parser<A>& parser, const Section<A>& sect, uint32_t sectNum, pint_t startAddr, pint_t endAddr, 

                                                                                 pint_t* addr, pint_t* size, const macho_nlist<P>** sym);

                 pint_t                                  peek(Parser<A>& parser, pint_t startAddr, pint_t endAddr);

                 void                                    beginSection() { newSection = true; symIndex = 0; }

1162

1163 const uint32_t* const sortedSymbolIndexes;

1164 const uint32_t sortedSymbolCount;

1165 const pint_t* cfiStartsArray;

1166 const uint32_t cfiStartsCount;

1167 const bool fileHasOverlappingSymbols;

1168 bool newSection;

1169 uint32_t cfiIndex;

1170 uint32_t symIndex;

1171 };

1172

1173 struct CFI_CU_InfoArrays {

1174 typedef typename CFISection<A>::CFI_Atom_Info CFI_Atom_Info;

1175 typedef typename CUSection<A>::Info CU_Info;

                                                 CFI_CU_InfoArrays(const CFI_Atom_Info* cfiAr, uint32_t cfiC, CU_Info* cuAr, uint32_t cuC) 

                                                         : cfiArray(cfiAr), cuArray(cuAr), cfiCount(cfiC), cuCount(cuC) {} 

1178 const CFI_Atom_Info* const cfiArray;

1179 CU_Info* const cuArray;

1180 const uint32_t cfiCount;

1181 const uint32_t cuCount;

1182 };

1183

1184

1185

1186 private:

1187 friend class Section<A>;

1188

         enum SectionType { sectionTypeIgnore, sectionTypeLiteral4, sectionTypeLiteral8, sectionTypeLiteral16, 

1190 sectionTypeNonLazy, sectionTypeCFI, sectionTypeCString, sectionTypeCStringPointer,

1191 sectionTypeUTF16Strings, sectionTypeCFString, sectionTypeObjC2ClassRefs, typeObjC2CategoryList,

1192 sectionTypeObjC1Classes, sectionTypeSymboled, sectionTypeObjC1ClassRefs,

1193 sectionTypeTentativeDefinitions, sectionTypeAbsoluteSymbols, sectionTypeTLVDefs,

1194 sectionTypeCompactUnwind, sectionTypeTLVPointers};

1195

1196 template <typename P>

1197 struct MachOSectionAndSectionClass

1198 {

1199 const macho_section* sect;

1200 SectionType type;

1201

                 static int sorter(const void* l, const void* r) {

                         const MachOSectionAndSectionClass<P>* left = (MachOSectionAndSectionClass<P>*)l;

                         const MachOSectionAndSectionClass<P>* right = (MachOSectionAndSectionClass<P>*)r;

                         int64_t diff = left->sect->addr() - right->sect->addr();

                         if ( diff == 0 )

1207 return 0;

                         if ( diff < 0 )

1209 return -1;

1210 else

1211 return 1;

1212 }

1213 };

1214

         struct ParserAndSectionsArray { Parser* parser; const uint32_t* sortedSectionsArray; };

1216

1217

                                                                                                         Parser(const uint8_t* fileContent, uint64_t fileLength, 

                                                                                                                         const char* path, time_t modTime, ld::File::Ordinal ordinal, 

1220 bool warnUnwindConversionProblems, bool keepDwarfUnwind,

1221 bool forceDwarfConversion, bool neverConvertDwarf,

1222 bool verboseOptimizationHints, bool ignoreMismatchPlatform);

         ld::relocatable::File*                                                  parse(const ParserOptions& opts);

1224 static uint8_t loadCommandSizeMask();

1225 static bool useSimulatorVariant();

         bool                                                                                    parseLoadCommands(ld::VersionSet platforms, bool simulator, bool ignoreMismatchPlatform);

1227 void makeSections();

1228 void prescanSymbolTable();

         void                                                                                    makeSortedSymbolsArray(uint32_t symArray[], const uint32_t sectionArray[]);

         void                                                                                    makeSortedSectionsArray(uint32_t array[]);

         static int                                                                              pointerSorter(const void* l, const void* r);

         static int                                                                              symbolIndexSorter(void* extra, const void* l, const void* r);

         static int                                                                              sectionIndexSorter(void* extra, const void* l, const void* r);

1234

1235 void parseDebugInfo();

1236 void parseStabs();

1237 void addAstFiles();

         void                                                                                    appendAliasAtoms(uint8_t* atomBuffer);

         static bool                                                                             isConstFunStabs(const char *stabStr);

         bool                                                                                    read_comp_unit(const char ** name, const char ** comp_dir,

1241 uint64_t *stmt_list);

1242 pint_t realAddr(pint_t addr);

         const char*                                                                             getDwarfString(uint64_t form, const uint8_t*& p);

         uint64_t                                                                                getDwarfOffset(uint64_t form, const uint8_t*& di, bool dwarf64);

         bool                                                                                    skip_form(const uint8_t ** offset, const uint8_t * end, 

                                                                                                                                 uint64_t form, uint8_t addr_size, bool dwarf64);

1247

1248

1249 // filled in by constructor

1250 const uint8_t* _fileContent;

1251 uint32_t _fileLength;

1252 const char* _path;

1253 time_t _modTime;

         ld::File::Ordinal                                                       _ordinal;

1255

1256 // filled in by parseLoadCommands()

1257 File<A>* _file;

1258 const macho_nlist* _symbols;

1259 uint32_t _symbolCount;

1260 uint32_t _indirectSymbolCount;

1261 const char* _strings;

1262 uint32_t _stringsSize;

1263 const uint32_t* _indirectTable;

1264 uint32_t _indirectTableCount;

1265 uint32_t _undefinedStartIndex;

1266 uint32_t _undefinedEndIndex;

1267 const macho_section* _sectionsStart;

1268 uint32_t _machOSectionsCount;

1269 bool _hasUUID;

1270 macho_data_in_code_entry* _dataInCodeStart;

1271 macho_data_in_code_entry* _dataInCodeEnd;

1272 const uint8_t* _lohStart;

1273 const uint8_t* _lohEnd;

1274

1275 // filled in by parse()

1276 CFISection<A>* _EHFrameSection;

1277 CUSection<A>* _compactUnwindSection;

1278 AbsoluteSymbolSection<A>* _absoluteSection;

1279 uint32_t _tentativeDefinitionCount;

1280 uint32_t _absoluteSymbolCount;

1281 uint32_t _symbolsInSections;

1282 bool _hasLongBranchStubs;

1283 bool _AppleObjc; // FSF has objc that uses different data layout

1284 bool _overlappingSymbols;

1285 bool _warnUnwindConversionProblems;

1286 bool _hasDataInCodeLabels;

1287 bool _keepDwarfUnwind;

1288 bool _forceDwarfConversion;

1289 bool _neverConvertDwarf;

1290 bool _verboseOptimizationHints;

1291 bool _armUsesZeroCostExceptions;

1292 bool _ignoreMismatchPlatform;

1293 bool _treateBitcodeAsData;

1294 bool _usingBitcode;

1295 uint8_t _maxDefaultCommonAlignment;

1296 unsigned int _stubsSectionNum;

1297 const macho_section* _stubsMachOSection;

         std::vector<const char*>                                        _dtraceProviderInfo;

         std::vector<FixupInAtom>                                        _allFixups;

1300 #if SUPPORT_ARCH_arm64e

1301 bool _supportsAuthenticatedPointers;

1302 #endif

1303 };

1304

1305

1306

1307 template <typename A>

 Parser<A>::Parser(const uint8_t* fileContent, uint64_t fileLength, const char* path, time_t modTime, 

                                         ld::File::Ordinal ordinal, bool convertDUI, bool keepDwarfUnwind, bool forceDwarfConversion, 

                                         bool neverConvertDwarf, bool verboseOptimizationHints, bool ignoreMismatchPlatform)

                 : _fileContent(fileContent), _fileLength(fileLength), _path(path), _modTime(modTime),

                         _ordinal(ordinal), _file(NULL),

                         _symbols(NULL), _symbolCount(0), _indirectSymbolCount(0), _strings(NULL), _stringsSize(0),

                         _indirectTable(NULL), _indirectTableCount(0), 

                         _undefinedStartIndex(0), _undefinedEndIndex(0), 

                         _sectionsStart(NULL), _machOSectionsCount(0), _hasUUID(false), 

                         _dataInCodeStart(NULL), _dataInCodeEnd(NULL),

                         _lohStart(NULL), _lohEnd(NULL),

                         _EHFrameSection(NULL), _compactUnwindSection(NULL), _absoluteSection(NULL),

                         _tentativeDefinitionCount(0), _absoluteSymbolCount(0),

                         _symbolsInSections(0), _hasLongBranchStubs(false),  _AppleObjc(false),

                         _overlappingSymbols(false), _warnUnwindConversionProblems(convertDUI), _hasDataInCodeLabels(false),

                         _keepDwarfUnwind(keepDwarfUnwind), _forceDwarfConversion(forceDwarfConversion),

1324 _neverConvertDwarf(neverConvertDwarf),

1325 _verboseOptimizationHints(verboseOptimizationHints),

1326 _ignoreMismatchPlatform(ignoreMismatchPlatform),

                         _stubsSectionNum(0), _stubsMachOSection(NULL)

1328 {

1329 }

1330

1331

1332 template <>

 bool Parser<x86>::validFile(const uint8_t* fileContent, bool, cpu_subtype_t)

1334 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         if ( header->magic() != MH_MAGIC )

1337 return false;

         if ( header->cputype() != CPU_TYPE_I386 )

1339 return false;

         if ( header->filetype() != MH_OBJECT )

1341 return false;

1342 return true;

1343 }

1344

1345 template <>

 bool Parser<x86_64>::validFile(const uint8_t* fileContent, bool, cpu_subtype_t)

1347 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         if ( header->magic() != MH_MAGIC_64 )

1350 return false;

         if ( header->cputype() != CPU_TYPE_X86_64 )

1352 return false;

         if ( header->filetype() != MH_OBJECT )

1354 return false;

1355 return true;

1356 }

1357

1358 template <>

 bool Parser<arm>::validFile(const uint8_t* fileContent, bool subtypeMustMatch, cpu_subtype_t subtype)

1360 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         if ( header->magic() != MH_MAGIC )

1363 return false;

         if ( header->cputype() != CPU_TYPE_ARM )

1365 return false;

         if ( header->filetype() != MH_OBJECT )

1367 return false;

1368 if ( subtypeMustMatch ) {

                 if ( (cpu_subtype_t)header->cpusubtype() == subtype )

1370 return true;

1371 // hack until libcc_kext.a is made fat

                 if ( header->cpusubtype() == CPU_SUBTYPE_ARM_ALL )

1373 return true;

1374 return false;

1375 }

1376 return true;

1377 }

1378

1379

1380 template <>

 bool Parser<arm64>::validFile(const uint8_t* fileContent, bool subtypeMustMatch, cpu_subtype_t subtype)

1382 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         if ( header->magic() != MH_MAGIC_64 )

1385 return false;

         if ( header->cputype() != CPU_TYPE_ARM64 )

1387 return false;

         if ( header->filetype() != MH_OBJECT )

1389 return false;

         if ( subtypeMustMatch && (header->cpusubtype() != (uint32_t)subtype) )

1391 return false;

1392 return true;

1393 }

1394

1395

1396 template <>

 const char* Parser<x86>::fileKind(const uint8_t* fileContent)

1398 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         if ( header->magic() != MH_MAGIC )

1401 return NULL;

         if ( header->cputype() != CPU_TYPE_I386 )

1403 return NULL;

1404 return "i386";

1405 }

1406

1407 template <>

 const char* Parser<x86_64>::fileKind(const uint8_t* fileContent)

1409 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         if ( header->magic() != MH_MAGIC_64 )

1412 return NULL;

         if ( header->cputype() != CPU_TYPE_X86_64 )

1414 return NULL;

1415 return "x86_64";

1416 }

1417

1418 template <>

 const char* Parser<arm>::fileKind(const uint8_t* fileContent)

1420 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         if ( header->magic() != MH_MAGIC )

1423 return NULL;

         if ( header->cputype() != CPU_TYPE_ARM )

1425 return NULL;

         for (const ArchInfo* t=archInfoArray; t->archName != NULL; ++t) {

                 if ( (t->cpuType == CPU_TYPE_ARM) && ((cpu_subtype_t)header->cpusubtype() == t->cpuSubType) ) {

1428 return t->archName;

1429 }

1430 }

1431 return "arm???";

1432 }

1433

#if SUPPORT_ARCH_arm64
// Returns "arm64" when the header carries the 64-bit magic and the ARM64 cpu
// type, otherwise NULL.  The file type is not examined.
template <>
const char* Parser<arm64>::fileKind(const uint8_t* fileContent)
{
	const macho_header<P>* mh = (const macho_header<P>*)fileContent;
	const bool isArm64 = (mh->magic() == MH_MAGIC_64) && (mh->cputype() == CPU_TYPE_ARM64);
	if ( !isArm64 )
		return NULL;
	return "arm64";
}
#endif

1446

1447

1448 template <typename A>

 bool Parser<A>::hasObjC2Categories(const uint8_t* fileContent)

1450 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         const uint32_t cmd_count = header->ncmds();

         const macho_load_command<P>* const cmds = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>));

         const macho_load_command<P>* const cmdsEnd = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>) + header->sizeofcmds());

         const macho_load_command<P>* cmd = cmds;

         for (uint32_t i = 0; i < cmd_count; ++i) {

                 if ( cmd->cmd() == macho_segment_command<P>::CMD ) {

                         const macho_segment_command<P>* segment = (macho_segment_command<P>*)cmd;

                         const macho_section<P>* sectionsStart = (macho_section<P>*)((char*)segment + sizeof(macho_segment_command<P>));

                         for (uint32_t si=0; si < segment->nsects(); ++si) {

                                 const macho_section<P>* sect = &sectionsStart[si];

                                 if ( (sect->size() > 0) 

                                         && (strcmp(sect->sectname(), "__objc_catlist") == 0)

                                         && (strcmp(sect->segname(), "__DATA") == 0) ) {

1465 return true;

1466 }

1467 }

1468 }

                 cmd = (const macho_load_command<P>*)(((char*)cmd)+cmd->cmdsize());

1470 if ( cmd > cmdsEnd )

                         throwf("malformed mach-o file, load command #%d is outside size of load commands", i);

1472 }

1473 return false;

1474 }

1475

1476

1477 template <typename A>

 bool Parser<A>::hasObjC1Categories(const uint8_t* fileContent)

1479 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         const uint32_t cmd_count = header->ncmds();

         const macho_load_command<P>* const cmds = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>));

         const macho_load_command<P>* const cmdsEnd = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>) + header->sizeofcmds());

         const macho_load_command<P>* cmd = cmds;

         for (uint32_t i = 0; i < cmd_count; ++i) {

                 if ( cmd->cmd() == macho_segment_command<P>::CMD ) {

                         const macho_segment_command<P>* segment = (macho_segment_command<P>*)cmd;

                         const macho_section<P>* sectionsStart = (macho_section<P>*)((char*)segment + sizeof(macho_segment_command<P>));

                         for (uint32_t si=0; si < segment->nsects(); ++si) {

                                 const macho_section<P>* sect = &sectionsStart[si];

                                 if ( (sect->size() > 0) 

                                         && (strcmp(sect->sectname(), "__category") == 0)

                                         && (strcmp(sect->segname(), "__OBJC") == 0) ) {

1494 return true;

1495 }

1496 }

1497 }

                 cmd = (const macho_load_command<P>*)(((char*)cmd)+cmd->cmdsize());

1499 if ( cmd > cmdsEnd )

                         throwf("malformed mach-o file, load command #%d is outside size of load commands", i);

1501 }

1502 return false;

1503 }

1504

1505

1506 template <typename A>

 bool Parser<A>::getNonLocalSymbols(const uint8_t* fileContent, std::vector<const char*> &syms)

1508 {

         const macho_header<P>* header = (const macho_header<P>*)fileContent;

         const uint32_t cmd_count = header->ncmds();

         const macho_load_command<P>* const cmds = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>));

         const macho_load_command<P>* const cmdsEnd = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>) + header->sizeofcmds());

         const macho_load_command<P>* cmd = cmds;

         for (uint32_t i = 0; i < cmd_count; ++i) {

                 if ( cmd->cmd() == LC_SYMTAB ) {

                         const macho_symtab_command<P>* symtab = (macho_symtab_command<P>*)cmd;

                         uint32_t symbolCount = symtab->nsyms();

                         const macho_nlist<P>* symbols = (const macho_nlist<P>*)(fileContent + symtab->symoff());

                         const char* strings = (char*)fileContent + symtab->stroff();

                         for (uint32_t j = 0; j < symbolCount; ++j) {

1521 // ignore stabs and count only ext symbols

                                 if ( (symbols[j].n_type() & N_STAB) == 0 &&

                                          (symbols[j].n_type() & N_EXT) != 0 ) {

                                         const char* symName = &strings[symbols[j].n_strx()];

1525 syms.push_back(symName);

1526 }

1527 }

1528 return true;

1529 }

                 cmd = (const macho_load_command<P>*)(((char*)cmd)+cmd->cmdsize());

1531 if ( cmd > cmdsEnd )

                         throwf("malformed mach-o file, load command #%d is outside size of load commands", i);

1533 }

1534 return false;

1535 }

1536

1537

1538 template <typename A>

 int Parser<A>::pointerSorter(const void* l, const void* r)

1540 {

1541 // sort references by address

         const pint_t* left = (pint_t*)l;

         const pint_t* right = (pint_t*)r;

1544 return (*left - *right);

1545 }

1546

1547 template <typename A>

 typename A::P::uint_t Parser<A>::LabelAndCFIBreakIterator::peek(Parser<A>& parser, pint_t startAddr, pint_t endAddr)

1549 {

1550 pint_t symbolAddr;

1551 if ( symIndex < sortedSymbolCount )

                 symbolAddr = parser.symbolFromIndex(sortedSymbolIndexes[symIndex]).n_value();

1553 else

1554 symbolAddr = endAddr;

1555 pint_t cfiAddr;

1556 if ( cfiIndex < cfiStartsCount )

1557 cfiAddr = cfiStartsArray[cfiIndex];

1558 else

1559 cfiAddr = endAddr;

         if ( (cfiAddr < symbolAddr) && (cfiAddr >= startAddr) ) {

1561 if ( cfiAddr < endAddr )

1562 return cfiAddr;

1563 else

1564 return endAddr;

1565 }

1566 else {

1567 if ( symbolAddr < endAddr )

1568 return symbolAddr;

1569 else

1570 return endAddr;

1571 }

1572 }

1573

1574 //

1575 // Parses up a section into chunks based on labels and CFI information.

1576 // Each call returns the next chunk address and size, and (if the break

1577 // was becuase of a label, the symbol). Returns false when no more chunks.

1578 //

1579 template <typename A>

 bool Parser<A>::LabelAndCFIBreakIterator::next(Parser<A>& parser, const Section<A>& sect, uint32_t sectNum, pint_t startAddr, pint_t endAddr, 

                                                                                                 pint_t* addr, pint_t* size, const macho_nlist<P>** symbol)

1582 {

         bool cfiApplicable = (sect.machoSection()->flags() & (S_ATTR_PURE_INSTRUCTIONS | S_ATTR_SOME_INSTRUCTIONS));

1584 // may not be a label on start of section, but need atom demarcation there

1585 if ( newSection ) {

1586 newSection = false;

1587 // advance symIndex until we get to the first label at or past the start of this section

1588 while ( symIndex < sortedSymbolCount ) {

                         const macho_nlist<P>* sym = &parser.symbolFromIndex(sortedSymbolIndexes[symIndex]);

1590 // if compile threw in "ltmp*" symbol at start of section and there is another real label at same location, ignore ltmp one

                         if ( symIndex+1 < sortedSymbolCount ) {

                                 const macho_nlist<P>* sym2 = &parser.symbolFromIndex(sortedSymbolIndexes[symIndex+1]);

                                 if ( (sym->n_sect() == sym2->n_sect()) && (sym->n_value() == sym2->n_value()) ) {

                                         if ( strncmp(parser.nameFromSymbol(*sym), "ltmp", 4) == 0 ) {

1595 ++symIndex;

1596 sym = sym2;

1597 }

1598 }

1599 }

                         if ( ! sect.ignoreLabel(parser.nameFromSymbol(*sym)) ) {

1601 pint_t nextSymbolAddr = sym->n_value();

1602 //fprintf(stderr, "sectNum=%d, nextSymbolAddr=0x%08llX, name=%s\n", sectNum, (uint64_t)nextSymbolAddr, parser.nameFromSymbol(sym));

                                 if ( (nextSymbolAddr > startAddr) || ((nextSymbolAddr == startAddr) && (sym->n_sect() == sectNum)) )

1604 break;

1605 }

1606 ++symIndex;

1607 }

1608 if ( symIndex < sortedSymbolCount ) {

                         const macho_nlist<P>& sym = parser.symbolFromIndex(sortedSymbolIndexes[symIndex]);

1610 pint_t nextSymbolAddr = sym.n_value();

1611 // if next symbol found is not in this section

                         if ( sym.n_sect() != sectNum ) {

1613 // check for CFI break instead of symbol break

1614 if ( cfiIndex < cfiStartsCount ) {

1615 pint_t nextCfiAddr = cfiStartsArray[cfiIndex];

1616 if ( nextCfiAddr < endAddr ) {

1617 // use cfi

1618 ++cfiIndex;

1619 *addr = nextCfiAddr;

                                                 *size = peek(parser, startAddr, endAddr) - nextCfiAddr;

1621 *symbol = NULL;

1622 return true;

1623 }

1624 }

1625 *addr = startAddr;

1626 *size = endAddr - startAddr;

1627 *symbol = NULL;

1628 if ( startAddr == endAddr )

1629 return false; // zero size section

1630 else

1631 return true; // whole section is one atom with no label

1632 }

1633 // if also CFI break here, eat it

1634 if ( cfiIndex < cfiStartsCount ) {

                                 if ( cfiStartsArray[cfiIndex] == nextSymbolAddr )

1636 ++cfiIndex;

1637 }

1638 if ( nextSymbolAddr == startAddr ) {

1639 // label at start of section, return it as chunk

1640 ++symIndex;

1641 *addr = startAddr;

                                 *size = peek(parser, startAddr, endAddr) - startAddr;

1643 *symbol = &sym;

1644 return true;

1645 }

1646 // return chunk before first symbol

1647 *addr = startAddr;

1648 *size = nextSymbolAddr - startAddr;

1649 *symbol = NULL;

1650 return true;

1651 }

1652 // no symbols in section, check CFI

                 if ( cfiApplicable && (cfiIndex < cfiStartsCount) ) {

1654 pint_t nextCfiAddr = cfiStartsArray[cfiIndex];

1655 if ( nextCfiAddr < endAddr ) {

1656 // use cfi

1657 ++cfiIndex;

1658 *addr = nextCfiAddr;

                                 *size = peek(parser, startAddr, endAddr) - nextCfiAddr;

1660 *symbol = NULL;

1661 return true;

1662 }

1663 }

1664 // no cfi, so whole section is one chunk

1665 *addr = startAddr;

1666 *size = endAddr - startAddr;

1667 *symbol = NULL;

1668 if ( startAddr == endAddr )

1669 return false; // zero size section

1670 else

1671 return true; // whole section is one atom with no label

1672 }

1673

         while ( (symIndex < sortedSymbolCount) && (cfiIndex < cfiStartsCount) ) {

                 const macho_nlist<P>& sym = parser.symbolFromIndex(sortedSymbolIndexes[symIndex]);

1676 pint_t nextSymbolAddr = sym.n_value();

1677 pint_t nextCfiAddr = cfiStartsArray[cfiIndex];

1678 if ( nextSymbolAddr < nextCfiAddr ) {

1679 if ( nextSymbolAddr >= endAddr )

1680 return false;

1681 ++symIndex;

1682 if ( nextSymbolAddr < startAddr )

1683 continue;

1684 *addr = nextSymbolAddr;

                         *size = peek(parser, startAddr, endAddr) - nextSymbolAddr;

1686 *symbol = &sym;

1687 return true;

1688 }

1689 else if ( nextCfiAddr < nextSymbolAddr ) {

1690 if ( nextCfiAddr >= endAddr )

1691 return false;

1692 ++cfiIndex;

1693 if ( nextCfiAddr < startAddr )

1694 continue;

1695 *addr = nextCfiAddr;

                         *size = peek(parser, startAddr, endAddr) - nextCfiAddr;

1697 *symbol = NULL;

1698 return true;

1699 }

1700 else {

1701 if ( nextCfiAddr >= endAddr )

1702 return false;

1703 ++symIndex;

1704 ++cfiIndex;

1705 if ( nextCfiAddr < startAddr )

1706 continue;

1707 *addr = nextCfiAddr;

                         *size = peek(parser, startAddr, endAddr) - nextCfiAddr;

1709 *symbol = &sym;

1710 return true;

1711 }

1712 }

1713 while ( symIndex < sortedSymbolCount ) {

                 const macho_nlist<P>& sym = parser.symbolFromIndex(sortedSymbolIndexes[symIndex]);

1715 pint_t nextSymbolAddr = sym.n_value();

1716 // if next symbol found is not in this section, then done with iteration

                 if ( sym.n_sect() != sectNum ) 

1718 return false;

1719 ++symIndex;

1720 if ( nextSymbolAddr < startAddr )

1721 continue;

1722 *addr = nextSymbolAddr;

                 *size = peek(parser, startAddr, endAddr) - nextSymbolAddr;

1724 *symbol = &sym;

1725 return true;

1726 }

1727 while ( cfiIndex < cfiStartsCount ) {

1728 pint_t nextCfiAddr = cfiStartsArray[cfiIndex];

1729 if ( nextCfiAddr >= endAddr )

1730 return false;

1731 ++cfiIndex;

1732 if ( nextCfiAddr < startAddr )

1733 continue;

1734 *addr = nextCfiAddr;

                 *size = peek(parser, startAddr, endAddr) - nextCfiAddr;

1736 *symbol = NULL;

1737 return true;

1738 }

1739 return false;

1740 }

1741

1742 template <>

 typename arm::P::uint_t Parser<arm>::realAddr(typename arm::P::uint_t addr)

1744 {

1745 return addr & (-2);

1746 }

1747

1748 template <typename A>

 typename A::P::uint_t Parser<A>::realAddr(typename A::P::uint_t addr)

1750 {

1751 return addr;

1752 }

1753

//
// STACK_ALLOC_IF_SMALL(_type, _name, _actual_count, _maxCount)
//
// Declares "_type* _name" pointing at storage for _actual_count elements.
// When _actual_count is at most _maxCount the storage is a variable length
// array on the stack named _name##_buffer; otherwise it is obtained with
// malloc() and _name##_buffer is a one element placeholder.
//
// Also declares:
//   _name##_count        _actual_count when the stack is used, 1 when the heap is used
//   _name##_stack_count  number of elements in _name##_buffer
//
// The macro never frees the malloc()ed storage: the user owns it and can tell
// the two cases apart by comparing _name against _name##_buffer.
//
// Arguments are parenthesized so expressions (e.g. "a ? b : c") can be passed
// safely; note that _actual_count is evaluated more than once.  A failed
// malloc() throws instead of silently falling back to the one element buffer.
//
#define STACK_ALLOC_IF_SMALL(_type, _name, _actual_count, _maxCount) \
	_type* _name = NULL; \
	uint32_t _name##_count = 1; \
	uint32_t _name##_stack_count = (_actual_count); \
	if ( (_actual_count) > (_maxCount) ) { \
		_name = (_type*)malloc(sizeof(_type) * (_actual_count)); \
		if ( _name == NULL ) \
			throw "out of memory"; \
		_name##_stack_count = 1; \
	} \
	else \
		_name##_count = (_actual_count); \
	_type _name##_buffer[_name##_stack_count]; \
	if ( _name == NULL ) \
		_name = _name##_buffer;

1767

1768

1769 template <typename A>

 ld::relocatable::File* Parser<A>::parse(const ParserOptions& opts)

1771 {

1772 // create file object

         _file = new File<A>(_path, _modTime, _fileContent, _ordinal);

1774

1775 // set sourceKind

1776 _file->_srcKind = opts.srcKind;

1777 // set treatBitcodeAsData

1778 _treateBitcodeAsData = opts.treateBitcodeAsData;

1779 _usingBitcode = opts.usingBitcode;

1780

1781 #if SUPPORT_ARCH_arm64e

1782 _supportsAuthenticatedPointers = opts.supportsAuthenticatedPointers;

1783 #endif

1784

1785 // respond to -t option

1786 if ( opts.logAllFiles )

                 printf("%s\n", _path);

1788

1789 _armUsesZeroCostExceptions = opts.armUsesZeroCostExceptions;

1790 _maxDefaultCommonAlignment = opts.maxDefaultCommonAlignment;

1791

1792 // parse start of mach-o file

         if ( ! parseLoadCommands(opts.platforms, opts.simulator, opts.ignoreMismatchPlatform) )

1794 return _file;

1795

1796 // make array of

1797 uint32_t sortedSectionIndexes[_machOSectionsCount];

         this->makeSortedSectionsArray(sortedSectionIndexes);

1799

1800 // make symbol table sorted by address

1801 this->prescanSymbolTable();

1802 uint32_t sortedSymbolIndexes[_symbolsInSections];

         this->makeSortedSymbolsArray(sortedSymbolIndexes, sortedSectionIndexes);

1804

1805 // allocate Section<A> object for each mach-o section

1806 makeSections();

1807

1808 // if it exists, do special early parsing of __compact_unwind section

1809 uint32_t countOfCUs = 0;

1810 if ( _compactUnwindSection != NULL )

1811 countOfCUs = _compactUnwindSection->count();

1812 // stack allocate (if not too large) cuInfoBuffer

         STACK_ALLOC_IF_SMALL(typename CUSection<A>::Info, cuInfoArray, countOfCUs, 1024);

         if ( countOfCUs != 0 )

                 _compactUnwindSection->parse(*this, countOfCUs, cuInfoArray);

1816

1817 // create lists of address that already have compact unwind and thus don't need the dwarf parsed

1818 unsigned cuLsdaCount = 0;

         STACK_ALLOC_IF_SMALL(pint_t, cuStarts, countOfCUs, 1024);

         for (uint32_t i=0; i < countOfCUs; ++i) {

                 if ( CUSection<A>::encodingMeansUseDwarf(cuInfoArray[i].compactUnwindInfo) )

1822 cuStarts[i] = -1;

1823 else

                         cuStarts[i] = cuInfoArray[i].functionStartAddress;

                 if ( cuInfoArray[i].lsdaAddress != 0 )

1826 ++cuLsdaCount;

1827 }

1828

1829

1830 // if it exists, do special early parsing of __eh_frame section

1831 // stack allocate (if not too large) array of CFI_Atom_Info

1832 uint32_t countOfCFIs = 0;

1833 if ( _EHFrameSection != NULL )

                 countOfCFIs = _EHFrameSection->cfiCount(*this);

         STACK_ALLOC_IF_SMALL(typename CFISection<A>::CFI_Atom_Info, cfiArray, countOfCFIs, 1024);

1836

1837 // stack allocate (if not too large) a copy of __eh_frame to apply relocations to

1838 uint32_t sectSize = 4;

         if ( (countOfCFIs != 0) && _EHFrameSection->needsRelocating() ) 

                 sectSize = _EHFrameSection->machoSection()->size()+4;

         STACK_ALLOC_IF_SMALL(uint8_t, ehBuffer, sectSize, 50*1024);

1842 uint32_t cfiStartsCount = 0;

         if ( countOfCFIs != 0 ) {

                 _EHFrameSection->cfiParse(*this, ehBuffer, cfiArray, countOfCFIs, cuStarts, countOfCUs);

1845 // count functions and lsdas

                 for(uint32_t i=0; i < countOfCFIs; ++i) {

                         if ( cfiArray[i].isCIE )

1848 continue;

1849 //fprintf(stderr, "cfiArray[i].func = 0x%08llX, cfiArray[i].lsda = 0x%08llX, encoding=0x%08X\n",

1850 // (uint64_t)cfiArray[i].u.fdeInfo.function.targetAddress,

1851 // (uint64_t)cfiArray[i].u.fdeInfo.lsda.targetAddress,

1852 // cfiArray[i].u.fdeInfo.compactUnwindInfo);

                         if ( cfiArray[i].u.fdeInfo.function.targetAddress != CFI_INVALID_ADDRESS )

1854 ++cfiStartsCount;

                         if ( cfiArray[i].u.fdeInfo.lsda.targetAddress != CFI_INVALID_ADDRESS )

1856 ++cfiStartsCount;

1857 }

1858 }

         CFI_CU_InfoArrays cfis(cfiArray, countOfCFIs, cuInfoArray, countOfCUs);

1860

1861 // create sorted array of function starts and lsda starts

1862 pint_t cfiStartsArray[cfiStartsCount+cuLsdaCount];

1863 uint32_t countOfFDEs = 0;

1864 uint32_t cfiStartsArrayCount = 0;

         if ( countOfCFIs != 0 ) {

                 for(uint32_t i=0; i < countOfCFIs; ++i) {

                         if ( cfiArray[i].isCIE )

1868 continue;

                         if ( cfiArray[i].u.fdeInfo.function.targetAddress != CFI_INVALID_ADDRESS )

                                 cfiStartsArray[cfiStartsArrayCount++] = realAddr(cfiArray[i].u.fdeInfo.function.targetAddress);

                         if ( cfiArray[i].u.fdeInfo.lsda.targetAddress != CFI_INVALID_ADDRESS )

                                 cfiStartsArray[cfiStartsArrayCount++] = cfiArray[i].u.fdeInfo.lsda.targetAddress;

1873 ++countOfFDEs;

1874 }

1875 }

         if ( cuLsdaCount != 0 ) {

1877 // merge in an lsda info from compact unwind

                 for (uint32_t i=0; i < countOfCUs; ++i) {

                         if ( cuInfoArray[i].lsdaAddress == 0 )

1880 continue;

1881 // append to cfiStartsArray if not already in that list

1882 bool found = false;

                         for(uint32_t j=0; j < cfiStartsArrayCount; ++j) {

                                 if ( cfiStartsArray[j] == cuInfoArray[i].lsdaAddress )

1885 found = true;

1886 }

1887 if ( ! found ) {

                                 cfiStartsArray[cfiStartsArrayCount++] = cuInfoArray[i].lsdaAddress;

1889 }

1890 }

1891 }

         if ( cfiStartsArrayCount != 0 ) {

                 ::qsort(cfiStartsArray, cfiStartsArrayCount, sizeof(pint_t), pointerSorter);

1894 #ifndef NDEBUG

1895 // scan for FDEs claming the same function

                 for(uint32_t i=1; i < cfiStartsArrayCount; ++i) {

                         assert( cfiStartsArray[i] != cfiStartsArray[i-1] );

1898 }

1899 #endif

1900 }

1901

         Section<A>** sections = _file->_sectionsArray;

1903 uint32_t sectionsCount = _file->_sectionsArrayCount;

1904

1905 // figure out how many atoms will be allocated and allocate

         LabelAndCFIBreakIterator breakIterator(sortedSymbolIndexes, _symbolsInSections, cfiStartsArray, 

1907 cfiStartsArrayCount, _overlappingSymbols);

1908 uint32_t computedAtomCount = 0;

         for (uint32_t i=0; i < sectionsCount; ++i ) {

1910 breakIterator.beginSection();

                 uint32_t count = sections[i]->computeAtomCount(*this, breakIterator, cfis);

1912 //const macho_section* sect = sections[i]->machoSection();

1913 //fprintf(stderr, "computed count=%u for section %s size=%llu\n", count, sect->sectname(), (sect != NULL) ? sect->size() : 0);

1914 computedAtomCount += count;

1915 }

1916 //fprintf(stderr, "allocating %d atoms * sizeof(Atom<A>)=%ld, sizeof(ld::Atom)=%ld\n", computedAtomCount, sizeof(Atom<A>), sizeof(ld::Atom));

         _file->_atomsArray = new uint8_t[computedAtomCount*sizeof(Atom<A>)];

1918 _file->_atomsArrayCount = 0;

1919

1920 // have each section append atoms to _atomsArray

         LabelAndCFIBreakIterator breakIterator2(sortedSymbolIndexes, _symbolsInSections, cfiStartsArray, 

1922 cfiStartsArrayCount, _overlappingSymbols);

         for (uint32_t i=0; i < sectionsCount; ++i ) {

                 uint8_t* atoms = _file->_atomsArray + _file->_atomsArrayCount*sizeof(Atom<A>);

1925 breakIterator2.beginSection();

                 uint32_t count = sections[i]->appendAtoms(*this, atoms, breakIterator2, cfis);

1927 //fprintf(stderr, "append count=%u for section %s/%s\n", count, sections[i]->machoSection()->segname(), sections[i]->machoSection()->sectname());

1928 _file->_atomsArrayCount += count;

1929 }

         assert( _file->_atomsArrayCount == computedAtomCount && "more atoms allocated than expected");

1931

1932

1933 // have each section add all fix-ups for its atoms

         _allFixups.reserve(computedAtomCount*5);

         for (uint32_t i=0; i < sectionsCount; ++i )

                 sections[i]->makeFixups(*this, cfis);

1937

1938 // assign fixups start offset for each atom

         uint8_t* p = _file->_atomsArray;

1940 uint32_t fixupOffset = 0;

         for(int i=_file->_atomsArrayCount; i > 0; --i) {

                 Atom<A>* atom = (Atom<A>*)p;

1943 atom->_fixupsStartIndex = fixupOffset;

1944 fixupOffset += atom->_fixupsCount;

1945 atom->_fixupsCount = 0;

                 p += sizeof(Atom<A>);

1947 }

         assert(fixupOffset == _allFixups.size());

         _file->_fixups.resize(fixupOffset);

1950

1951 // copy each fixup for each atom

         for(typename std::vector<FixupInAtom>::iterator it=_allFixups.begin(); it != _allFixups.end(); ++it) {

                 uint32_t slot = it->atom->_fixupsStartIndex + it->atom->_fixupsCount;

                 _file->_fixups[slot] = it->fixup;

1955 it->atom->_fixupsCount++;

1956 }

1957

1958 // done with temp vector

1959 _allFixups.clear();

1960

1961 // add unwind info

         _file->_unwindInfos.reserve(countOfFDEs+countOfCUs);

         for(uint32_t i=0; i < countOfCFIs; ++i) {

                 if ( cfiArray[i].isCIE )

1965 continue;

                 if ( cfiArray[i].u.fdeInfo.function.targetAddress != CFI_INVALID_ADDRESS ) {

                         ld::Atom::UnwindInfo info;

1968 info.startOffset = 0;

                         info.unwindInfo = cfiArray[i].u.fdeInfo.compactUnwindInfo;

                         _file->_unwindInfos.push_back(info);

                         Atom<A>* func = findAtomByAddress(cfiArray[i].u.fdeInfo.function.targetAddress);

                         func->setUnwindInfoRange(_file->_unwindInfos.size()-1, 1);

1973 //fprintf(stderr, "cu from dwarf =0x%08X, atom=%s\n", info.unwindInfo, func->name());

1974 }

1975 }

1976 // apply compact infos in __LD,__compact_unwind section to each function

1977 // if function also has dwarf unwind, CU will override it

1978 Atom<A>* lastFunc = NULL;

1979 uint32_t lastEnd = 0;

         for(uint32_t i=0; i < countOfCUs; ++i) {

                 typename CUSection<A>::Info* info = &cuInfoArray[i];

                 assert(info->function != NULL);

                 ld::Atom::UnwindInfo ui;

                 ui.startOffset = info->functionStartAddress - info->function->objectAddress();

1985 ui.unwindInfo = info->compactUnwindInfo;

                 _file->_unwindInfos.push_back(ui);

1987 // don't override with converted cu with "use dwarf" cu, if forcing dwarf conversion

                 if ( !_forceDwarfConversion || !CUSection<A>::encodingMeansUseDwarf(info->compactUnwindInfo) ) {

1989 //fprintf(stderr, "cu=0x%08X, atom=%s\n", ui.unwindInfo, info->function->name());

1990 // if previous is for same function, extend range

                         if ( info->function == lastFunc ) {

                                 if ( lastEnd != ui.startOffset ) {

                                         if ( lastEnd < ui.startOffset )

                                                 warning("__LD,__compact_unwind entries for %s have a gap at offset 0x%0X", info->function->name(), lastEnd);

1995 else

                                                 warning("__LD,__compact_unwind entries for %s overlap at offset 0x%0X", info->function->name(), lastEnd);

1997 }

1998 lastFunc->extendUnwindInfoRange();

1999 }

2000 else

                                 info->function->setUnwindInfoRange(_file->_unwindInfos.size()-1, 1);

2002 lastFunc = info->function;

                         lastEnd = ui.startOffset + info->rangeLength;

2004 }

2005 }

2006

2007 // process indirect symbols which become AliasAtoms

2008 _file->_aliasAtomsArray = NULL;

2009 _file->_aliasAtomsArrayCount = 0;

         if ( _indirectSymbolCount != 0 ) {

2011 _file->_aliasAtomsArrayCount = _indirectSymbolCount;

                 _file->_aliasAtomsArray = new uint8_t[_file->_aliasAtomsArrayCount*sizeof(AliasAtom)];

                 this->appendAliasAtoms(_file->_aliasAtomsArray);

2014 }

2015

2016

2017 // parse dwarf debug info to get line info

2018 this->parseDebugInfo();

2019

2020 return _file;

2021 }

2022

 //
// Formats a packed version number as text into buffer (32 bytes).
// The layout read here is: major in the upper 16 bits, minor in bits 8-15,
// patch in the low 8 bits.  The result is "major.minor.patch", or just
// "major.minor" when the patch byte is zero.
//
static void versionToString(uint32_t value, char buffer[32])
{
	const unsigned int major = value >> 16;
	const unsigned int minor = (value >> 8) & 0xFF;
	const unsigned int patch = value & 0xFF;
	// snprintf keeps the write inside the caller's 32 byte buffer, and %u
	// matches the unsigned arguments
	if ( patch != 0 )
		snprintf(buffer, 32, "%u.%u.%u", major, minor, patch);
	else
		snprintf(buffer, 32, "%u.%u", major, minor);
}

2030

 //
// Per-architecture mask applied to a load command's cmdsize: any bit of the
// size that falls inside the mask makes the parser reject the command as
// having an unaligned size.  0x03 requires a multiple of 4, 0x07 a multiple of 8.
//
template <>
uint8_t Parser<x86>::loadCommandSizeMask()
{
	return 0x03;
}

template <>
uint8_t Parser<x86_64>::loadCommandSizeMask()
{
	return 0x07;
}

template <>
uint8_t Parser<arm>::loadCommandSizeMask()
{
	return 0x03;
}

template <>
uint8_t Parser<arm64>::loadCommandSizeMask()
{
	return 0x07;
}

//
// Whether version load commands in objects of this architecture are mapped
// to the simulator flavor of a platform: true for x86 and x86_64, false for
// every other architecture.
//
template <>
bool Parser<x86>::useSimulatorVariant()
{
	return true;
}

template <>
bool Parser<x86_64>::useSimulatorVariant()
{
	return true;
}

template <typename A>
bool Parser<A>::useSimulatorVariant()
{
	return false;
}

2038

2039

2040 template <typename A>

 bool Parser<A>::parseLoadCommands(ld::VersionSet platforms, bool simulator, bool ignoreMismatchPlatform)

2042 {

         const macho_header<P>* header = (const macho_header<P>*)_fileContent;

2044

2045 // set File attributes

         _file->_canScatterAtoms = (header->flags() & MH_SUBSECTIONS_VIA_SYMBOLS);

         _file->_cpuSubType = header->cpusubtype();

2048

         const macho_segment_command<P>* segment = NULL;

         const uint8_t* const endOfFile = _fileContent + _fileLength;

         const uint32_t cmd_count = header->ncmds();

2052 // <rdar://problem/5394172> an empty .o file with zero load commands will crash linker

         if ( cmd_count == 0 )

2054 return false;

2055 ld::VersionSet lcPlatforms;

         const macho_load_command<P>* const cmds = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>));

         const macho_load_command<P>* const cmdsEnd = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>) + header->sizeofcmds());

         const macho_load_command<P>* cmd = cmds;

         for (uint32_t i = 0; i < cmd_count; ++i) {

                 uint32_t size = cmd->cmdsize();

                 if ( (size & this->loadCommandSizeMask()) != 0 )

                         throwf("load command #%d has a unaligned size", i);

                 const uint8_t* endOfCmd = ((uint8_t*)cmd)+cmd->cmdsize();

                 if ( endOfCmd > (uint8_t*)cmdsEnd )

                         throwf("load command #%d extends beyond the end of the load commands", i);

2066 if ( endOfCmd > endOfFile )

                         throwf("load command #%d extends beyond the end of the file", i);

                 switch (cmd->cmd()) {

2069 case LC_SYMTAB:

2070 {

                                         const macho_symtab_command<P>* symtab = (macho_symtab_command<P>*)cmd;

2072 _symbolCount = symtab->nsyms();

                                         _symbols = (const macho_nlist<P>*)(_fileContent + symtab->symoff());

                                         _strings = (char*)_fileContent + symtab->stroff();

2075 _stringsSize = symtab->strsize();

                                         if ( (symtab->symoff() + _symbolCount*sizeof(macho_nlist<P>)) > _fileLength )

2077 throw "mach-o symbol table extends beyond end of file";

                                         if ( (_strings + _stringsSize) > (char*)endOfFile )

2079 throw "mach-o string pool extends beyond end of file";

2080 if ( _indirectTable == NULL ) {

                                                 if ( _undefinedEndIndex == 0 ) {

2082 _undefinedStartIndex = 0;

2083 _undefinedEndIndex = symtab->nsyms();

2084 }

2085 }

2086 }

2087 break;

2088 case LC_DYSYMTAB:

2089 {

                                         const macho_dysymtab_command<P>* dsymtab = (macho_dysymtab_command<P>*)cmd;

                                         _indirectTable = (uint32_t*)(_fileContent + dsymtab->indirectsymoff());

2092 _indirectTableCount = dsymtab->nindirectsyms();

                                         if ( &_indirectTable[_indirectTableCount] > (uint32_t*)endOfFile )

2094 throw "indirect symbol table extends beyond end of file";

2095 _undefinedStartIndex = dsymtab->iundefsym();

                                         _undefinedEndIndex = _undefinedStartIndex + dsymtab->nundefsym();

2097 }

2098 break;

2099 case LC_UUID:

2100 _hasUUID = true;

2101 break;

2102 case LC_DATA_IN_CODE:

2103 {

                                         const macho_linkedit_data_command<P>* dc = (macho_linkedit_data_command<P>*)cmd;

                                         _dataInCodeStart = (macho_data_in_code_entry<P>*)(_fileContent + dc->dataoff());

                                         _dataInCodeEnd = (macho_data_in_code_entry<P>*)(_fileContent + dc->dataoff() + dc->datasize());

                                         if ( _dataInCodeEnd > (macho_data_in_code_entry<P>*)endOfFile )

2108 throw "LC_DATA_IN_CODE table extends beyond end of file";

2109 }

2110 break;

2111 case LC_LINKER_OPTION:

2112 {

                                         const macho_linker_option_command<P>* loc = (macho_linker_option_command<P>*)cmd;

                                         const char* buffer = loc->buffer();

                                         _file->_linkerOptions.resize(_file->_linkerOptions.size() + 1);

                                         std::vector<const char*>& vec = _file->_linkerOptions.back();

                                         for (uint32_t j=0; j < loc->count(); ++j) {

2118 vec.push_back(buffer);

                                                 buffer += strlen(buffer) + 1;

2120 }

                                         if ( buffer > ((char*)cmd + loc->cmdsize()) )

2122 throw "malformed LC_LINKER_OPTION";

2123 }

2124 break;

2125 case LC_LINKER_OPTIMIZATION_HINTS:

2126 {

                                         const macho_linkedit_data_command<P>* loh = (macho_linkedit_data_command<P>*)cmd;

                                         _lohStart = _fileContent + loh->dataoff();

                                         _lohEnd = _fileContent + loh->dataoff() + loh->datasize();

2130 if ( _lohEnd > endOfFile )

2131 throw "LC_LINKER_OPTIMIZATION_HINTS table extends beyond end of file";

2132 }

2133 break;

2134 case LC_VERSION_MIN_MACOSX:

2135 case LC_VERSION_MIN_IPHONEOS:

2136 case LC_VERSION_MIN_WATCHOS:

2137 case LC_VERSION_MIN_TVOS:

2138 if ( ignoreMismatchPlatform )

2139 break;

                                 lcPlatforms.add({Options::platformForLoadCommand(cmd->cmd(), useSimulatorVariant()), ((macho_version_min_command<P>*)cmd)->version()});

                                 _file->_platforms.add({Options::platformForLoadCommand(cmd->cmd(), useSimulatorVariant()), ((macho_version_min_command<P>*)cmd)->version()});

2142 break;

2143 case LC_BUILD_VERSION:

2144 {

                                         const macho_build_version_command<P>* buildVersCmd = (macho_build_version_command<P>*)cmd;

2146 if ( ignoreMismatchPlatform )

2147 break;

                                         lcPlatforms.add({(ld::Platform)buildVersCmd->platform(), buildVersCmd->minos()});

                                         _file->_platforms.add({(ld::Platform)buildVersCmd->platform(), buildVersCmd->minos()});

                                         const macho_build_tool_version<P>* entry = (macho_build_tool_version<P>*)((uint8_t*)cmd + sizeof(macho_build_version_command<P>));

                                         for (uint32_t t=0; t < buildVersCmd->ntools(); ++t) {

                                                 _file->_toolVersions.push_back(std::make_pair(entry->tool(), entry->version()));

2153 ++entry;

2154 }

2155 }

2156 break;

2157 case macho_segment_command::CMD:

2158 if ( segment != NULL )

2159 throw "more than one LC_SEGMENT found in object file";

2160 segment = (macho_segment_command*)cmd;

2161 break;

2162 default:

2163 // ignore unknown load commands

2164 break;

2165 }

                 cmd = (const macho_load_command<P>*)(((char*)cmd)+cmd->cmdsize());

2167 if ( cmd > cmdsEnd )

                         throwf("malformed mach-o file, load command #%d is outside size of load commands", i);

2169 }

2170

2171 // arm/arm64 objects are default to ios platform if not set.

2172 // rdar://problem/21746314

         if (lcPlatforms.empty() &&

                 (std::is_same<A, arm>::value || std::is_same<A, arm64>::value))

                 lcPlatforms.add({ld::kPlatform_iOS,0});

2176

2177 // Check platform cross-linking.

2178 if ( !ignoreMismatchPlatform ) {

2179 __block bool warned = false;

                 platforms.forEach(^(ld::Platform platform, uint32_t version, bool &stop) {

                         if ( !warned && !lcPlatforms.contains(platform) ) {

2182 if (_usingBitcode)

                                         throwf("building for %s, but linking in object file built for %s,",

                                                    platforms.to_str().c_str(), lcPlatforms.to_str().c_str());

2185 #if 0

2186 // FIXME: Re-enable once clang supports zippering

2187 // <rdar://problem/36749415> Turn off "urgent:" linker warning about iOSMac / macOS mismatch

2188 else

                                         warning("URGENT: building for %s, but linking in object file (%s) built for %s. "

2190 "Note: This will be an error in the future.",

                                                         platforms.to_str().c_str(), path(), lcPlatforms.to_str().c_str());

2192 #endif

2193 warned = true;

2194 }

                         if ( version && (lcPlatforms.minOS(platform) > version) ) {

2196 char t1[32];

2197 char t2[32];

                                 versionToString(lcPlatforms.minOS(platform), t1);

2199 versionToString(version, t2);

                                 warning("object file (%s) was built for newer %s version (%s) than being linked (%s)",

                                                 _path, Options::platformName(platform), t1, t2);

2202 }

2203 });

2204 }

2205

2206 // validate just one segment

2207 if ( segment == NULL )

2208 throw "missing LC_SEGMENT";

         if ( segment->filesize() > _fileLength )

2210 throw "LC_SEGMENT filesize too large";

2211

2212 // record and validate sections

         _sectionsStart = (macho_section<P>*)((char*)segment + sizeof(macho_segment_command<P>));

2214 _machOSectionsCount = segment->nsects();

         if ( (sizeof(macho_segment_command<P>) + _machOSectionsCount * sizeof(macho_section<P>)) > segment->cmdsize() )

2216 throw "too many sections for size of LC_SEGMENT command";

2217

2218 return true;

2219 }

2220

2221 template <typename A>

 ld::Platform Parser<A>::findPlatform(const macho_header<P>* header, uint32_t* minOsVers)

2223 {

         const uint32_t cmd_count = header->ncmds();

         if ( cmd_count == 0 )

2226 return ld::kPlatform_unknown;

         const macho_load_command<P>* const cmds = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>));

         const macho_load_command<P>* const cmdsEnd = (macho_load_command<P>*)((char*)header + sizeof(macho_header<P>) + header->sizeofcmds());

         const macho_load_command<P>* cmd = cmds;

         for (uint32_t i = 0; i < cmd_count; ++i) {

                 uint32_t size = cmd->cmdsize();

                 if ( (size & loadCommandSizeMask()) != 0 )

                         throwf("load command #%d has a unaligned size", i);

                 const uint8_t* endOfCmd = ((uint8_t*)cmd)+cmd->cmdsize();

                 if ( endOfCmd > (uint8_t*)cmdsEnd )

                         throwf("load command #%d extends beyond the end of the load commands", i);

                 const macho_version_min_command<P>* versCmd = (macho_version_min_command<P>*)cmd;

                 const macho_build_version_command<P>* buildVersCmd = (macho_build_version_command<P>*)cmd;

                 *minOsVers = versCmd->version();

                 switch (cmd->cmd()) {

2241 case LC_VERSION_MIN_MACOSX:

2242 return ld::kPlatform_macOS;

2243 case LC_VERSION_MIN_IPHONEOS:

2244 if (useSimulatorVariant())

2245 return ld::kPlatform_iOSSimulator;

2246 else

2247 return ld::kPlatform_iOS;

2248 case LC_VERSION_MIN_WATCHOS:

2249 if (useSimulatorVariant())

2250 return ld::kPlatform_watchOSSimulator;

2251 else

2252 return ld::kPlatform_watchOS;

2253 case LC_VERSION_MIN_TVOS:

2254 if (useSimulatorVariant())

2255 return ld::kPlatform_tvOSSimulator;

2256 else

2257 return ld::kPlatform_tvOS;

2258 case LC_BUILD_VERSION:

                                 *minOsVers = buildVersCmd->minos();

                                 return (ld::Platform)buildVersCmd->platform();

2261 }

                 cmd = (const macho_load_command<P>*)(((char*)cmd)+cmd->cmdsize());

2263 if ( cmd > cmdsEnd )

                         throwf("malformed mach-o file, load command #%d is outside size of load commands", i);

2265 }

2266 *minOsVers = 0;

2267 return ld::kPlatform_unknown;

2268 }

2269

2270

2271 template <typename A>

 void Parser<A>::prescanSymbolTable()

2273 {

2274 _tentativeDefinitionCount = 0;

2275 _absoluteSymbolCount = 0;

2276 _symbolsInSections = 0;

2277 _hasDataInCodeLabels = false;

         for (uint32_t i=0; i < this->_symbolCount; ++i) {

                 const macho_nlist<P>& sym =     symbolFromIndex(i);

2280 // ignore stabs

                 if ( (sym.n_type() & N_STAB) != 0 )

2282 continue;

2283

2284 // look at undefines

                 const char* symbolName = this->nameFromSymbol(sym);

                 if ( (sym.n_type() & N_TYPE) == N_UNDF ) {

                         if ( sym.n_value() != 0 ) {

2288 // count tentative definitions

2289 ++_tentativeDefinitionCount;

2290 }

                         else if ( strncmp(symbolName, "___dtrace_", 10) == 0 ) {

2292 // any undefined starting with __dtrace_*$ that is not ___dtrace_probe$* or ___dtrace_isenabled$*

2293 // is extra provider info

                                 if ( (strncmp(&symbolName[10], "probe$", 6) != 0) && (strncmp(&symbolName[10], "isenabled$", 10) != 0) ) {

2295 _dtraceProviderInfo.push_back(symbolName);

2296 }

2297 }

2298 continue;

2299 }

                 else if ( ((sym.n_type() & N_TYPE) == N_INDR) && ((sym.n_type() & N_EXT) != 0) ) {

2301 _indirectSymbolCount++;

2302 continue;

2303 }

2304

2305 // count absolute symbols

                 if ( (sym.n_type() & N_TYPE) == N_ABS ) {

                         const char* absName = this->nameFromSymbol(sym);

2308 // ignore .objc_class_name_* symbols

                         if ( strncmp(absName, ".objc_class_name_", 17) == 0 ) {

2310 _AppleObjc = true;

2311 continue;

2312 }

2313 // ignore .objc_class_name_* symbols

                         if ( strncmp(absName, ".objc_category_name_", 20) == 0 )

2315 continue;

2316 // ignore empty *.eh symbols

                         if ( strcmp(&absName[strlen(absName)-3], ".eh") == 0 )

2318 continue;

2319 ++_absoluteSymbolCount;

2320 }

2321

2322 // only look at definitions

                 if ( (sym.n_type() & N_TYPE) != N_SECT )

2324 continue;

2325

2326 // 'L' labels do not denote atom breaks

                 if ( symbolName[0] == 'L' ) {

2328 // <rdar://problem/9218847> Formalize data in code with L$start$ labels

                         if ( strncmp(symbolName, "L$start$", 8) == 0 ) 

2330 _hasDataInCodeLabels = true;

2331 continue;

2332 }

2333 // how many def syms in each section

                 if ( sym.n_sect() > _machOSectionsCount )

2335 throw "bad n_sect in symbol table";

2336

2337 _symbolsInSections++;

2338 }

2339 }

2340

2341 template <typename A>

 void Parser<A>::appendAliasAtoms(uint8_t* p)

2343 {

         for (uint32_t i=0; i < this->_symbolCount; ++i) {

                 const macho_nlist<P>& sym =     symbolFromIndex(i);

2346 // ignore stabs

                 if ( (sym.n_type() & N_STAB) != 0 )

2348 continue;

2349

2350 // only look at N_INDR symbols

                 if ( (sym.n_type() & N_TYPE) != N_INDR ) 

2352 continue;

2353

2354 // skip non-external aliases

                 if ( (sym.n_type() & N_EXT) == 0 ) 

2356 continue;

2357

                 const char* symbolName = this->nameFromSymbol(sym);

                 const char* aliasOfName = &_strings[sym.n_value()];

                 bool isHiddenVisibility = (sym.n_type() & N_PEXT);

2361 AliasAtom* allocatedSpace = (AliasAtom*)p;

                 new (allocatedSpace) AliasAtom(symbolName, isHiddenVisibility, _file, aliasOfName);

2363 p += sizeof(AliasAtom);

2364 }

2365 }

2366

2367

2368

2369 template <typename A>

 int Parser<A>::sectionIndexSorter(void* extra, const void* l, const void* r)

2371 {

         Parser<A>* parser = (Parser<A>*)extra;

         const uint32_t* left = (uint32_t*)l;

         const uint32_t* right = (uint32_t*)r;

         const macho_section<P>* leftSect =      parser->machOSectionFromSectionIndex(*left);

         const macho_section<P>* rightSect = parser->machOSectionFromSectionIndex(*right);

2377

2378 // can't just return difference because 64-bit diff does not fit in 32-bit return type

         int64_t result = leftSect->addr() - rightSect->addr();

         if ( result == 0 ) {

2381 // two sections with same start address

2382 // one with zero size goes first

                 bool leftEmpty = ( leftSect->size() == 0 );

                 bool rightEmpty = ( rightSect->size() == 0 );

2385 if ( leftEmpty != rightEmpty ) {

                         return ( rightEmpty ? 1 : -1 );

2387 }

2388 if ( !leftEmpty && !rightEmpty )

2389 throwf("overlapping sections");

2390 // both empty, so chose file order

2391 return ( rightSect - leftSect );

2392 }

         else if ( result < 0 )

2394 return -1;

2395 else

2396 return 1;

2397 }

2398

2399 template <typename A>

 void Parser<A>::makeSortedSectionsArray(uint32_t array[])

2401 {

2402 const bool log = false;

2403

2404 if ( log ) {

                 fprintf(stderr, "unsorted sections:\n");

                 for(unsigned int i=0; i < _machOSectionsCount; ++i ) 

                         fprintf(stderr, "0x%08llX %s %s\n", _sectionsStart[i].addr(), _sectionsStart[i].segname(), _sectionsStart[i].sectname());

2408 }

2409

2410 // sort by symbol table address

         for (uint32_t i=0; i < _machOSectionsCount; ++i)

2412 array[i] = i;

         ::qsort_r(array, _machOSectionsCount, sizeof(uint32_t), this, &sectionIndexSorter);

2414

2415 if ( log ) {

                 fprintf(stderr, "sorted sections:\n");

                 for(unsigned int i=0; i < _machOSectionsCount; ++i ) 

                         fprintf(stderr, "0x%08llX %s %s\n", _sectionsStart[array[i]].addr(), _sectionsStart[array[i]].segname(), _sectionsStart[array[i]].sectname());

2419 }

2420 }

2421

2422

2423

2424 template <typename A>

 int Parser<A>::symbolIndexSorter(void* extra, const void* l, const void* r)

2426 {

2427 ParserAndSectionsArray* extraInfo = (ParserAndSectionsArray*)extra;

         Parser<A>* parser = extraInfo->parser;

         const uint32_t* sortedSectionsArray = extraInfo->sortedSectionsArray;

         const uint32_t* left = (uint32_t*)l;

         const uint32_t* right = (uint32_t*)r;

         const macho_nlist<P>& leftSym = parser->symbolFromIndex(*left);

         const macho_nlist<P>& rightSym = parser->symbolFromIndex(*right);

2434 // can't just return difference because 64-bit diff does not fit in 32-bit return type

         int64_t result = leftSym.n_value() - rightSym.n_value();

         if ( result == 0 ) {

2437 // two symbols with same address

2438 // if in different sections, sort earlier section first

                 if ( leftSym.n_sect() != rightSym.n_sect() ) {

                         for (uint32_t i=0; i < parser->machOSectionCount(); ++i) {

                                 if ( sortedSectionsArray[i]+1 == leftSym.n_sect() )

2442 return -1;

                                 if ( sortedSectionsArray[i]+1 == rightSym.n_sect() )

2444 return 1;

2445 }

2446 }

2447 // two symbols in same section, means one is an alias

2448 // if one is ltmp*, make it an alias (sort first)

                 const char* leftName  = parser->nameFromSymbol(leftSym);

                 const char* rightName = parser->nameFromSymbol(rightSym);

                 bool leftIsTmp  = strncmp(leftName,  "ltmp", 4);

                 bool rightIsTmp = strncmp(rightName, "ltmp", 4);

2453 if ( leftIsTmp != rightIsTmp ) {

                         return (rightIsTmp ? -1 : 1);

2455 }

2456

2457 // if only one is global, make the other an alias (sort first)

                 if ( (leftSym.n_type() & N_EXT) != (rightSym.n_type() & N_EXT) ) {

                         if ( (rightSym.n_type() & N_EXT) != 0 )

2460 return -1;

2461 else

2462 return 1;

2463 }

2464 // if both are global, sort alphabetically. earlier one will be the alias

                 return ( strcmp(rightName, leftName) );

2466 }

         else if ( result < 0 )

2468 return -1;

2469 else

2470 return 1;

2471 }

2472

2473

2474 template <typename A>

 void Parser<A>::makeSortedSymbolsArray(uint32_t array[], const uint32_t sectionArray[])

2476 {

2477 const bool log = false;

2478

2479 uint32_t* p = array;

         for (uint32_t i=0; i < this->_symbolCount; ++i) {

                 const macho_nlist<P>& sym =     symbolFromIndex(i);

2482 // ignore stabs

                 if ( (sym.n_type() & N_STAB) != 0 )

2484 continue;

2485

2486 // only look at definitions

                 if ( (sym.n_type() & N_TYPE) != N_SECT )

2488 continue;

2489

2490 // 'L' labels do not denote atom breaks

                 const char* symbolName = this->nameFromSymbol(sym);

                 if ( symbolName[0] == 'L' )

2493 continue;

2494

2495 // how many def syms in each section

                 if ( sym.n_sect() > _machOSectionsCount )

2497 throw "bad n_sect in symbol table";

2498

2499 // append to array

2500 *p++ = i;

2501 }

         assert(p == &array[_symbolsInSections] && "second pass over symbol table yield a different number of symbols");

2503

2504 // sort by symbol table address

2505 ParserAndSectionsArray extra = { this, sectionArray };

         ::qsort_r(array, _symbolsInSections, sizeof(uint32_t), &extra, &symbolIndexSorter);

2507

2508

2509 // look for two symbols at same address

2510 _overlappingSymbols = false;

         for (unsigned int i=1; i < _symbolsInSections; ++i) {

                 if ( symbolFromIndex(array[i-1]).n_value() == symbolFromIndex(array[i]).n_value() ) {

2513 //fprintf(stderr, "overlapping symbols at 0x%08llX\n", symbolFromIndex(array[i-1]).n_value());

2514 _overlappingSymbols = true;

2515 break;

2516 }

2517 }

2518

2519 if ( log ) {

                 fprintf(stderr, "sorted symbols:\n");

                 for(unsigned int i=0; i < _symbolsInSections; ++i ) 

                         fprintf(stderr, "0x%09llX symIndex=%d sectNum=%2d, %s\n", symbolFromIndex(array[i]).n_value(), array[i], symbolFromIndex(array[i]).n_sect(), nameFromSymbol(symbolFromIndex(array[i])) );

2523 }

2524 }

2525

2526 template <typename A>

 void Parser<A>::makeSections()

2528 {

2529 // classify each section by type

2530 // compute how many Section objects will be needed and total size for all

2531 unsigned int totalSectionsSize = 0;

         uint8_t machOSectsStorage[sizeof(MachOSectionAndSectionClass<P>)*(_machOSectionsCount+2)]; // also room for tentative-defs and absolute symbols

2533 // allocate raw storage for all section objects on stack

         MachOSectionAndSectionClass<P>* machOSects = (MachOSectionAndSectionClass<P>*)machOSectsStorage;

2535 unsigned int count = 0;

2536 // local variable for bitcode parsing

         const macho_section<P>* bitcodeSect = NULL;

         const macho_section<P>* cmdlineSect = NULL;

         const macho_section<P>* swiftCmdlineSect = NULL;

         const macho_section<P>* bundleSect = NULL;

2541 bool bitcodeAsm = false;

2542

         for (uint32_t i=0; i < _machOSectionsCount; ++i) {

                 const macho_section<P>* sect = &_sectionsStart[i];

                 uint8_t sectionType = (sect->flags() & SECTION_TYPE);

                 if ( (sect->offset() + sect->size() > _fileLength) && (sectionType != S_ZEROFILL) && (sectionType != S_THREAD_LOCAL_ZEROFILL) )

                         throwf("section %s/%s extends beyond end of file,", sect->segname(), sect->sectname());

2548

                 if ( (sect->flags() & S_ATTR_DEBUG) != 0 ) {

                         if ( strcmp(sect->segname(), "__DWARF") == 0 ) {

2551 // note that .o file has dwarf

                                 _file->_debugInfoKind = ld::relocatable::File::kDebugInfoDwarf;

2553 // save off iteresting dwarf sections

                                 if ( strcmp(sect->sectname(), "__debug_info") == 0 )

2555 _file->_dwarfDebugInfoSect = sect;

                                 else if ( strcmp(sect->sectname(), "__debug_abbrev") == 0 )

2557 _file->_dwarfDebugAbbrevSect = sect;

                                 else if ( strcmp(sect->sectname(), "__debug_line") == 0 )

2559 _file->_dwarfDebugLineSect = sect;

                                 else if ( strcmp(sect->sectname(), "__debug_str") == 0 )

2561 _file->_dwarfDebugStringSect = sect;

2562 // linker does not propagate dwarf sections to output file

2563 continue;

2564 }

                         else if ( strcmp(sect->segname(), "__LD") == 0 ) {

                                 if ( strncmp(sect->sectname(), "__compact_unwind", 16) == 0 ) {

2567 machOSects[count].sect = sect;

                                         totalSectionsSize += sizeof(CUSection<A>);

2569 machOSects[count++].type = sectionTypeCompactUnwind;

2570 continue;

2571 }

2572 }

2573 }

                 if ( strcmp(sect->segname(), "__LLVM") == 0 ) {

2575 // Process bitcode segement

                         if ( strncmp(sect->sectname(), "__bitcode", 9) == 0 ) {

2577 bitcodeSect = sect;

                         } else if ( strncmp(sect->sectname(), "__cmdline", 9) == 0 ) {

2579 cmdlineSect = sect;

                         } else if ( strncmp(sect->sectname(), "__swift_cmdline", 15) == 0 ) {

2581 swiftCmdlineSect = sect;

                         } else if ( strncmp(sect->sectname(), "__bundle", 8) == 0 ) {

2583 bundleSect = sect;

                         } else if ( strncmp(sect->sectname(), "__asm", 5) == 0 ) {

2585 bitcodeAsm = true;

2586 }

2587 // If treat the bitcode as data, continue to parse as a normal section.

2588 if ( !_treateBitcodeAsData )

2589 continue;

2590 }

2591 // ignore empty __OBJC sections

                 if ( (sect->size() == 0) && (strcmp(sect->segname(), "__OBJC") == 0) )

2593 continue;

2594 // objc image info section is really attributes and not content

                 if ( ((strcmp(sect->sectname(), "__image_info") == 0) && (strcmp(sect->segname(), "__OBJC") == 0))

                         || ((strncmp(sect->sectname(), "__objc_imageinfo", 16) == 0) && (strcmp(sect->segname(), "__DATA") == 0)) ) {

2597 // struct objc_image_info {

2598 // uint32_t version; // initially 0

2599 // uint32_t flags;

2600 // };

2601 // #define OBJC_IMAGE_SUPPORTS_GC 2

2602 // #define OBJC_IMAGE_GC_ONLY 4

2603 // #define OBJC_IMAGE_IS_SIMULATED 32

2604 // #define OBJC_IMAGE_HAS_CATEGORY_CLASS_PROPERTIES 64

2605 //

                         const uint32_t* contents = (uint32_t*)(_file->fileContent()+sect->offset());

                         if ( (sect->size() >= 8) && (contents[0] == 0) ) {

                                 uint32_t flags = E::get32(contents[1]);

2609 _file->_hasObjC = true;

                                 _file->_swiftVersion = ((flags >> 8) & 0xFF);

                 _file->_objcHasCategoryClassPropertiesField = (flags & 64);

                                 if ( sect->size() > 8 ) {

                                         warning("section %s/%s has unexpectedly large size %llu in %s", 

                                                         sect->segname(), Section<A>::makeSectionName(sect), sect->size(), _file->path());

2615 }

2616 }

2617 else {

                                 warning("can't parse %s/%s section in %s", sect->segname(), Section<A>::makeSectionName(sect), _file->path());

2619 }

2620 continue;

2621 }

2622 machOSects[count].sect = sect;

                 switch ( sect->flags() & SECTION_TYPE ) {

2624 case S_SYMBOL_STUBS:

                                 if ( _stubsSectionNum == 0 ) {

2626 _stubsSectionNum = i+1;

2627 _stubsMachOSection = sect;

2628 }

2629 else

                                         assert(1 && "multiple S_SYMBOL_STUBS sections");

2631 case S_LAZY_SYMBOL_POINTERS:

2632 break;

2633 case S_4BYTE_LITERALS:

                                 totalSectionsSize += sizeof(Literal4Section<A>);

2635 machOSects[count++].type = sectionTypeLiteral4;

2636 break;

2637 case S_8BYTE_LITERALS:

                                 totalSectionsSize += sizeof(Literal8Section<A>);

2639 machOSects[count++].type = sectionTypeLiteral8;

2640 break;

2641 case S_16BYTE_LITERALS:

                                 totalSectionsSize += sizeof(Literal16Section<A>);

2643 machOSects[count++].type = sectionTypeLiteral16;

2644 break;

2645 case S_NON_LAZY_SYMBOL_POINTERS:

                                 totalSectionsSize += sizeof(NonLazyPointerSection<A>);

2647 machOSects[count++].type = sectionTypeNonLazy;

2648 break;

2649 case S_THREAD_LOCAL_VARIABLE_POINTERS:

                                 totalSectionsSize += sizeof(TLVPointerSection<A>);

2651 machOSects[count++].type = sectionTypeTLVPointers;

2652 break;

2653 case S_LITERAL_POINTERS:

                                 if ( (strcmp(sect->segname(), "__OBJC") == 0) && (strcmp(sect->sectname(), "__cls_refs") == 0) ) {

                                         totalSectionsSize += sizeof(Objc1ClassReferences<A>);

2656 machOSects[count++].type = sectionTypeObjC1ClassRefs;

2657 }

2658 else {

                                         totalSectionsSize += sizeof(PointerToCStringSection<A>);

2660 machOSects[count++].type = sectionTypeCStringPointer;

2661 }

2662 break;

2663 case S_CSTRING_LITERALS:

                                 totalSectionsSize += sizeof(CStringSection<A>);

2665 machOSects[count++].type = sectionTypeCString;

2666 break;

2667 case S_MOD_INIT_FUNC_POINTERS:

2668 case S_MOD_TERM_FUNC_POINTERS:

2669 case S_THREAD_LOCAL_INIT_FUNCTION_POINTERS:

2670 case S_INTERPOSING:

2671 case S_ZEROFILL:

2672 case S_REGULAR:

2673 case S_COALESCED:

2674 case S_THREAD_LOCAL_REGULAR:

2675 case S_THREAD_LOCAL_ZEROFILL:

                                 if ( (strcmp(sect->segname(), "__TEXT") == 0) && (strcmp(sect->sectname(), "__eh_frame") == 0) ) {

                                         totalSectionsSize += sizeof(CFISection<A>);

2678 machOSects[count++].type = sectionTypeCFI;

2679 }

                                 else if ( (strcmp(sect->segname(), "__DATA") == 0) && (strcmp(sect->sectname(), "__cfstring") == 0) ) {

                                         totalSectionsSize += sizeof(CFStringSection<A>);

2682 machOSects[count++].type = sectionTypeCFString;

2683 }

                                 else if ( (strcmp(sect->segname(), "__TEXT") == 0) && (strcmp(sect->sectname(), "__ustring") == 0) ) {

                                         totalSectionsSize += sizeof(UTF16StringSection<A>);

2686 machOSects[count++].type = sectionTypeUTF16Strings;

2687 }

                                 else if ( (strcmp(sect->segname(), "__DATA") == 0) && (strncmp(sect->sectname(), "__objc_classrefs", 16) == 0) ) {

                                         totalSectionsSize += sizeof(ObjC2ClassRefsSection<A>);

2690 machOSects[count++].type = sectionTypeObjC2ClassRefs;

2691 }

                                 else if ( (strcmp(sect->segname(), "__DATA") == 0) && (strcmp(sect->sectname(), "__objc_catlist") == 0) ) {

                                         totalSectionsSize += sizeof(ObjC2CategoryListSection<A>);

2694 machOSects[count++].type = typeObjC2CategoryList;

2695 }

                                 else if ( _AppleObjc && (strcmp(sect->segname(), "__OBJC") == 0) && (strcmp(sect->sectname(), "__class") == 0) ) {

                                         totalSectionsSize += sizeof(ObjC1ClassSection<A>);

2698 machOSects[count++].type = sectionTypeObjC1Classes;

2699 }

2700 else {

                                         totalSectionsSize += sizeof(SymboledSection<A>);

2702 machOSects[count++].type = sectionTypeSymboled;

2703 }

2704 break;

2705 case S_THREAD_LOCAL_VARIABLES:

                                 totalSectionsSize += sizeof(TLVDefsSection<A>);

2707 machOSects[count++].type = sectionTypeTLVDefs;

2708 break;

2709 default:

                                 throwf("unknown section type %d", sect->flags() & SECTION_TYPE);

2711 }

2712 }

2713

2714 // Create bitcode

2715 if ( bitcodeSect != NULL ) {

2716 if ( cmdlineSect != NULL )

                         _file->_bitcode = std::unique_ptr<ld::Bitcode>(new ld::ClangBitcode(&_fileContent[bitcodeSect->offset()], bitcodeSect->size(),

                                                                                                                                                                 &_fileContent[cmdlineSect->offset()], cmdlineSect->size()));

2719 else if ( swiftCmdlineSect != NULL )

                         _file->_bitcode = std::unique_ptr<ld::Bitcode>(new ld::SwiftBitcode(&_fileContent[bitcodeSect->offset()], bitcodeSect->size(),

                                                                                                                                                                 &_fileContent[swiftCmdlineSect->offset()], swiftCmdlineSect->size()));

2722 else

                         throwf("Object file with bitcode missing cmdline options: %s", _file->path());

2724 }

2725 else if ( bundleSect != NULL )

                 _file->_bitcode = std::unique_ptr<ld::Bitcode>(new ld::BundleBitcode(&_fileContent[bundleSect->offset()], bundleSect->size()));

2727 else if ( bitcodeAsm )

                 _file->_bitcode = std::unique_ptr<ld::Bitcode>(new ld::AsmBitcode(_fileContent, _fileLength));

2729

2730 // sort by address (mach-o object files don't aways have sections sorted)

         ::qsort(machOSects, count, sizeof(MachOSectionAndSectionClass<P>), MachOSectionAndSectionClass<P>::sorter);

2732

2733 // we will synthesize a dummy Section<A> object for tentative definitions

         if ( _tentativeDefinitionCount > 0 ) {

                 totalSectionsSize += sizeof(TentativeDefinitionSection<A>);

2736 machOSects[count++].type = sectionTypeTentativeDefinitions;

2737 }

2738

2739 // we will synthesize a dummy Section<A> object for Absolute symbols

         if ( _absoluteSymbolCount > 0 ) {

                 totalSectionsSize += sizeof(AbsoluteSymbolSection<A>);

2742 machOSects[count++].type = sectionTypeAbsoluteSymbols;

2743 }

2744

2745 // allocate one block for all Section objects as well as pointers to each

         uint8_t* space = new uint8_t[totalSectionsSize+count*sizeof(Section<A>*)];

         _file->_sectionsArray = (Section<A>**)space;

2748 _file->_sectionsArrayCount = count;

         Section<A>** objects = _file->_sectionsArray;

         space += count*sizeof(Section<A>*);

         for (uint32_t i=0; i < count; ++i) {

                 switch ( machOSects[i].type ) {

2753 case sectionTypeIgnore:

2754 break;

2755 case sectionTypeLiteral4:

                                 *objects++ = new (space) Literal4Section<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(Literal4Section<A>);

2758 break;

2759 case sectionTypeLiteral8:

                                 *objects++ = new (space) Literal8Section<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(Literal8Section<A>);

2762 break;

2763 case sectionTypeLiteral16:

                                 *objects++ = new (space) Literal16Section<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(Literal16Section<A>);

2766 break;

2767 case sectionTypeNonLazy:

                                 *objects++ = new (space) NonLazyPointerSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(NonLazyPointerSection<A>);

2770 break;

2771 case sectionTypeTLVPointers:

                                 *objects++ = new (space) TLVPointerSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(TLVPointerSection<A>);

2774 break;

2775 case sectionTypeCFI:

                                 _EHFrameSection = new (space) CFISection<A>(*this, *_file, machOSects[i].sect);

2777 *objects++ = _EHFrameSection;

                                 space += sizeof(CFISection<A>);

2779 break;

2780 case sectionTypeCString:

                                 *objects++ = new (space) CStringSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(CStringSection<A>);

2783 break;

2784 case sectionTypeCStringPointer:

                                 *objects++ = new (space) PointerToCStringSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(PointerToCStringSection<A>);

2787 break;

2788 case sectionTypeObjC1ClassRefs:

                                 *objects++ = new (space) Objc1ClassReferences<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(Objc1ClassReferences<A>);

2791 break;

2792 case sectionTypeUTF16Strings:

                                 *objects++ = new (space) UTF16StringSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(UTF16StringSection<A>);

2795 break;

2796 case sectionTypeCFString:

                                 *objects++ = new (space) CFStringSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(CFStringSection<A>);

2799 break;

2800 case sectionTypeObjC2ClassRefs:

                                 *objects++ = new (space) ObjC2ClassRefsSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(ObjC2ClassRefsSection<A>);

2803 break;

2804 case typeObjC2CategoryList:

                                 *objects++ = new (space) ObjC2CategoryListSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(ObjC2CategoryListSection<A>);

2807 break;

2808 case sectionTypeObjC1Classes:

                                 *objects++ = new (space) ObjC1ClassSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(ObjC1ClassSection<A>);

2811 break;

2812 case sectionTypeSymboled:

                                 *objects++ = new (space) SymboledSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(SymboledSection<A>);

2815 break;

2816 case sectionTypeTLVDefs:

                                 *objects++ = new (space) TLVDefsSection<A>(*this, *_file, machOSects[i].sect);

                                 space += sizeof(TLVDefsSection<A>);

2819 break;

2820 case sectionTypeCompactUnwind:

                                 _compactUnwindSection = new (space) CUSection<A>(*this, *_file, machOSects[i].sect);

2822 *objects++ = _compactUnwindSection;

                                 space += sizeof(CUSection<A>);

2824 break;

2825 case sectionTypeTentativeDefinitions:

                                 *objects++ = new (space) TentativeDefinitionSection<A>(*this, *_file);

                                 space += sizeof(TentativeDefinitionSection<A>);

2828 break;

2829 case sectionTypeAbsoluteSymbols:

                                 _absoluteSection = new (space) AbsoluteSymbolSection<A>(*this, *_file);

2831 *objects++ = _absoluteSection;

                                 space += sizeof(AbsoluteSymbolSection<A>);

2833 break;

2834 default:

2835 throw "internal error uknown SectionType";

2836 }

2837 }

2838 }

2839

2840

2841 template <typename A>

 Section<A>* Parser<A>::sectionForAddress(typename A::P::uint_t addr)

2843 {

         for (uint32_t i=0; i < _file->_sectionsArrayCount; ++i ) {

                 const macho_section<typename A::P>* sect = _file->_sectionsArray[i]->machoSection();

2846 // TentativeDefinitionSection and AbsoluteSymbolSection have no mach-o section

2847 if ( sect != NULL ) {

                         if ( (sect->addr() <= addr) && (addr < (sect->addr()+sect->size())) ) {

2849 return _file->_sectionsArray[i];

2850 }

2851 }

2852 }

2853 // not strictly in any section

2854 // may be in a zero length section

         for (uint32_t i=0; i < _file->_sectionsArrayCount; ++i ) {

                 const macho_section<typename A::P>* sect = _file->_sectionsArray[i]->machoSection();

2857 // TentativeDefinitionSection and AbsoluteSymbolSection have no mach-o section

2858 if ( sect != NULL ) {

                         if ( (sect->addr() == addr) && (sect->size() == 0) ) {

2860 return _file->_sectionsArray[i];

2861 }

2862 }

2863 }

2864

         throwf("sectionForAddress(0x%llX) address not in any section", (uint64_t)addr);

2866 }

2867

2868 template <typename A>

 Section<A>* Parser<A>::sectionForNum(unsigned int num)

2870 {

         for (uint32_t i=0; i < _file->_sectionsArrayCount; ++i ) {

                 const macho_section<typename A::P>* sect = _file->_sectionsArray[i]->machoSection();

2873 // TentativeDefinitionSection and AbsoluteSymbolSection have no mach-o section

2874 if ( sect != NULL ) {

                         if ( num == (unsigned int)((sect - _sectionsStart)+1) )

2876 return _file->_sectionsArray[i];

2877 }

2878 }

         throwf("sectionForNum(%u) section number not for any section", num);

2880 }

2881

2882 template <typename A>

 Atom<A>* Parser<A>::findAtomByAddress(pint_t addr)

2884 {

         Section<A>* section = this->sectionForAddress(addr);

         return section->findAtomByAddress(addr);

2887 }

2888

2889 template <typename A>

 Atom<A>* Parser<A>::findAtomByAddressOrNullIfStub(pint_t addr)

2891 {

         if ( hasStubsSection() && (_stubsMachOSection->addr() <= addr) && (addr < (_stubsMachOSection->addr()+_stubsMachOSection->size())) ) 

2893 return NULL;

2894 return findAtomByAddress(addr);

2895 }

2896

2897 template <typename A>

 Atom<A>* Parser<A>::findAtomByAddressOrLocalTargetOfStub(pint_t addr, uint32_t* offsetInAtom)

2899 {

         if ( hasStubsSection() && (_stubsMachOSection->addr() <= addr) && (addr < (_stubsMachOSection->addr()+_stubsMachOSection->size())) ) {

2901 // target is a stub, remove indirection

                 uint32_t symbolIndex = this->symbolIndexFromIndirectSectionAddress(addr, _stubsMachOSection);

2903 assert(symbolIndex != INDIRECT_SYMBOL_LOCAL);

                 const macho_nlist<P>& sym = this->symbolFromIndex(symbolIndex);

2905 // can't be to external weak symbol

                 assert( (this->combineFromSymbol(sym) != ld::Atom::combineByName) || (this->scopeFromSymbol(sym) != ld::Atom::scopeGlobal) );

2907 *offsetInAtom = 0;

                 return this->findAtomByName(this->nameFromSymbol(sym));

2909 }

         Atom<A>* target = this->findAtomByAddress(addr);

         *offsetInAtom = addr - target->_objAddress;

2912 return target;

2913 }

2914

2915 template <typename A>

 Atom<A>* Parser<A>::findAtomByName(const char* name)

2917 {

         uint8_t* p = _file->_atomsArray;

         for(int i=_file->_atomsArrayCount; i > 0; --i) {

                 Atom<A>* atom = (Atom<A>*)p;

                 if ( strcmp(name, atom->name()) == 0 )

2922 return atom;

                 p += sizeof(Atom<A>);

2924 }

2925 return NULL;

2926 }

2927

2928 template <typename A>

 void Parser<A>::findTargetFromAddress(pint_t addr, TargetDesc& target)

2930 {

         if ( hasStubsSection() && (_stubsMachOSection->addr() <= addr) && (addr < (_stubsMachOSection->addr()+_stubsMachOSection->size())) ) {

2932 // target is a stub, remove indirection

                 uint32_t symbolIndex = this->symbolIndexFromIndirectSectionAddress(addr, _stubsMachOSection);

2934 assert(symbolIndex != INDIRECT_SYMBOL_LOCAL);

                 const macho_nlist<P>& sym = this->symbolFromIndex(symbolIndex);

2936 target.atom = NULL;

                 target.name = this->nameFromSymbol(sym);

                 target.weakImport = this->weakImportFromSymbol(sym);

2939 target.addend = 0;

2940 return;

2941 }

         Section<A>* section = this->sectionForAddress(addr);

         target.atom = section->findAtomByAddress(addr);

         target.addend = addr - target.atom->_objAddress;

2945 target.weakImport = false;

2946 target.name = NULL;

2947 }

2948

2949 template <typename A>

 void Parser<A>::findTargetFromAddress(pint_t baseAddr, pint_t addr, TargetDesc& target)

2951 {

2952 findTargetFromAddress(baseAddr, target);

         target.addend = addr - target.atom->_objAddress;

2954 }

2955

2956 template <typename A>

 void Parser<A>::findTargetFromAddressAndSectionNum(pint_t addr, unsigned int sectNum, TargetDesc& target)

2958 {

2959 if ( sectNum == R_ABS ) {

2960 // target is absolute symbol that corresponds to addr

2961 if ( _absoluteSection != NULL ) {

                         target.atom = _absoluteSection->findAbsAtomForValue(addr);

                         if ( target.atom != NULL ) {

2964 target.name = NULL;

2965 target.weakImport = false;

2966 target.addend = 0;

2967 return;

2968 }

2969 }

2970 throwf("R_ABS reloc but no absolute symbol at target address");

2971 }

2972

         if ( hasStubsSection() && (stubsSectionNum() == sectNum) ) {

2974 // target is a stub, remove indirection

                 uint32_t symbolIndex = this->symbolIndexFromIndirectSectionAddress(addr, _stubsMachOSection);

2976 assert(symbolIndex != INDIRECT_SYMBOL_LOCAL);

                 const macho_nlist<P>& sym = this->symbolFromIndex(symbolIndex);

2978 // use direct reference when stub is to a static function

                 if ( ((sym.n_type() & N_TYPE) == N_SECT) && (((sym.n_type() & N_EXT) == 0) || (this->nameFromSymbol(sym)[0] == 'L')) ) {

                         this->findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), target);

2981 }

2982 else {

2983 target.atom = NULL;

                         target.name = this->nameFromSymbol(sym);

                         target.weakImport = this->weakImportFromSymbol(sym);

2986 target.addend = 0;

2987 }

2988 return;

2989 }

         Section<A>* section = this->sectionForNum(sectNum);

         target.atom = section->findAtomByAddress(addr);

         if ( target.atom == NULL ) {

                 typedef typename A::P::sint_t sint_t;

2994 sint_t a = (sint_t)addr;

                 sint_t sectStart = (sint_t)(section->machoSection()->addr());

                 sint_t sectEnd  = sectStart + section->machoSection()->size();

2997 if ( a < sectStart ) {

2998 // target address is before start of section, so must be negative addend

                         target.atom = section->findAtomByAddress(sectStart);

3000 target.addend = a - sectStart;

3001 target.weakImport = false;

3002 target.name = NULL;

3003 return;

3004 }

3005 else if ( a >= sectEnd ) {

                         target.atom = section->findAtomByAddress(sectEnd-1);

3007 target.addend = a - sectEnd;

3008 target.weakImport = false;

3009 target.name = NULL;

3010 return;

3011 }

3012 }

         assert(target.atom != NULL);

         target.addend = addr - target.atom->_objAddress;

3015 target.weakImport = false;

3016 target.name = NULL;

3017 }

3018

3019 template <typename A>

 void Parser<A>::addDtraceExtraInfos(const SourceLocation& src, const char* providerName)

3021 {

3022 // for every ___dtrace_stability$* and ___dtrace_typedefs$* undefine with

3023 // a matching provider name, add a by-name kDtraceTypeReference at probe site

         const char* dollar = strchr(providerName, '$');

3025 if ( dollar != NULL ) {

                 int providerNameLen = dollar-providerName+1;

                 for ( std::vector<const char*>::iterator it = _dtraceProviderInfo.begin(); it != _dtraceProviderInfo.end(); ++it) {

                         const char* typeDollar = strchr(*it, '$');

3029 if ( typeDollar != NULL ) {

                                 if ( strncmp(typeDollar+1, providerName, providerNameLen) == 0 ) {

                                         addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindDtraceExtra,false, *it);

3032 }

3033 }

3034 }

3035 }

3036 }

3037

3038 template <typename A>

 const char* Parser<A>::scanSymbolTableForAddress(uint64_t addr)

3040 {

3041 uint64_t closestSymAddr = 0;

3042 const char* closestSymName = NULL;

         for (uint32_t i=0; i < this->_symbolCount; ++i) {

                 const macho_nlist<P>& sym =     symbolFromIndex(i);

3045 // ignore stabs

                 if ( (sym.n_type() & N_STAB) != 0 )

3047 continue;

3048

3049 // only look at definitions

                 if ( (sym.n_type() & N_TYPE) != N_SECT )

3051 continue;

3052

3053 // return with exact match

                 if ( sym.n_value() == addr ) {

                         const char* name = nameFromSymbol(sym);

                         if ( strncmp(name, "ltmp", 4) != 0 ) 

3057 return name;

3058 // treat 'ltmp*' labels as close match

3059 closestSymAddr = sym.n_value();

3060 closestSymName = name;

3061 }

3062

3063 // record closest seen so far

                 if ( (sym.n_value() < addr) && ((sym.n_value() > closestSymAddr) || (closestSymName == NULL)) )

3065 closestSymName = nameFromSymbol(sym);

3066 }

3067

         return (closestSymName != NULL) ? closestSymName : "unknown";

3069 }

3070

3071

3072 template <typename A>

 void Parser<A>::addFixups(const SourceLocation& src, ld::Fixup::Kind setKind, const TargetDesc& target)

3074 {

3075 // some fixup pairs can be combined

         ld::Fixup::Cluster cl = ld::Fixup::k1of3;

         ld::Fixup::Kind firstKind = ld::Fixup::kindSetTargetAddress;

3078 bool combined = false;

3079

3080 #if SUPPORT_ARCH_arm64e

         bool isAuthenticated = setKind == ld::Fixup::kindStoreLittleEndianAuth64;

3082 // Authenticated pointers need an extra fixup for the auth data.

3083 if (isAuthenticated)

                 cl = ld::Fixup::k2of4;

3085 #endif

         if ( target.addend == 0 ) {

                 cl = ld::Fixup::k1of1;

3088 combined = true;

3089 switch ( setKind ) {

                         case ld::Fixup::kindStoreLittleEndian32:

                                 firstKind = ld::Fixup::kindStoreTargetAddressLittleEndian32;

3092 break;

                         case ld::Fixup::kindStoreLittleEndian64:

                                 firstKind = ld::Fixup::kindStoreTargetAddressLittleEndian64;

3095 break;

                         case ld::Fixup::kindStoreBigEndian32:

                                 firstKind = ld::Fixup::kindStoreTargetAddressBigEndian32;

3098 break;

                         case ld::Fixup::kindStoreBigEndian64:

                                 firstKind = ld::Fixup::kindStoreTargetAddressBigEndian64;

3101 break;

                         case ld::Fixup::kindStoreX86BranchPCRel32:

                                 firstKind = ld::Fixup::kindStoreTargetAddressX86BranchPCRel32;

3104 break;

                         case ld::Fixup::kindStoreX86PCRel32:

                                 firstKind = ld::Fixup::kindStoreTargetAddressX86PCRel32;

3107 break;

                         case ld::Fixup::kindStoreX86PCRel32GOTLoad:

                                 firstKind = ld::Fixup::kindStoreTargetAddressX86PCRel32GOTLoad;

3110 break;

                         case ld::Fixup::kindStoreX86PCRel32TLVLoad:

                                 firstKind = ld::Fixup::kindStoreTargetAddressX86PCRel32TLVLoad;

3113 break;

                         case ld::Fixup::kindStoreX86Abs32TLVLoad:

                                 firstKind = ld::Fixup::kindStoreTargetAddressX86Abs32TLVLoad;

3116 break;

                         case ld::Fixup::kindStoreARMBranch24:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARMBranch24;

3119 break;

                         case ld::Fixup::kindStoreThumbBranch22:

                                 firstKind = ld::Fixup::kindStoreTargetAddressThumbBranch22;

3122 break;

3123 #if SUPPORT_ARCH_arm64

                         case ld::Fixup::kindStoreARM64Branch26:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARM64Branch26;

3126 break;

                         case ld::Fixup::kindStoreARM64Page21:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARM64Page21;

3129 break;

                         case ld::Fixup::kindStoreARM64PageOff12:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARM64PageOff12;

3132 break;

                         case ld::Fixup::kindStoreARM64GOTLoadPage21:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARM64GOTLoadPage21;

3135 break;

                         case ld::Fixup::kindStoreARM64GOTLoadPageOff12:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARM64GOTLoadPageOff12;

3138 break;

                         case ld::Fixup::kindStoreARM64TLVPLoadPage21:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARM64TLVPLoadPage21;

3141 break;

                         case ld::Fixup::kindStoreARM64TLVPLoadPageOff12:

                                 firstKind = ld::Fixup::kindStoreTargetAddressARM64TLVPLoadPageOff12;

3144 break;

3145 #endif

3146 #if SUPPORT_ARCH_arm64e

                         case ld::Fixup::kindStoreLittleEndianAuth64:

                                 firstKind = ld::Fixup::kindStoreTargetAddressLittleEndianAuth64;

                                 cl = ld::Fixup::k2of2;

3150 break;

3151 #endif

3152 default:

3153 combined = false;

                                 cl = ld::Fixup::k1of2;

3155 break;

3156 }

3157 }

3158

3159 #if SUPPORT_ARCH_arm64e

3160 // As the auth data is independent of the addend and target, we can just always

3161 // put it first.

3162 if (isAuthenticated) {

                 if (cl == ld::Fixup::k2of2) {

                         addFixup(src, ld::Fixup::k1of2, ld::Fixup::kindSetAuthData, target.authData);

3165 } else {

                         assert(cl == ld::Fixup::k2of4);

                         addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetAuthData, target.authData);

3168 }

3169 }

3170 #endif

3171

         if ( target.atom != NULL ) {

                 if ( target.atom->scope() == ld::Atom::scopeTranslationUnit ) {

                         addFixup(src, cl, firstKind, target.atom);

3175 }

                 else if ( (target.atom->combine() == ld::Atom::combineByNameAndContent) || (target.atom->combine() == ld::Atom::combineByNameAndReferences) ) {

                         addFixup(src, cl, firstKind, ld::Fixup::bindingByContentBound, target.atom);

3178 }

                 else if ( (src.atom->section().type() == ld::Section::typeCFString) && (src.offsetInAtom != 0) ) {

3180 // backing string in CFStrings should always be direct

                         addFixup(src, cl, firstKind, target.atom);

3182 }

                 else if ( (src.atom == target.atom) && (target.atom->combine() == ld::Atom::combineByName) ) {

3184 // reference to self should always be direct

                         addFixup(src, cl, firstKind, target.atom);

3186 }

3187 else {

3188 // change direct fixup to by-name fixup

                         addFixup(src, cl, firstKind, false, target.atom->name());

3190 }

3191 }

3192 else {

                 addFixup(src, cl, firstKind, target.weakImport, target.name);

3194 }

         if ( target.addend == 0 ) {

3196 #if SUPPORT_ARCH_arm64e

3197 if (isAuthenticated)

3198 assert(combined);

3199 #endif

3200 if ( ! combined )

                         addFixup(src, ld::Fixup::k2of2, setKind);

3202 }

3203 else {

3204 #if SUPPORT_ARCH_arm64e

3205 if (isAuthenticated) {

                         addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindAddAddend, target.addend);

                         addFixup(src, ld::Fixup::k4of4, setKind);

3208 } else

3209 #endif

3210 {

                         addFixup(src, ld::Fixup::k2of3, ld::Fixup::kindAddAddend, target.addend);

                         addFixup(src, ld::Fixup::k3of3, setKind);

3213 }

3214 }

3215 }

3216

3217 template <typename A>

 void Parser<A>::addFixups(const SourceLocation& src, ld::Fixup::Kind kind, const TargetDesc& target, const TargetDesc& picBase)

3219 {

         ld::Fixup::Cluster cl = (target.addend == 0) ? ld::Fixup::k1of4 : ld::Fixup::k1of5;

         if ( target.atom != NULL ) {

                 if ( target.atom->scope() == ld::Atom::scopeTranslationUnit ) {

                         addFixup(src, cl, ld::Fixup::kindSetTargetAddress, target.atom);

3224 }

                 else if ( (target.atom->combine() == ld::Atom::combineByNameAndContent) || (target.atom->combine() == ld::Atom::combineByNameAndReferences) ) {

                         addFixup(src, cl, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, target.atom);

3227 }

3228 else {

                         addFixup(src, cl, ld::Fixup::kindSetTargetAddress, false, target.atom->name());

3230 }

3231 }

3232 else {

                 addFixup(src, cl, ld::Fixup::kindSetTargetAddress, target.weakImport, target.name);

3234 }

         if ( target.addend == 0 ) {

                 assert(picBase.atom != NULL);

                 addFixup(src, ld::Fixup::k2of4, ld::Fixup::kindSubtractTargetAddress, picBase.atom);

                 addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindSubtractAddend, picBase.addend);

                 addFixup(src, ld::Fixup::k4of4, kind);

3240 }

3241 else {

                 addFixup(src, ld::Fixup::k2of5, ld::Fixup::kindAddAddend, target.addend);

                 addFixup(src, ld::Fixup::k3of5, ld::Fixup::kindSubtractTargetAddress, picBase.atom);

                 addFixup(src, ld::Fixup::k4of5, ld::Fixup::kindSubtractAddend, picBase.addend);

                 addFixup(src, ld::Fixup::k5of5, kind);

3246 }

3247 }

3248

3249

3250

3251 template <typename A>

 uint32_t TentativeDefinitionSection<A>::computeAtomCount(class Parser<A>& parser, 

                                                                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it, 

3254 const struct Parser<A>::CFI_CU_InfoArrays&)

3255 {

3256 return parser.tentativeDefinitionCount();

3257 }

3258

3259 template <typename A>

 uint32_t TentativeDefinitionSection<A>::appendAtoms(class Parser<A>& parser, uint8_t* p, 

                                                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, 

3262 const struct Parser<A>::CFI_CU_InfoArrays&)

3263 {

         this->_beginAtoms = (Atom<A>*)p;

3265 uint32_t count = 0;

         for (uint32_t i=parser.undefinedStartIndex(); i < parser.undefinedEndIndex(); ++i) {

                 const macho_nlist<P>& sym =     parser.symbolFromIndex(i);

                 if ( ((sym.n_type() & N_TYPE) == N_UNDF) && (sym.n_value() != 0) ) {

                         uint64_t size = sym.n_value();

                         uint8_t alignP2 = GET_COMM_ALIGN(sym.n_desc());

                         if ( alignP2 == 0 ) {

3272 // common symbols align to their size

3273 // that is, a 4-byte common aligns to 4-bytes

3274 // if this size is not a power of two,

3275 // then round up to the next power of two

                                 alignP2 = 63 - (uint8_t)__builtin_clzll(size);

                                 if ( size != (1ULL << alignP2) )

3278 ++alignP2;

3279 // <rdar://problem/24871389> limit default alignment of large commons

                                 if ( alignP2 > parser.maxDefaultCommonAlignment() )

3281 alignP2 = parser.maxDefaultCommonAlignment();

3282 }

                         Atom<A>* allocatedSpace = (Atom<A>*)p;

                         new (allocatedSpace) Atom<A>(*this, parser.nameFromSymbol(sym), (pint_t)ULLONG_MAX, size,

                                                                                 ld::Atom::definitionTentative,  ld::Atom::combineByName, 

                                                                                 parser.scopeFromSymbol(sym), ld::Atom::typeZeroFill, ld::Atom::symbolTableIn, 

                                                                                 parser.dontDeadStripFromSymbol(sym), false, false, ld::Atom::Alignment(alignP2) );

                         p += sizeof(Atom<A>);

3289 ++count;

3290 }

3291 }

         this->_endAtoms = (Atom<A>*)p;

3293 return count;

3294 }

3295

3296

3297 template <typename A>

 uint32_t AbsoluteSymbolSection<A>::computeAtomCount(class Parser<A>& parser, 

                                                                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it, 

3300 const struct Parser<A>::CFI_CU_InfoArrays&)

3301 {

3302 return parser.absoluteSymbolCount();

3303 }

3304

3305 template <typename A>

 uint32_t AbsoluteSymbolSection<A>::appendAtoms(class Parser<A>& parser, uint8_t* p, 

                                                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, 

3308 const struct Parser<A>::CFI_CU_InfoArrays&)

3309 {

         this->_beginAtoms = (Atom<A>*)p;

3311 uint32_t count = 0;

         for (uint32_t i=0; i < parser.symbolCount(); ++i) {

                 const macho_nlist<P>& sym =     parser.symbolFromIndex(i);

                 if ( (sym.n_type() & N_TYPE) != N_ABS )

3315 continue;

                 const char* absName = parser.nameFromSymbol(sym);

3317 // ignore .objc_class_name_* symbols

                 if ( strncmp(absName, ".objc_class_name_", 17) == 0 )

3319 continue;

3320 // ignore .objc_class_name_* symbols

                 if ( strncmp(absName, ".objc_category_name_", 20) == 0 )

3322 continue;

3323 // ignore empty *.eh symbols

                 if ( strcmp(&absName[strlen(absName)-3], ".eh") == 0 )

3325 continue;

3326

                 Atom<A>* allocatedSpace = (Atom<A>*)p;

                 new (allocatedSpace) Atom<A>(*this, parser, sym, 0);

                 p += sizeof(Atom<A>);

3330 ++count;

3331 }

         this->_endAtoms = (Atom<A>*)p;

3333 return count;

3334 }

3335

3336 template <typename A>

 Atom<A>* AbsoluteSymbolSection<A>::findAbsAtomForValue(typename A::P::uint_t value)

3338 {

         Atom<A>* end = this->_endAtoms;

         for(Atom<A>* p = this->_beginAtoms; p < end; ++p) {

                 if ( p->_objAddress == value )  

3342 return p;

3343 }

3344 return NULL;

3345 }

3346

3347

3348 template <typename A>

 uint32_t Parser<A>::indirectSymbol(uint32_t indirectIndex)

3350 {

3351 if ( indirectIndex >= _indirectTableCount )

3352 throw "indirect symbol index out of range";

         return E::get32(_indirectTable[indirectIndex]);

3354 }

3355

3356 template <typename A>

 const macho_nlist<typename A::P>& Parser<A>::symbolFromIndex(uint32_t index)

3358 {

3359 if ( index > _symbolCount )

3360 throw "symbol index out of range";

3361 return _symbols[index];

3362 }

3363

3364 template <typename A>

 const macho_section<typename A::P>*     Parser<A>::machOSectionFromSectionIndex(uint32_t index)

3366 {

3367 if ( index >= _machOSectionsCount )

3368 throw "section index out of range";

3369 return &_sectionsStart[index];

3370 }

3371

3372 template <typename A>

 uint32_t Parser<A>::symbolIndexFromIndirectSectionAddress(pint_t addr, const macho_section<P>* sect)

3374 {

3375 uint32_t elementSize = 0;

         switch ( sect->flags() & SECTION_TYPE ) {

3377 case S_SYMBOL_STUBS:

3378 elementSize = sect->reserved2();

3379 break;

3380 case S_LAZY_SYMBOL_POINTERS:

3381 case S_NON_LAZY_SYMBOL_POINTERS:

3382 case S_THREAD_LOCAL_VARIABLE_POINTERS:

3383 elementSize = sizeof(pint_t);

3384 break;

3385 default:

3386 throw "section does not use indirect symbol table";

3387 }

         uint32_t indexInSection = (addr - sect->addr()) / elementSize;

         uint32_t indexIntoIndirectTable = sect->reserved1() + indexInSection;

         return this->indirectSymbol(indexIntoIndirectTable);

3391 }

3392

3393

3394

3395 template <typename A>

 const char* Parser<A>::nameFromSymbol(const macho_nlist<P>& sym)

3397 {

         return &_strings[sym.n_strx()];

3399 }

3400

3401 template <typename A>

 ld::Atom::Scope Parser<A>::scopeFromSymbol(const macho_nlist<P>& sym)

3403 {

         if ( (sym.n_type() & N_EXT) == 0 )

                 return ld::Atom::scopeTranslationUnit;

         else if ( (sym.n_type() & N_PEXT) != 0 )

                 return ld::Atom::scopeLinkageUnit;

         else if ( this->nameFromSymbol(sym)[0] == 'l' ) // since all 'l' symbols will be remove, don't make them global

                 return ld::Atom::scopeLinkageUnit;

3410 else

                 return ld::Atom::scopeGlobal;

3412 }

3413

3414 template <typename A>

 ld::Atom::Definition Parser<A>::definitionFromSymbol(const macho_nlist<P>& sym)

3416 {

         switch ( sym.n_type() & N_TYPE ) {

3418 case N_ABS:

                         return ld::Atom::definitionAbsolute;

3420 case N_SECT:

                         return ld::Atom::definitionRegular;

3422 case N_UNDF:

                         if ( sym.n_value() != 0 ) 

                                 return ld::Atom::definitionTentative;

3425 }

3426 throw "definitionFromSymbol() bad symbol";

3427 }

3428

3429 template <typename A>

 ld::Atom::Combine Parser<A>::combineFromSymbol(const macho_nlist<P>& sym)

3431 {

         if ( sym.n_desc() & N_WEAK_DEF ) 

                 return ld::Atom::combineByName;

3434 else

                 return ld::Atom::combineNever;

3436 }

3437

3438

3439 template <typename A>

 ld::Atom::SymbolTableInclusion Parser<A>::inclusionFromSymbol(const macho_nlist<P>& sym)

3441 {

         const char* symbolName = nameFromSymbol(sym);

3443 // labels beginning with 'l' (lowercase ell) are automatically removed in final linked images <rdar://problem/4571042>

3444 // labels beginning with 'L' should have been stripped by the assembler, so are stripped now

         if ( sym.n_desc() & REFERENCED_DYNAMICALLY ) 

                 return ld::Atom::symbolTableInAndNeverStrip;

         else if ( symbolName[0] == 'l' )

                 return ld::Atom::symbolTableNotInFinalLinkedImages;

         else if ( symbolName[0] == 'L' )

                 return ld::Atom::symbolTableNotIn;

3451 else

                 return ld::Atom::symbolTableIn;

3453 }

3454

3455 template <typename A>

 bool Parser<A>::dontDeadStripFromSymbol(const macho_nlist<P>& sym)

3457 {

         return ( (sym.n_desc() & (N_NO_DEAD_STRIP|REFERENCED_DYNAMICALLY)) != 0 );

3459 }

3460

3461 template <typename A>

 bool Parser<A>::isThumbFromSymbol(const macho_nlist<P>& sym)

3463 {

         return ( sym.n_desc() & N_ARM_THUMB_DEF );

3465 }

3466

3467 template <typename A>

 bool Parser<A>::weakImportFromSymbol(const macho_nlist<P>& sym)

3469 {

         return ( ((sym.n_type() & N_TYPE) == N_UNDF) && ((sym.n_desc() & N_WEAK_REF) != 0) );

3471 }

3472

3473 template <typename A>

 bool Parser<A>::resolverFromSymbol(const macho_nlist<P>& sym)

3475 {

         return ( sym.n_desc() & N_SYMBOL_RESOLVER );

3477 }

3478

3479 template <typename A>

 bool Parser<A>::altEntryFromSymbol(const macho_nlist<P>& sym)

3481 {

         return ( sym.n_desc() & N_ALT_ENTRY );

3483 }

3484

3485

/* Advance *OFFSET past one LEB128 value (signed or unsigned).
   Every byte with the high bit set is a continuation byte; the first byte
   without it ends the value and is consumed too.  Never moves past END.  */
static void
skip_leb128 (const uint8_t ** offset, const uint8_t * end)
{
  const uint8_t * cursor = *offset;
  while (cursor != end)
    {
      const uint8_t byte = *cursor++;
      if (byte < 0x80)
	break;
    }
  *offset = cursor;
}

3495

/* Decode one ULEB128 value starting at *OFFSET into a 64-bit word and
   advance *OFFSET past it.  Returns (uint64_t)-1 if END is reached before
   the value terminates, or if the value does not fit in 64 bits; in the
   overflow case the remaining bytes of the value are still consumed.  */
static uint64_t
read_uleb128 (const uint8_t ** offset, const uint8_t * end)
{
  uint64_t value = 0;
  int shift = 0;

  for (;;)
    {
      if (*offset == end)
	return (uint64_t) -1;

      const uint8_t byte = *(*offset)++;
      const uint64_t payload = byte & 0x7f;

      /* The payload fits only if shifting it into place loses no bits.  */
      const bool fits = (shift < 64) && (((payload << shift) >> shift) == payload);
      if (fits)
	{
	  value |= payload << shift;
	  shift += 7;
	}
      else
	value = (uint64_t) -1;

      if (byte < 0x80)
	break;
    }
  return value;
}

3519

3520

3521 /* Skip over a DWARF attribute of form FORM. */

3522 template <typename A>

 bool Parser<A>::skip_form(const uint8_t ** offset, const uint8_t * end, uint64_t form,

3524 uint8_t addr_size, bool dwarf64)

3525 {

3526 int64_t sz=0;

3527

3528 switch (form)

3529 {

3530 case DW_FORM_addr:

3531 sz = addr_size;

3532 break;

3533

3534 case DW_FORM_block2:

       if (end - *offset < 2)

3536 return false;

       sz = 2 + A::P::E::get16(*(uint16_t*)offset);

3538 break;

3539

3540 case DW_FORM_block4:

       if (end - *offset < 4)

3542 return false;

       sz = 2 + A::P::E::get32(*(uint32_t*)offset);

3544 break;

3545

3546 case DW_FORM_data2:

3547 case DW_FORM_ref2:

3548 sz = 2;

3549 break;

3550

3551 case DW_FORM_data4:

3552 case DW_FORM_ref4:

3553 sz = 4;

3554 break;

3555

3556 case DW_FORM_data8:

3557 case DW_FORM_ref8:

3558 sz = 8;

3559 break;

3560

3561 case DW_FORM_string:

       while (*offset != end && **offset)

3563 ++*offset;

3564 case DW_FORM_data1:

3565 case DW_FORM_flag:

3566 case DW_FORM_ref1:

3567 sz = 1;

3568 break;

3569

3570 case DW_FORM_block:

       sz = read_uleb128 (offset, end);

3572 break;

3573

3574 case DW_FORM_block1:

3575 if (*offset == end)

3576 return false;

3577 sz = 1 + **offset;

3578 break;

3579

3580 case DW_FORM_sdata:

3581 case DW_FORM_udata:

3582 case DW_FORM_ref_udata:

3583 skip_leb128 (offset, end);

3584 return true;

3585

3586 case DW_FORM_strp:

3587 case DW_FORM_ref_addr:

3588 sz = 4;

3589 break;

3590

3591 case DW_FORM_sec_offset:

           sz = sizeof(typename A::P::uint_t);

3593 break;

3594

3595 case DW_FORM_exprloc:

       sz = read_uleb128 (offset, end);

3597 break;

3598

3599 case DW_FORM_flag_present:

3600 sz = 0;

3601 break;

3602

3603 case DW_FORM_ref_sig8:

3604 sz = 8;

3605 break;

3606

3607 default:

3608 return false;

3609 }

   if (end - *offset < sz)

3611 return false;

3612 *offset += sz;

3613 return true;

3614 }

3615

3616

3617 template <typename A>

 const char* Parser<A>::getDwarfString(uint64_t form, const uint8_t*& di)

3619 {

3620 uint32_t offset;

3621 const char* dwarfStrings;

3622 const char* result = NULL;

3623 switch (form) {

3624 case DW_FORM_string:

3625 result = (const char*)di;

                         di += strlen(result) + 1;

3627 break;

3628 case DW_FORM_strp:

                         offset = E::get32(*((uint32_t*)di));

                         dwarfStrings = (char*)_file->fileContent() + _file->_dwarfDebugStringSect->offset();

                         if ( offset < _file->_dwarfDebugStringSect->size() )

3632 result = &dwarfStrings[offset];

3633 else

                                 warning("dwarf DW_FORM_strp (offset=0x%08X) is too big in %s", offset, this->_path);

3635 di += 4;

3636 break;

3637 default:

                         warning("unknown dwarf string encoding (form=%lld) in %s", form, this->_path);

3639 break;

3640 }

3641 return result;

3642 }

3643

3644 template <typename A>

 uint64_t Parser<A>::getDwarfOffset(uint64_t form, const uint8_t*& di, bool dwarf64)

3646 {

3647 if ( form == DW_FORM_sec_offset )

3648 form = (dwarf64 ? DW_FORM_data8 : DW_FORM_data4);

3649 uint64_t result = -1;

3650 switch (form) {

3651 case DW_FORM_data4:

                         result = A::P::E::get32(*(uint32_t*)di);

3653 di += 4;

3654 break;

3655 case DW_FORM_data8:

                         result = A::P::E::get64(*(uint64_t*)di);

3657 di += 8;

3658 break;

3659 default:

                         warning("unknown dwarf DW_FORM_ for DW_AT_stmt_list in %s", this->_path);

3661 }

3662 return result;

3663 }

3664

3665

3666 template <typename A>

3667 struct AtomAndLineInfo {

3668 Atom<A>* atom;

         ld::Atom::LineInfo      info;

3670 };

3671

3672

3673 // <rdar://problem/5591394> Add support to ld64 for N_FUN stabs when used for symbolic constants

3674 // Returns whether a stabStr belonging to an N_FUN stab represents a

3675 // symbolic constant rather than a function

3676 template <typename A>

 bool Parser<A>::isConstFunStabs(const char *stabStr)

3678 {

3679 const char* colon;

3680 // N_FUN can be used for both constants and for functions. In case it's a constant,

3681 // the format of the stabs string is "symname:c=<value>;"

3682 // ':' cannot appear in the symbol name, except if it's an Objective-C method

3683 // (in which case the symbol name starts with + or -, and then it's definitely

3684 // not a constant)

         return (stabStr != NULL) && (stabStr[0] != '+') && (stabStr[0] != '-')

                         && ((colon = strchr(stabStr, ':')) != NULL)

                         && (colon[1] == 'c') && (colon[2] == '=');

3688 }

3689

3690

3691 template <typename A>

 void Parser<A>::parseDebugInfo()

3693 {

3694 addAstFiles();

3695

3696 // check for dwarf __debug_info section

         if ( _file->_dwarfDebugInfoSect == NULL ) {

3698 // if no DWARF debug info, look for stabs

3699 this->parseStabs();

3700 return;

3701 }

         if ( _file->_dwarfDebugInfoSect->size() == 0 )

3703 return;

3704

3705 uint64_t stmtList;

3706 const char* tuDir;

3707 const char* tuName;

         if ( !read_comp_unit(&tuName, &tuDir, &stmtList) ) {

3709 // if can't parse dwarf, warn and give up

3710 _file->_dwarfTranslationUnitPath = NULL;

                 warning("can't parse dwarf compilation unit info in %s", _path);

                 _file->_debugInfoKind = ld::relocatable::File::kDebugInfoNone;

3713 return;

3714 }

         if ( (tuName != NULL) && (tuName[0] == '/') ) {

3716 _file->_dwarfTranslationUnitPath = tuName;

3717 }

         else if ( (tuDir != NULL) && (tuName != NULL) ) {

                 asprintf((char**)&(_file->_dwarfTranslationUnitPath), "%s/%s", tuDir, tuName);

3720 }

3721 else if ( tuDir == NULL ) {

3722 _file->_dwarfTranslationUnitPath = tuName;

3723 }

3724 else {

3725 _file->_dwarfTranslationUnitPath = NULL;

3726 }

3727

3728 // add line number info to atoms from dwarf

         std::vector<AtomAndLineInfo<A> > entries;

         entries.reserve(64);

         if ( _file->_debugInfoKind == ld::relocatable::File::kDebugInfoDwarf ) {

3732 // file with just data will have no __debug_line info

                 if ( (_file->_dwarfDebugLineSect != NULL) && (_file->_dwarfDebugLineSect->size() != 0) ) {

3734 // validate stmt_list

                         if ( (stmtList != (uint64_t)-1) && (stmtList < _file->_dwarfDebugLineSect->size()) ) {

                                 const uint8_t* debug_line = (uint8_t*)_file->fileContent() + _file->_dwarfDebugLineSect->offset();

                                 struct line_reader_data* lines = line_open(&debug_line[stmtList],

                                                                                                                 _file->_dwarfDebugLineSect->size() - stmtList, E::little_endian);

3739 struct line_info result;

3740 Atom<A>* curAtom = NULL;

3741 uint32_t curAtomOffset = 0;

3742 uint32_t curAtomAddress = 0;

3743 uint32_t curAtomSize = 0;

                                 std::map<uint32_t,const char*>  dwarfIndexToFile;

3745 if ( lines != NULL ) {

                                         while ( line_next(lines, &result, line_stop_pc) ) {

3747 //fprintf(stderr, "curAtom=%p, result.pc=0x%llX, result.line=%llu, result.end_of_sequence=%d,"

3748 // " curAtomAddress=0x%X, curAtomSize=0x%X\n",

3749 // curAtom, result.pc, result.line, result.end_of_sequence, curAtomAddress, curAtomSize);

3750 // work around weird debug line table compiler generates if no functions in __text section

                                                 if ( (curAtom == NULL) && (result.pc == 0) && result.end_of_sequence && (result.file == 1))

3752 continue;

3753 // for performance, see if in next pc is in current atom

                                                 if ( (curAtom != NULL) && (curAtomAddress <= result.pc) && (result.pc < (curAtomAddress+curAtomSize)) ) {

3755 curAtomOffset = result.pc - curAtomAddress;

3756 }

3757 // or pc at end of current atom

                                                 else if ( result.end_of_sequence && (curAtom != NULL) && (result.pc == (curAtomAddress+curAtomSize)) ) {

3759 curAtomOffset = result.pc - curAtomAddress;

3760 }

3761 // or only one function that is a one line function

                                                 else if ( result.end_of_sequence && (curAtom == NULL) && (this->findAtomByAddress(0) != NULL) && (result.pc == this->findAtomByAddress(0)->size()) ) {

                                                         curAtom                 = this->findAtomByAddress(0);

                                                         curAtomOffset   = result.pc - curAtom->objectAddress();

3765 curAtomAddress = curAtom->objectAddress();

3766 curAtomSize = curAtom->size();

3767 }

3768 else {

3769 // do slow look up of atom by address

3770 try {

                                                                 curAtom = this->findAtomByAddress(result.pc);

3772 }

3773 catch (...) {

3774 // in case of bug in debug info, don't abort link, just limp on

3775 curAtom = NULL;

3776 }

3777 if ( curAtom == NULL )

3778 break; // file has line info but no functions

                                                         if ( result.end_of_sequence && (curAtomAddress+curAtomSize < result.pc) ) {     

3780 // a one line function can be returned by line_next() as one entry with pc at end of blob

3781 // look for alt atom starting at end of previous atom

3782 uint32_t previousEnd = curAtomAddress+curAtomSize;

                                                                 Atom<A>* alt = this->findAtomByAddressOrNullIfStub(previousEnd);

3784 if ( alt == NULL )

3785 continue; // ignore spurious debug info for stubs

                                                                 if ( result.pc <= alt->objectAddress() + alt->size() ) {

3787 curAtom = alt;

                                                                         curAtomOffset   = result.pc - alt->objectAddress();

3789 curAtomAddress = alt->objectAddress();

3790 curAtomSize = alt->size();

3791 }

3792 else {

                                                                         curAtomOffset   = result.pc - curAtom->objectAddress();

3794 curAtomAddress = curAtom->objectAddress();

3795 curAtomSize = curAtom->size();

3796 }

3797 }

3798 else {

                                                                 curAtomOffset   = result.pc - curAtom->objectAddress();

3800 curAtomAddress = curAtom->objectAddress();

3801 curAtomSize = curAtom->size();

3802 }

3803 }

3804 const char* filename;

                                                 std::map<uint32_t,const char*>::iterator pos = dwarfIndexToFile.find(result.file);

                                                 if ( pos == dwarfIndexToFile.end() ) {

                                                         filename = line_file(lines, result.file);

3808 dwarfIndexToFile[result.file] = filename;

3809 }

3810 else {

3811 filename = pos->second;

3812 }

3813 // only record for ~8000 line info records per function

                                                 if ( curAtom->roomForMoreLineInfoCount() ) {

3815 AtomAndLineInfo<A> entry;

3816 entry.atom = curAtom;

3817 entry.info.atomOffset = curAtomOffset;

3818 entry.info.fileName = filename;

                                                         entry.info.lineNumber = result.line;

3820 //fprintf(stderr, "addr=0x%08llX, line=%lld, file=%s, atom=%s, atom.size=0x%X, end=%d\n",

3821 // result.pc, result.line, filename, curAtom->name(), curAtomSize, result.end_of_sequence);

3822 entries.push_back(entry);

3823 curAtom->incrementLineInfoCount();

3824 }

3825 if ( result.end_of_sequence ) {

3826 curAtom = NULL;

3827 }

3828 }

3829 line_free(lines);

3830 }

3831 }

3832 }

3833 }

3834

3835 // assign line info start offset for each atom

         uint8_t* p = _file->_atomsArray;

3837 uint32_t liOffset = 0;

         for(int i=_file->_atomsArrayCount; i > 0; --i) {

                 Atom<A>* atom = (Atom<A>*)p;

3840 atom->_lineInfoStartIndex = liOffset;

3841 liOffset += atom->_lineInfoCount;

3842 atom->_lineInfoCount = 0;

                 p += sizeof(Atom<A>);

3844 }

         assert(liOffset == entries.size());

         _file->_lineInfos.resize(liOffset);

3847

3848 // copy each line info for each atom

         for (typename std::vector<AtomAndLineInfo<A> >::iterator it = entries.begin(); it != entries.end(); ++it) {

                 uint32_t slot = it->atom->_lineInfoStartIndex + it->atom->_lineInfoCount;

                 _file->_lineInfos[slot] = it->info;

3852 it->atom->_lineInfoCount++;

3853 }

3854

3855 // done with temp vector

3856 entries.clear();

3857 }

3858

3859 template <typename A>

 void Parser<A>::parseStabs()

3861 {

3862 // scan symbol table for stabs entries

3863 Atom<A>* currentAtom = NULL;

3864 pint_t currentAtomAddress = 0;

         enum { start, inBeginEnd, inFun } state = start;

         for (uint32_t symbolIndex = 0; symbolIndex < _symbolCount; ++symbolIndex ) {

                 const macho_nlist<P>& sym = this->symbolFromIndex(symbolIndex);

3868 bool useStab = true;

                 uint8_t type = sym.n_type();

                 const char* symString = (sym.n_strx() != 0) ? this->nameFromSymbol(sym) : NULL;

                 if ( (type & N_STAB) != 0 ) {

                         _file->_debugInfoKind =  (_hasUUID ? ld::relocatable::File::kDebugInfoStabsUUID : ld::relocatable::File::kDebugInfoStabs);

                         ld::relocatable::File::Stab stab;

3874 stab.atom = NULL;

3875 stab.type = type;

                         stab.other      = sym.n_sect();

                         stab.desc       = sym.n_desc();

                         stab.value      = sym.n_value();

3879 stab.string = NULL;

3880 switch (state) {

3881 case start:

3882 switch (type) {

3883 case N_BNSYM:

3884 // beginning of function block

3885 state = inBeginEnd;

3886 // fall into case to lookup atom by addresss

3887 case N_LCSYM:

3888 case N_STSYM:

3889 currentAtomAddress = sym.n_value();

                                                         currentAtom = this->findAtomByAddress(currentAtomAddress);

3891 if ( currentAtom != NULL ) {

3892 stab.atom = currentAtom;

3893 stab.string = symString;

3894 }

3895 else {

                                                                 fprintf(stderr, "can't find atom for stabs BNSYM at %08llX in %s",

                                                                         (uint64_t)sym.n_value(), _path);

3898 }

3899 break;

3900 case N_SO:

3901 case N_OSO:

3902 case N_OPT:

3903 case N_LSYM:

3904 case N_RSYM:

3905 case N_PSYM:

3906 case N_AST:

3907 // not associated with an atom, just copy

3908 stab.string = symString;

3909 break;

3910 case N_GSYM:

3911 {

3912 // n_value field is NOT atom address ;-(

3913 // need to find atom by name match

                                                         const char* colon = strchr(symString, ':');

3915 if ( colon != NULL ) {

3916 // build underscore leading name

3917 int nameLen = colon - symString;

                                                                 char symName[nameLen+2];

                                                                 strlcpy(&symName[1], symString, nameLen+1);

                                                                 symName[0] = '_';

                                                                 symName[nameLen+1] = '\0';

                                                                 currentAtom = this->findAtomByName(symName);

3923 if ( currentAtom != NULL ) {

3924 stab.atom = currentAtom;

3925 stab.string = symString;

3926 }

3927 }

3928 else {

3929 // might be a debug-note without trailing :G()

                                                                 currentAtom = this->findAtomByName(symString);

3931 if ( currentAtom != NULL ) {

3932 stab.atom = currentAtom;

3933 stab.string = symString;

3934 }

3935 }

                                                         if ( stab.atom == NULL ) {

3937 // ld_classic added bogus GSYM stabs for old style dtrace probes

                                                                 if ( (strncmp(symString, "__dtrace_probe$", 15) != 0) )

                                                                         warning("can't find atom for N_GSYM stabs %s in %s", symString, _path);

3940 useStab = false;

3941 }

3942 break;

3943 }

3944 case N_FUN:

                                                         if ( isConstFunStabs(symString) ) {

3946 // constant not associated with a function

3947 stab.string = symString;

3948 }

3949 else {

3950 // old style stabs without BNSYM

3951 state = inFun;

3952 currentAtomAddress = sym.n_value();

                                                                 currentAtom = this->findAtomByAddress(currentAtomAddress);

3954 if ( currentAtom != NULL ) {

3955 stab.atom = currentAtom;

3956 stab.string = symString;

3957 }

3958 else {

                                                                         warning("can't find atom for stabs FUN at %08llX in %s",

                                                                                 (uint64_t)currentAtomAddress, _path);

3961 }

3962 }

3963 break;

3964 case N_SOL:

3965 case N_SLINE:

3966 stab.string = symString;

3967 // old stabs

3968 break;

3969 case N_BINCL:

3970 case N_EINCL:

3971 case N_EXCL:

3972 stab.string = symString;

3973 // -gfull built .o file

3974 break;

3975 default:

                                                         warning("unknown stabs type 0x%X in %s", type, _path);

3977 }

3978 break;

3979 case inBeginEnd:

3980 stab.atom = currentAtom;

3981 switch (type) {

3982 case N_ENSYM:

3983 state = start;

3984 currentAtom = NULL;

3985 break;

3986 case N_LCSYM:

3987 case N_STSYM:

3988 {

                                                         Atom<A>* nestedAtom = this->findAtomByAddress(sym.n_value());

3990 if ( nestedAtom != NULL ) {

3991 stab.atom = nestedAtom;

3992 stab.string = symString;

3993 }

3994 else {

                                                                 warning("can't find atom for stabs 0x%X at %08llX in %s",

                                                                         type, (uint64_t)sym.n_value(), _path);

3997 }

3998 break;

3999 }

4000 case N_LBRAC:

4001 case N_RBRAC:

4002 case N_SLINE:

4003 // adjust value to be offset in atom

4004 stab.value -= currentAtomAddress;

4005 default:

4006 stab.string = symString;

4007 break;

4008 }

4009 break;

4010 case inFun:

4011 switch (type) {

4012 case N_FUN:

                                                         if ( isConstFunStabs(symString) ) {

4014 stab.atom = currentAtom;

4015 stab.string = symString;

4016 }

4017 else {

                                                                 if ( sym.n_sect() != 0 ) {

4019 // found another start stab, must be really old stabs...

4020 currentAtomAddress = sym.n_value();

                                                                         currentAtom = this->findAtomByAddress(currentAtomAddress);

4022 if ( currentAtom != NULL ) {

4023 stab.atom = currentAtom;

4024 stab.string = symString;

4025 }

4026 else {

                                                                                 warning("can't find atom for stabs FUN at %08llX in %s",

                                                                                         (uint64_t)currentAtomAddress, _path);

4029 }

4030 }

4031 else {

4032 // found ending stab, switch back to start state

4033 stab.string = symString;

4034 stab.atom = currentAtom;

4035 state = start;

4036 currentAtom = NULL;

4037 }

4038 }

4039 break;

4040 case N_LBRAC:

4041 case N_RBRAC:

4042 case N_SLINE:

4043 // adjust value to be offset in atom

4044 stab.value -= currentAtomAddress;

4045 stab.atom = currentAtom;

4046 break;

4047 case N_SO:

4048 stab.string = symString;

4049 state = start;

4050 break;

4051 default:

4052 stab.atom = currentAtom;

4053 stab.string = symString;

4054 break;

4055 }

4056 break;

4057 }

4058 // add to list of stabs for this .o file

4059 if ( useStab )

                                 _file->_stabs.push_back(stab);

4061 }

4062 }

4063 }

4064

4065

4066 template <typename A>

 void Parser<A>::addAstFiles()

4068 {

4069 // scan symbol table for N_AST entries

         for (uint32_t symbolIndex = 0; symbolIndex < _symbolCount; ++symbolIndex ) {

                 const macho_nlist<P>& sym = this->symbolFromIndex(symbolIndex);

                 if ( (sym.n_type() == N_AST) &&  (sym.n_strx() != 0) ) {

                         const char* symString = this->nameFromSymbol(sym);

                         ld::relocatable::File::AstTimeAndPath entry;

                         entry.time = sym.n_value();

4076 entry.path = symString;

                         _file->_astFiles.push_back(entry);

4078 }

4079 }

4080 }

4081

4082

4083 // Look at the compilation unit DIE and determine

4084 // its NAME, compilation directory (in COMP_DIR) and its

4085 // line number information offset (in STMT_LIST). NAME and COMP_DIR

4086 // may be NULL (especially COMP_DIR) if they are not in the .o file;

4087 // STMT_LIST will be (uint64_t) -1.

4088 //

4089 // At present this assumes that there's only one compilation unit DIE.

4090 //

4091 template <typename A>

 bool Parser<A>::read_comp_unit(const char ** name, const char ** comp_dir,

4093 uint64_t *stmt_list)

4094 {

4095 const uint8_t * debug_info;

4096 const uint8_t * debug_abbrev;

4097 const uint8_t * di;

4098 const uint8_t * next_cu;

4099 const uint8_t * da;

4100 const uint8_t * end;

4101 const uint8_t * enda;

4102 uint64_t sz;

4103 uint16_t vers;

4104 uint64_t abbrev_base;

4105 uint64_t abbrev;

4106 uint8_t address_size;

4107 bool dwarf64;

4108

4109 *name = NULL;

4110 *comp_dir = NULL;

         *stmt_list = (uint64_t) -1;

4112

         if ( (_file->_dwarfDebugInfoSect == NULL) || (_file->_dwarfDebugAbbrevSect == NULL) )

4114 return false;

4115

         if (_file->_dwarfDebugInfoSect->size() < 12)

4117 /* Too small to be a real debug_info section. */

4118 return false;

4119

     debug_info = (uint8_t*)_file->fileContent() + _file->_dwarfDebugInfoSect->offset();

     debug_abbrev = (uint8_t*)_file->fileContent() + _file->_dwarfDebugAbbrevSect->offset();

4122 next_cu = debug_info;

4123

     while ((uint64_t)(next_cu - debug_info) < _file->_dwarfDebugInfoSect->size()) {

4125 di = next_cu;

         sz = A::P::E::get32(*(uint32_t*)di);

4127 di += 4;

4128 dwarf64 = sz == 0xffffffff;

4129 if (dwarf64)

             sz = A::P::E::get64(*(uint64_t*)di), di += 8;

         else if (sz > 0xffffff00)

4132 /* Unknown dwarf format. */

4133 return false;

4134

4135 /* Verify claimed size. */

         if (sz + (di - debug_info) > _file->_dwarfDebugInfoSect->size() || sz <= (dwarf64 ? 23 : 11))

4137 return false;

4138

4139 next_cu = di + sz;

4140

         vers = A::P::E::get16(*(uint16_t*)di);

         if (vers < 2 || vers > 4)

4143 /* DWARF version wrong for this code.

4144 Chances are we could continue anyway, but we don't know for sure. */

4145 return false;

4146 di += 2;

4147

4148 /* Find the debug_abbrev section. */

         abbrev_base = dwarf64 ? A::P::E::get64(*(uint64_t*)di) : A::P::E::get32(*(uint32_t*)di);

         di += dwarf64 ? 8 : 4;

4151

         if (abbrev_base > _file->_dwarfDebugAbbrevSect->size())

4153 return false;

4154 da = debug_abbrev + abbrev_base;

         enda = debug_abbrev + _file->_dwarfDebugAbbrevSect->size();

4156

4157 address_size = *di++;

4158

4159 /* Find the abbrev number we're looking for. */

4160 end = di + sz;

         abbrev = read_uleb128 (&di, end);

         if (abbrev == (uint64_t) -1)

4163 return false;

4164

4165 /* Skip through the debug_abbrev section looking for that abbrev. */

4166 for (;;)

4167 {

             uint64_t this_abbrev = read_uleb128 (&da, enda);

4169 uint64_t attr;

4170

4171 if (this_abbrev == abbrev)

4172 /* This is almost always taken. */

4173 break;

             skip_leb128 (&da, enda); /* Skip the tag.  */

4175 if (da == enda)

4176 return false;

4177 da++; /* Skip the DW_CHILDREN_* value. */

4178

4179 do {

                 attr = read_uleb128 (&da, enda);

4181 skip_leb128 (&da, enda);

             } while (attr != 0 && attr != (uint64_t) -1);

             if (attr != 0)

4184 return false;

4185 }

4186

4187 /* Check that the abbrev is one for a DW_TAG_compile_unit. */

         if (read_uleb128 (&da, enda) != DW_TAG_compile_unit)

4189 return false;

4190 if (da == enda)

4191 return false;

4192 da++; /* Skip the DW_CHILDREN_* value. */

4193

4194 /* Now, go through the DIE looking for DW_AT_name,

4195 DW_AT_comp_dir, and DW_AT_stmt_list. */

4196 bool skip_to_next_cu = false;

4197 while (!skip_to_next_cu) {

4198

             uint64_t attr = read_uleb128 (&da, enda);

             uint64_t form = read_uleb128 (&da, enda);

4201

             if (attr == (uint64_t) -1)

4203 return false;

             else if (attr == 0)

4205 return true;

4206 if (form == DW_FORM_indirect)

                 form = read_uleb128 (&di, end);

4208

4209 switch (attr) {

4210 case DW_AT_name:

                     *name = getDwarfString(form, di);

4212 /* Swift object files may contain two CUs: One

4213 describes the Swift code, one is created by the

4214 clang importer. Skip over the CU created by the

4215 clang importer as it may be empty. */

                     if (std::string(*name) == "<swift-imported-modules>")

4217 skip_to_next_cu = true;

4218 break;

4219 case DW_AT_comp_dir:

                     *comp_dir = getDwarfString(form, di);

4221 break;

4222 case DW_AT_stmt_list:

                     *stmt_list = getDwarfOffset(form, di, dwarf64);

4224 break;

4225 default:

                     if (! skip_form (&di, end, form, address_size, dwarf64))

4227 return false;

4228 }

4229 }

4230 }

4231 return false;

4232 }

4233

4234

4235

4236 template <typename A>

4237 File<A>::~File()

4238 {

4239 free(_sectionsArray);

4240 free(_atomsArray);

4241 }

4242

4243 template <typename A>

 const char* File<A>::translationUnitSource() const

4245 {

4246 return _dwarfTranslationUnitPath;

4247 }

4248

4249 template <typename A>

 bool File<A>::forEachAtom(ld::File::AtomHandler& handler) const

4251 {

         handler.doFile(*this);

4253 uint8_t* p = _atomsArray;

         for(int i=_atomsArrayCount; i > 0; --i) {

                 handler.doAtom(*((Atom<A>*)p));

                 p += sizeof(Atom<A>);

4257 }

4258 p = _aliasAtomsArray;

         for(int i=_aliasAtomsArrayCount; i > 0; --i) {

                 handler.doAtom(*((AliasAtom*)p));

4261 p += sizeof(AliasAtom);

4262 }

4263

         return (_atomsArrayCount != 0) || (_aliasAtomsArrayCount != 0);

4265 }

4266

4267 template <typename A>

 const char* Section<A>::makeSegmentName(const macho_section<typename A::P>* sect)

4269 {

4270 // mach-o section record only has room for 16-byte seg/sect names

4271 // so a 16-byte name has no trailing zero

         const char* name = sect->segname();

         if ( strlen(name) < 16 ) 

4274 return name;

         char* tmp = new char[17];

         strlcpy(tmp, name, 17);

4277 return tmp;

4278 }

4279

4280 template <typename A>

 const char* Section<A>::makeSectionName(const macho_section<typename A::P>* sect)

4282 {

         const char* name = sect->sectname();

         if ( strlen(name) < 16 ) 

4285 return name;

4286

4287 // special case common long section names so we don't have to malloc

         if ( strncmp(sect->sectname(), "__objc_classrefs", 16) == 0 )

4289 return "__objc_classrefs";

         if ( strncmp(sect->sectname(), "__objc_classlist", 16) == 0 )

4291 return "__objc_classlist";

         if ( strncmp(sect->sectname(), "__objc_nlclslist", 16) == 0 )

4293 return "__objc_nlclslist";

         if ( strncmp(sect->sectname(), "__objc_nlcatlist", 16) == 0 )

4295 return "__objc_nlcatlist";

         if ( strncmp(sect->sectname(), "__objc_protolist", 16) == 0 )

4297 return "__objc_protolist";

         if ( strncmp(sect->sectname(), "__objc_protorefs", 16) == 0 )

4299 return "__objc_protorefs";

         if ( strncmp(sect->sectname(), "__objc_superrefs", 16) == 0 )

4301 return "__objc_superrefs";

         if ( strncmp(sect->sectname(), "__objc_imageinfo", 16) == 0 )

4303 return "__objc_imageinfo";

         if ( strncmp(sect->sectname(), "__objc_stringobj", 16) == 0 )

4305 return "__objc_stringobj";

         if ( strncmp(sect->sectname(), "__gcc_except_tab", 16) == 0 )

4307 return "__gcc_except_tab";

4308

         char* tmp = new char[17];

         strlcpy(tmp, name, 17);

4311 return tmp;

4312 }

4313

4314 template <typename A>

 bool Section<A>::readable(const macho_section<typename A::P>* sect)

4316 {

4317 return true;

4318 }

4319

4320 template <typename A>

 bool Section<A>::writable(const macho_section<typename A::P>* sect)

4322 {

4323 // mach-o .o files do not contain segment permissions

4324 // we just know TEXT is special

         return ( strcmp(sect->segname(), "__TEXT") != 0 );

4326 }

4327

4328 template <typename A>

 bool Section<A>::exectuable(const macho_section<typename A::P>* sect)

4330 {

4331 // mach-o .o files do not contain segment permissions

4332 // we just know TEXT is special

         return ( strcmp(sect->segname(), "__TEXT") == 0 );

4334 }

4335

4336

4337 template <typename A>

 ld::Section::Type Section<A>::sectionType(const macho_section<typename A::P>* sect)

4339 {

         switch ( sect->flags() & SECTION_TYPE ) {

4341 case S_ZEROFILL:

                         return ld::Section::typeZeroFill;

4343 case S_CSTRING_LITERALS:

                         if ( (strcmp(sect->sectname(), "__cstring") == 0) && (strcmp(sect->segname(), "__TEXT") == 0) )

                                 return ld::Section::typeCString;

4346 else

                                 return ld::Section::typeNonStdCString;

4348 case S_4BYTE_LITERALS:

                         return ld::Section::typeLiteral4;

4350 case S_8BYTE_LITERALS:

                         return ld::Section::typeLiteral8;

4352 case S_LITERAL_POINTERS:

                         return ld::Section::typeCStringPointer;

4354 case S_NON_LAZY_SYMBOL_POINTERS:

                         return ld::Section::typeNonLazyPointer;

4356 case S_LAZY_SYMBOL_POINTERS:

                         return ld::Section::typeLazyPointer;

4358 case S_SYMBOL_STUBS:

                         return ld::Section::typeStub;

4360 case S_MOD_INIT_FUNC_POINTERS:

                         return ld::Section::typeInitializerPointers;

4362 case S_MOD_TERM_FUNC_POINTERS:

                         return ld::Section::typeTerminatorPointers;

4364 case S_INTERPOSING:

                         return ld::Section::typeUnclassified;

4366 case S_16BYTE_LITERALS:

                         return ld::Section::typeLiteral16;

4368 case S_REGULAR:

4369 case S_COALESCED:

                         if ( sect->flags() & S_ATTR_PURE_INSTRUCTIONS ) {

                                 return ld::Section::typeCode;

4372 }

                         else if ( strcmp(sect->segname(), "__TEXT") == 0 ) {

                                 if ( strcmp(sect->sectname(), "__eh_frame") == 0 ) 

                                         return ld::Section::typeCFI;

                                 else if ( strcmp(sect->sectname(), "__ustring") == 0 )

                                         return ld::Section::typeUTF16Strings;

                                 else if ( strcmp(sect->sectname(), "__textcoal_nt") == 0 )

                                         return ld::Section::typeCode;

                                 else if ( strcmp(sect->sectname(), "__StaticInit") == 0 )

                                         return ld::Section::typeCode;

                                 else if ( strcmp(sect->sectname(), "__constructor") == 0 )

                                         return ld::Section::typeInitializerPointers;

4384 }

                         else if ( strcmp(sect->segname(), "__DATA") == 0 ) {

                                 if ( strcmp(sect->sectname(), "__cfstring") == 0 ) 

                                         return ld::Section::typeCFString;

                                 else if ( strcmp(sect->sectname(), "__dyld") == 0 )

                                         return ld::Section::typeDyldInfo;

                                 else if ( strcmp(sect->sectname(), "__program_vars") == 0 )

                                         return ld::Section::typeDyldInfo;

                                 else if ( strncmp(sect->sectname(), "__objc_classrefs", 16) == 0 )

                                         return ld::Section::typeObjCClassRefs;

                                 else if ( strcmp(sect->sectname(), "__objc_catlist") == 0 )

                                         return ld::Section::typeObjC2CategoryList;

4396 }

                         else if ( strcmp(sect->segname(), "__OBJC") == 0 ) {

                                 if ( strcmp(sect->sectname(), "__class") == 0 ) 

                                         return ld::Section::typeObjC1Classes;

4400 }

4401 break;

4402 case S_THREAD_LOCAL_REGULAR:

                         return ld::Section::typeTLVInitialValues;

4404 case S_THREAD_LOCAL_ZEROFILL:

                         return ld::Section::typeTLVZeroFill;

4406 case S_THREAD_LOCAL_VARIABLES:

                         return ld::Section::typeTLVDefs;

4408 case S_THREAD_LOCAL_VARIABLE_POINTERS:

                         return ld::Section::typeTLVPointers;

4410 case S_THREAD_LOCAL_INIT_FUNCTION_POINTERS:

                         return ld::Section::typeTLVInitializerPointers;

4412 }

         return ld::Section::typeUnclassified;

4414 }

4415

4416

4417 template <typename A>

 Atom<A>* Section<A>::findContentAtomByAddress(pint_t addr, class Atom<A>* start, class Atom<A>* end)

4419 {

4420 // do a binary search of atom array

4421 uint32_t atomCount = end - start;

4422 Atom<A>* base = start;

         for (uint32_t n = atomCount; n > 0; n /= 2) {

                 Atom<A>* pivot = &base[n/2];

4425 pint_t atomStartAddr = pivot->_objAddress;

4426 pint_t atomEndAddr = atomStartAddr + pivot->_size;

4427 if ( atomStartAddr <= addr ) {

4428 // address in normal atom

4429 if (addr < atomEndAddr)

4430 return pivot;

4431 // address in "end" label (but not in alias)

                         if ( (pivot->_size == 0) && (addr == atomEndAddr) && !pivot->isAlias() )

4433 return pivot;

4434 }

4435 if ( addr >= atomEndAddr ) {

4436 // key > pivot

4437 // move base to atom after pivot

4438 base = &pivot[1];

4439 --n;

4440 }

4441 else {

4442 // key < pivot

4443 // keep same base

4444 }

4445 }

4446 return NULL;

4447 }

4448

4449 template <typename A>

 ld::Atom::Alignment Section<A>::alignmentForAddress(pint_t addr) 

4451 {

         const uint32_t sectionAlignment = this->_machOSection->align();

         uint32_t modulus = (addr % (1 << sectionAlignment));

         if ( modulus > 0xFFFF )

                 warning("alignment for symbol at address 0x%08llX in %s exceeds 2^16", (uint64_t)addr, this->file().path());

         return ld::Atom::Alignment(sectionAlignment, modulus);

4457 }

4458

4459 template <typename A>

 uint32_t Section<A>::sectionNum(class Parser<A>& parser) const  

4461 {

4462 if ( _machOSection == NULL )

4463 return 0;

4464 else

                 return 1 + (this->_machOSection - parser.firstMachOSection());

4466 }

4467

4468 // arm does not have zero cost exceptions

4469 template <>

 uint32_t CFISection<arm>::cfiCount(Parser<arm>& parser) 

4471 {

         if ( parser.armUsesZeroCostExceptions() ) {

4473 // create ObjectAddressSpace object for use by libunwind

                 OAS oas(*this, (uint8_t*)this->file().fileContent()+this->_machOSection->offset());

                 return libunwind::CFI_Parser<OAS>::getCFICount(oas, 

                                                                                         this->_machOSection->addr(), this->_machOSection->size());

4477 }

4478 return 0;

4479 }

4480

4481 template <typename A>

 uint32_t CFISection<A>::cfiCount(Parser<A>& parser)

4483 {

4484 // create ObjectAddressSpace object for use by libunwind

         OAS oas(*this, (uint8_t*)this->file().fileContent()+this->_machOSection->offset());

         return libunwind::CFI_Parser<OAS>::getCFICount(oas, 

                                                                                 this->_machOSection->addr(), this->_machOSection->size());

4488 }

4489

4490 template <typename A>

 void CFISection<A>::warnFunc(void* ref, uint64_t funcAddr, const char* msg)

4492 {

         Parser<A>* parser = (Parser<A>*)ref;

         if ( ! parser->warnUnwindConversionProblems() ) 

4495 return;

4496 if ( funcAddr != CFI_INVALID_ADDRESS ) {

4497 // atoms are not constructed yet, so scan symbol table for labels

                 const char* name = parser->scanSymbolTableForAddress(funcAddr);

                 warning("could not create compact unwind for %s: %s", name, msg);

4500 }

4501 else {

                 warning("could not create compact unwind: %s", msg);

4503 }

4504 }

4505

4506 template <>

 bool CFISection<x86_64>::needsRelocating()

4508 {

4509 return true;

4510 }

4511

4512 template <>

 bool CFISection<arm64>::needsRelocating()

4514 {

4515 return true;

4516 }

4517

4518

4519 template <typename A>

 bool CFISection<A>::needsRelocating()

4521 {

4522 return false;

4523 }

4524

4525 template <>

 void CFISection<x86_64>::cfiParse(class Parser<x86_64>& parser, uint8_t* buffer,

                                                                         libunwind::CFI_Atom_Info<CFISection<x86_64>::OAS> cfiArray[],

                                                                         uint32_t& count, const pint_t cuStarts[], uint32_t cuCount)

4529 {

         const uint32_t sectionSize = this->_machOSection->size();

4531 // copy __eh_frame data to buffer

         memcpy(buffer, file().fileContent() + this->_machOSection->offset(), sectionSize);

4533

4534 // and apply relocations

         const macho_relocation_info<P>* relocs = (macho_relocation_info<P>*)(file().fileContent() + this->_machOSection->reloff());

         const macho_relocation_info<P>* relocsEnd = &relocs[this->_machOSection->nreloc()];

         for (const macho_relocation_info<P>* reloc = relocs; reloc < relocsEnd; ++reloc) {

4538 uint64_t value = 0;

                 switch ( reloc->r_type() ) {

4540 case X86_64_RELOC_SUBTRACTOR:

                                 value =  0 - parser.symbolFromIndex(reloc->r_symbolnum()).n_value();

4542 ++reloc;

                                 if ( reloc->r_extern() )

                                         value += parser.symbolFromIndex(reloc->r_symbolnum()).n_value();

4545 break;

4546 case X86_64_RELOC_UNSIGNED:

                                 value = parser.symbolFromIndex(reloc->r_symbolnum()).n_value();

4548 break;

4549 case X86_64_RELOC_GOT:

4550 // this is used for the reference to the personality function in CIEs

4551 // store the symbol number of the personality function for later use as a Fixup

4552 value = reloc->r_symbolnum();

4553 break;

4554 default:

                                 fprintf(stderr, "CFISection::cfiParse() unexpected relocation type at r_address=0x%08X\n", reloc->r_address());

4556 break;

4557 }

                 if ( reloc->r_address() > sectionSize )

                         throwf("malformed __eh_frame relocation, offset (0x%08X) is beyond end of section,", reloc->r_address());

4560 uint64_t* p64;

4561 uint32_t* p32;

                 switch ( reloc->r_length() ) {

4563 case 3:

                                 p64 = (uint64_t*)&buffer[reloc->r_address()];

                                 E::set64(*p64, value + E::get64(*p64));

4566 break;

4567 case 2:

                                 p32 = (uint32_t*)&buffer[reloc->r_address()];

                                 E::set32(*p32, value + E::get32(*p32));

4570 break;

4571 default:

                                 fprintf(stderr, "CFISection::cfiParse() unexpected relocation size at r_address=0x%08X\n", reloc->r_address());

4573 break;

4574 }

4575 }

4576

4577 // create ObjectAddressSpace object for use by libunwind

         OAS oas(*this, buffer);

4579

4580 // use libuwind to parse __eh_frame data into array of CFI_Atom_Info

4581 const char* msg;

         msg = libunwind::DwarfInstructions<OAS, libunwind::Registers_x86_64>::parseCFIs(

                                                         oas, this->_machOSection->addr(), this->_machOSection->size(), 

                                                         cuStarts, cuCount, parser.keepDwarfUnwind(), parser.forceDwarfConversion(), parser.neverConvertDwarf(), 

                                                         cfiArray, count, (void*)&parser, warnFunc);

4586 if ( msg != NULL )

                 throwf("malformed __eh_frame section: %s", msg);

4588 }

4589

4590 template <>

 void CFISection<x86>::cfiParse(class Parser<x86>& parser, uint8_t* buffer, 

                                                                         libunwind::CFI_Atom_Info<CFISection<x86>::OAS> cfiArray[],

                                                                         uint32_t& count, const pint_t cuStarts[], uint32_t cuCount)

4594 {

4595 // create ObjectAddressSpace object for use by libunwind

         OAS oas(*this, (uint8_t*)this->file().fileContent()+this->_machOSection->offset());

4597

4598 // use libuwind to parse __eh_frame data into array of CFI_Atom_Info

4599 const char* msg;

         msg = libunwind::DwarfInstructions<OAS, libunwind::Registers_x86>::parseCFIs(

                                                         oas, this->_machOSection->addr(), this->_machOSection->size(), 

                                                         cuStarts, cuCount, parser.keepDwarfUnwind(), parser.forceDwarfConversion(), parser.neverConvertDwarf(),

                                                         cfiArray, count, (void*)&parser, warnFunc);

4604 if ( msg != NULL )

                 throwf("malformed __eh_frame section: %s", msg);

4606 }

4611 template <>

 void CFISection<arm>::cfiParse(class Parser<arm>& parser, uint8_t* buffer, 

                                                                         libunwind::CFI_Atom_Info<CFISection<arm>::OAS> cfiArray[],

                                                                         uint32_t& count, const pint_t cuStarts[], uint32_t cuCount)

4615 {

         if ( !parser.armUsesZeroCostExceptions() ) {

4617 // most arm do not use zero cost exceptions

                 assert(count == 0);

4619 return;

4620 }

4621 // create ObjectAddressSpace object for use by libunwind

         OAS oas(*this, (uint8_t*)this->file().fileContent()+this->_machOSection->offset());

4623

4624 // use libuwind to parse __eh_frame data into array of CFI_Atom_Info

4625 const char* msg;

         msg = libunwind::DwarfInstructions<OAS, libunwind::Registers_arm>::parseCFIs(

                                                         oas, this->_machOSection->addr(), this->_machOSection->size(), 

                                                         cuStarts, cuCount, parser.keepDwarfUnwind(), parser.forceDwarfConversion(), parser.neverConvertDwarf(),

                                                         cfiArray, count, (void*)&parser, warnFunc);

4630 if ( msg != NULL )

                 throwf("malformed __eh_frame section: %s", msg);

4632 }

4637 template <>

 void CFISection<arm64>::cfiParse(class Parser<arm64>& parser, uint8_t* buffer, 

                                                                         libunwind::CFI_Atom_Info<CFISection<arm64>::OAS> cfiArray[],

                                                                         uint32_t& count, const pint_t cuStarts[], uint32_t cuCount)

4641 {

4642 // copy __eh_frame data to buffer

         const uint32_t sectionSize = this->_machOSection->size();

         memcpy(buffer, file().fileContent() + this->_machOSection->offset(), sectionSize);

4645

4646 // and apply relocations

         const macho_relocation_info<P>* relocs = (macho_relocation_info<P>*)(file().fileContent() + this->_machOSection->reloff());

         const macho_relocation_info<P>* relocsEnd = &relocs[this->_machOSection->nreloc()];

         for (const macho_relocation_info<P>* reloc = relocs; reloc < relocsEnd; ++reloc) {

                 uint64_t* p64 = (uint64_t*)&buffer[reloc->r_address()];

                 uint32_t* p32 = (uint32_t*)&buffer[reloc->r_address()];

                 uint32_t addend32 = E::get32(*p32); 

                 uint64_t addend64 = E::get64(*p64); 

4654 uint64_t value = 0;

                 switch ( reloc->r_type() ) {

4656 case ARM64_RELOC_SUBTRACTOR:

                                 value =  0 - parser.symbolFromIndex(reloc->r_symbolnum()).n_value();

4658 ++reloc;

                                 if ( reloc->r_extern() )

                                         value += parser.symbolFromIndex(reloc->r_symbolnum()).n_value();

4661 break;

4662 case ARM64_RELOC_UNSIGNED:

                                 value = parser.symbolFromIndex(reloc->r_symbolnum()).n_value();

4664 break;

4665 case ARM64_RELOC_POINTER_TO_GOT:

4666 // this is used for the reference to the personality function in CIEs

4667 // store the symbol number of the personality function for later use as a Fixup

4668 value = reloc->r_symbolnum();

4669 addend32 = 0;

4670 addend64 = 0;

4671 break;

4672 default:

                                 fprintf(stderr, "CFISection::cfiParse() unexpected relocation type at r_address=0x%08X\n", reloc->r_address());

4674 break;

4675 }

                 if ( reloc->r_address() > sectionSize )

                         throwf("malformed __eh_frame relocation, offset (0x%08X) is beyond end of section,", reloc->r_address());

                 switch ( reloc->r_length() ) {

4679 case 3:

                                 E::set64(*p64, value + addend64);

4681 break;

4682 case 2:

                                 E::set32(*p32, value + addend32);

4684 break;

4685 default:

                                 fprintf(stderr, "CFISection::cfiParse() unexpected relocation size at r_address=0x%08X\n", reloc->r_address());

4687 break;

4688 }

4689 }

4690

4691

4692 // create ObjectAddressSpace object for use by libunwind

         OAS oas(*this, buffer);

4694

4695 // use libuwind to parse __eh_frame data into array of CFI_Atom_Info

4696 const char* msg;

         msg = libunwind::DwarfInstructions<OAS, libunwind::Registers_arm64>::parseCFIs(

                                                         oas, this->_machOSection->addr(), this->_machOSection->size(), 

                                                         cuStarts, cuCount, parser.keepDwarfUnwind(), parser.forceDwarfConversion(), parser.neverConvertDwarf(),

                                                         cfiArray, count, (void*)&parser, warnFunc);

4701 if ( msg != NULL )

                 throwf("malformed __eh_frame section: %s", msg);

4703 }

4704

4705

4706 template <typename A>

 uint32_t CFISection<A>::computeAtomCount(class Parser<A>& parser, 

                                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it, 

                                                                                         const struct Parser<A>::CFI_CU_InfoArrays& cfis)

4710 {

4711 return cfis.cfiCount;

4712 }

4713

4714

4715

4716 template <typename A>

 uint32_t CFISection<A>::appendAtoms(class Parser<A>& parser, uint8_t* p, 

                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it, 

                                                                         const struct Parser<A>::CFI_CU_InfoArrays& cfis)

4720 {

         this->_beginAtoms = (Atom<A>*)p;

4722 // walk CFI_Atom_Info array and create atom for each entry

         const CFI_Atom_Info* start = &cfis.cfiArray[0];

         const CFI_Atom_Info* end   = &cfis.cfiArray[cfis.cfiCount];

         for(const CFI_Atom_Info* a=start; a < end; ++a) {

                 Atom<A>* space = (Atom<A>*)p;

                 new (space) Atom<A>(*this, (a->isCIE ? "CIE" : "FDE"), a->address, a->size, 

                                                                                 ld::Atom::definitionRegular, ld::Atom::combineNever, ld::Atom::scopeTranslationUnit,

                                                                                 ld::Atom::typeCFI, ld::Atom::symbolTableNotInFinalLinkedImages, 

                                                                                 false, false, false, ld::Atom::Alignment(0));

                 p += sizeof(Atom<A>);

4732 }

         this->_endAtoms = (Atom<A>*)p;

4734 return cfis.cfiCount;

4735 }

4736

4737

 template <> bool CFISection<x86_64>::bigEndian() { return false; }

 template <> bool CFISection<x86>::bigEndian() { return false; }

 template <> bool CFISection<arm>::bigEndian() { return false; }

 template <> bool CFISection<arm64>::bigEndian() { return false; }

4742

4743 template <>

 void CFISection<x86_64>::addCiePersonalityFixups(class Parser<x86_64>& parser, const CFI_Atom_Info* cieInfo)

4745 {

         uint8_t personalityEncoding = cieInfo->u.cieInfo.personality.encodingOfTargetAddress;

         if ( personalityEncoding == 0x9B ) {

4748 // compiler always produces X86_64_RELOC_GOT with addend of 4 to personality function

4749 // CFISection<x86_64>::cfiParse() set targetAddress to be symbolIndex + 4 + addressInCIE

                 uint32_t symbolIndex = cieInfo->u.cieInfo.personality.targetAddress - 4 

                                                                         - cieInfo->address - cieInfo->u.cieInfo.personality.offsetInCFI;

                 const macho_nlist<P>& sym = parser.symbolFromIndex(symbolIndex);

                 const char* personalityName = parser.nameFromSymbol(sym);

4754

                 Atom<x86_64>* cieAtom = this->findAtomByAddress(cieInfo->address);

                 Parser<x86_64>::SourceLocation src(cieAtom, cieInfo->u.cieInfo.personality.offsetInCFI);

                 parser.addFixup(src, ld::Fixup::k1of3, ld::Fixup::kindSetTargetAddress, false, personalityName);

                 parser.addFixup(src, ld::Fixup::k2of3, ld::Fixup::kindAddAddend, 4);

                 parser.addFixup(src, ld::Fixup::k3of3, ld::Fixup::kindStoreX86PCRel32GOT);

4760 }

         else if ( personalityEncoding != 0 ) {

                 throwf("unsupported address encoding (%02X) of personality function in CIE", 

4763 personalityEncoding);

4764 }

4765 }

4766

4767 template <>

 void CFISection<x86>::addCiePersonalityFixups(class Parser<x86>& parser, const CFI_Atom_Info* cieInfo)

4769 {

         uint8_t personalityEncoding = cieInfo->u.cieInfo.personality.encodingOfTargetAddress;

         if ( (personalityEncoding == 0x9B) || (personalityEncoding == 0x90) ) {

                 uint32_t offsetInCFI = cieInfo->u.cieInfo.personality.offsetInCFI;

                 uint32_t nlpAddr = cieInfo->u.cieInfo.personality.targetAddress;

                 Atom<x86>* cieAtom = this->findAtomByAddress(cieInfo->address);

                 Atom<x86>* nlpAtom = parser.findAtomByAddress(nlpAddr);

                 assert(nlpAtom->contentType() == ld::Atom::typeNonLazyPointer);

                 Parser<x86>::SourceLocation src(cieAtom, cieInfo->u.cieInfo.personality.offsetInCFI);

4778

                 parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, nlpAtom);

                 parser.addFixup(src, ld::Fixup::k2of4, ld::Fixup::kindSubtractTargetAddress, cieAtom);

                 parser.addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindSubtractAddend, offsetInCFI);

                 parser.addFixup(src, ld::Fixup::k4of4, ld::Fixup::kindStoreLittleEndian32);

4783 }

         else if ( personalityEncoding != 0 ) {

                 throwf("unsupported address encoding (%02X) of personality function in CIE", personalityEncoding);

4786 }

4787 }

4788

#if SUPPORT_ARCH_arm64
// Adds the fixups for a CIE's reference to its personality function (arm64).
// Only pointer encoding 0x9B is supported; encoding 0 adds nothing and any
// other encoding is rejected via throwf.
template <>
void CFISection<arm64>::addCiePersonalityFixups(class Parser<arm64>& parser, const CFI_Atom_Info* cieInfo)
{
	const uint8_t encoding = cieInfo->u.cieInfo.personality.encodingOfTargetAddress;
	if ( encoding != 0x9B ) {
		if ( encoding != 0 ) {
			throwf("unsupported address encoding (%02X) of personality function in CIE",
				encoding);
		}
		return;
	}

	// compiler always produces ARM64_RELOC_GOT r_pcrel=1 to personality function
	// CFISection<arm64>::cfiParse() set targetAddress to be symbolIndex + addressInCIE,
	// so undo that arithmetic to recover the symbol index
	uint32_t symbolIndex = cieInfo->u.cieInfo.personality.targetAddress
							- cieInfo->address - cieInfo->u.cieInfo.personality.offsetInCFI;
	const macho_nlist<P>& personalitySym = parser.symbolFromIndex(symbolIndex);
	const char* personalityName = parser.nameFromSymbol(personalitySym);

	Atom<arm64>* cieAtom = this->findAtomByAddress(cieInfo->address);
	Parser<arm64>::SourceLocation src(cieAtom, cieInfo->u.cieInfo.personality.offsetInCFI);
	parser.addFixup(src, ld::Fixup::k1of2, ld::Fixup::kindSetTargetAddress, false, personalityName);
	parser.addFixup(src, ld::Fixup::k2of2, ld::Fixup::kindStoreARM64PCRelToGOT);
}
#endif

4813

4814

4815 template <>

 void CFISection<arm>::addCiePersonalityFixups(class Parser<arm>& parser, const CFI_Atom_Info* cieInfo)

4817 {

         uint8_t personalityEncoding = cieInfo->u.cieInfo.personality.encodingOfTargetAddress;

         if ( (personalityEncoding == 0x9B) || (personalityEncoding == 0x90) ) {

                 uint32_t offsetInCFI = cieInfo->u.cieInfo.personality.offsetInCFI;

                 uint32_t nlpAddr = cieInfo->u.cieInfo.personality.targetAddress;

                 Atom<arm>* cieAtom = this->findAtomByAddress(cieInfo->address);

                 Atom<arm>* nlpAtom = parser.findAtomByAddress(nlpAddr);

                 assert(nlpAtom->contentType() == ld::Atom::typeNonLazyPointer);

                 Parser<arm>::SourceLocation src(cieAtom, cieInfo->u.cieInfo.personality.offsetInCFI);

4826

                 parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, nlpAtom);

                 parser.addFixup(src, ld::Fixup::k2of4, ld::Fixup::kindSubtractTargetAddress, cieAtom);

                 parser.addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindSubtractAddend, offsetInCFI);

                 parser.addFixup(src, ld::Fixup::k4of4, ld::Fixup::kindStoreLittleEndian32);

4831 }

         else if ( personalityEncoding != 0 ) {

                 throwf("unsupported address encoding (%02X) of personality function in CIE", personalityEncoding);

4834 }

4835 }

4836

4837

4838

4839 template <typename A>

 void CFISection<A>::addCiePersonalityFixups(class Parser<A>& parser, const CFI_Atom_Info* cieInfo)

4841 {

         assert(0 && "addCiePersonalityFixups() not implemented for arch");

4843 }

4844

4845 template <typename A>

 void CFISection<A>::makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays& cfis)

4847 {

         ld::Fixup::Kind store32 = bigEndian() ? ld::Fixup::kindStoreBigEndian32 : ld::Fixup::kindStoreLittleEndian32;

         ld::Fixup::Kind store64 = bigEndian() ? ld::Fixup::kindStoreBigEndian64 : ld::Fixup::kindStoreLittleEndian64;

4850

4851 // add all references for FDEs, including implicit group references

         const CFI_Atom_Info* end = &cfis.cfiArray[cfis.cfiCount];

         for(const CFI_Atom_Info* p = &cfis.cfiArray[0]; p < end; ++p) {

4854 if ( p->isCIE ) {

4855 // add reference to personality function if used

                         if ( p->u.cieInfo.personality.targetAddress != CFI_INVALID_ADDRESS ) {

                                 this->addCiePersonalityFixups(parser, p);

4858 }

4859 }

4860 else {

4861 // find FDE Atom

                         Atom<A>* fdeAtom = this->findAtomByAddress(p->address);

4863 // find function Atom

                         Atom<A>* functionAtom = parser.findAtomByAddress(p->u.fdeInfo.function.targetAddress);

4865 // find CIE Atom

                         Atom<A>* cieAtom = this->findAtomByAddress(p->u.fdeInfo.cie.targetAddress);

4867 // find LSDA Atom

4868 Atom<A>* lsdaAtom = NULL;

                         if ( p->u.fdeInfo.lsda.targetAddress != CFI_INVALID_ADDRESS ) {

                                 lsdaAtom = parser.findAtomByAddress(p->u.fdeInfo.lsda.targetAddress);

4871 }

4872 // add reference from FDE to CIE (always 32-bit pc-rel)

                         typename Parser<A>::SourceLocation fdeToCieSrc(fdeAtom, p->u.fdeInfo.cie.offsetInCFI);

                         parser.addFixup(fdeToCieSrc, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, fdeAtom);

                         parser.addFixup(fdeToCieSrc, ld::Fixup::k2of4, ld::Fixup::kindAddAddend, p->u.fdeInfo.cie.offsetInCFI);

                         parser.addFixup(fdeToCieSrc, ld::Fixup::k3of4, ld::Fixup::kindSubtractTargetAddress, cieAtom);

                         parser.addFixup(fdeToCieSrc, ld::Fixup::k4of4, store32, cieAtom);

4878

4879 // add reference from FDE to function

                         typename Parser<A>::SourceLocation fdeToFuncSrc(fdeAtom, p->u.fdeInfo.function.offsetInCFI);

                         switch (p->u.fdeInfo.function.encodingOfTargetAddress) {

4882 case DW_EH_PE_pcrel|DW_EH_PE_ptr:

                                         if ( sizeof(typename A::P::uint_t) == 8 ) {

                                                 parser.addFixup(fdeToFuncSrc, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, functionAtom);

                                                 parser.addFixup(fdeToFuncSrc, ld::Fixup::k2of4, ld::Fixup::kindSubtractTargetAddress, fdeAtom);

                                                 parser.addFixup(fdeToFuncSrc, ld::Fixup::k3of4, ld::Fixup::kindSubtractAddend, p->u.fdeInfo.function.offsetInCFI);

                                                 parser.addFixup(fdeToFuncSrc, ld::Fixup::k4of4, store64);

4888 break;

4889 }

4890 // else fall into 32-bit case

4891 case DW_EH_PE_pcrel|DW_EH_PE_sdata4:

                                         parser.addFixup(fdeToFuncSrc, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, functionAtom);

                                         parser.addFixup(fdeToFuncSrc, ld::Fixup::k2of4, ld::Fixup::kindSubtractTargetAddress, fdeAtom);

                                         parser.addFixup(fdeToFuncSrc, ld::Fixup::k3of4, ld::Fixup::kindSubtractAddend, p->u.fdeInfo.function.offsetInCFI);

                                         parser.addFixup(fdeToFuncSrc, ld::Fixup::k4of4, store32);

4896 break;

4897 default:

4898 throw "unsupported encoding in FDE of pointer to function";

4899 }

4900

4901 // add reference from FDE to LSDA

                         typename Parser<A>::SourceLocation fdeToLsdaSrc(fdeAtom,  p->u.fdeInfo.lsda.offsetInCFI);

4903 if ( lsdaAtom != NULL ) {

                                 switch (p->u.fdeInfo.lsda.encodingOfTargetAddress) {

4905 case DW_EH_PE_pcrel|DW_EH_PE_ptr:

                                                 if ( sizeof(typename A::P::uint_t) == 8 ) {

                                                         parser.addFixup(fdeToLsdaSrc, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, lsdaAtom);

                                                         parser.addFixup(fdeToLsdaSrc, ld::Fixup::k2of4, ld::Fixup::kindSubtractTargetAddress, fdeAtom);

                                                         parser.addFixup(fdeToLsdaSrc, ld::Fixup::k3of4, ld::Fixup::kindSubtractAddend, p->u.fdeInfo.lsda.offsetInCFI);

                                                         parser.addFixup(fdeToLsdaSrc, ld::Fixup::k4of4, store64);

4911 break;

4912 }

4913 // else fall into 32-bit case

4914 case DW_EH_PE_pcrel|DW_EH_PE_sdata4:

                                                 parser.addFixup(fdeToLsdaSrc, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, lsdaAtom);

                                                 parser.addFixup(fdeToLsdaSrc, ld::Fixup::k2of4, ld::Fixup::kindSubtractTargetAddress, fdeAtom);

                                                 parser.addFixup(fdeToLsdaSrc, ld::Fixup::k3of4, ld::Fixup::kindSubtractAddend, p->u.fdeInfo.lsda.offsetInCFI);

                                                 parser.addFixup(fdeToLsdaSrc, ld::Fixup::k4of4, store32);

4919 break;

4920 default:

4921 throw "unsupported encoding in FDE of pointer to LSDA";

4922 }

4923 }

4924

4925 // FDE is in group lead by function atom

                         typename Parser<A>::SourceLocation fdeSrc(functionAtom,0);

                         parser.addFixup(fdeSrc, ld::Fixup::k1of1, ld::Fixup::kindNoneGroupSubordinateFDE, fdeAtom);

4928

4929 // LSDA is in group lead by function atom

4930 if ( lsdaAtom != NULL ) {

                                 parser.addFixup(fdeSrc, ld::Fixup::k1of1, ld::Fixup::kindNoneGroupSubordinateLSDA, lsdaAtom);

4932 }

4933 }

4934 }

4935 }

4940 template <typename A>

 const void*      CFISection<A>::OAS::mappedAddress(pint_t addr)

4942 {

         if ( (_ehFrameStartAddr <= addr) && (addr < _ehFrameEndAddr) )

                 return &_ehFrameContent[addr-_ehFrameStartAddr];

4945 else {

4946 // requested bytes are not in __eh_frame section

4947 // this can occur when examining the instruction bytes in the __text

                 File<A>& file = _ehFrameSection.file();

                 for (uint32_t i=0; i < file._sectionsArrayCount; ++i ) {

                         const macho_section<typename A::P>* sect = file._sectionsArray[i]->machoSection();

4951 // TentativeDefinitionSection and AbsoluteSymbolSection have no mach-o section

4952 if ( sect != NULL ) {

                                 if ( (sect->addr() <= addr) && (addr < (sect->addr()+sect->size())) ) {

                                         return file.fileContent() + sect->offset() + addr - sect->addr();

4955 }

4956 }

4957 }

                 throwf("__eh_frame parsing problem.  Can't find target of reference to address 0x%08llX", (uint64_t)addr);

4959 }

4960 }

4961

4962

4963 template <typename A>

 uint64_t CFISection<A>::OAS::getULEB128(pint_t& logicalAddr, pint_t end)

4965 {

4966 uintptr_t size = (end - logicalAddr);

         libunwind::LocalAddressSpace::pint_t laddr = (libunwind::LocalAddressSpace::pint_t)mappedAddress(logicalAddr);

         libunwind::LocalAddressSpace::pint_t sladdr = laddr;

         uint64_t result = libunwind::LocalAddressSpace::getULEB128(laddr, laddr+size);

4970 logicalAddr += (laddr-sladdr);

4971 return result;

4972 }

4973

4974 template <typename A>

 int64_t CFISection<A>::OAS::getSLEB128(pint_t& logicalAddr, pint_t end)

4976 {

4977 uintptr_t size = (end - logicalAddr);

         libunwind::LocalAddressSpace::pint_t laddr = (libunwind::LocalAddressSpace::pint_t)mappedAddress(logicalAddr);

         libunwind::LocalAddressSpace::pint_t sladdr = laddr;

         int64_t result = libunwind::LocalAddressSpace::getSLEB128(laddr, laddr+size);

4981 logicalAddr += (laddr-sladdr);

4982 return result;

4983 }

4984

4985 template <typename A>

 typename A::P::uint_t CFISection<A>::OAS::getEncodedP(pint_t& addr, pint_t end, uint8_t encoding)

4987 {

4988 pint_t startAddr = addr;

4989 pint_t p = addr;

4990 pint_t result;

4991

4992 // first get value

         switch (encoding & 0x0F) {

4994 case DW_EH_PE_ptr:

4995 result = getP(addr);

4996 p += sizeof(pint_t);

4997 addr = (pint_t)p;

4998 break;

4999 case DW_EH_PE_uleb128:

                         result = getULEB128(addr, end);

5001 break;

5002 case DW_EH_PE_udata2:

5003 result = get16(addr);

5004 p += 2;

5005 addr = (pint_t)p;

5006 break;

5007 case DW_EH_PE_udata4:

5008 result = get32(addr);

5009 p += 4;

5010 addr = (pint_t)p;

5011 break;

5012 case DW_EH_PE_udata8:

5013 result = get64(addr);

5014 p += 8;

5015 addr = (pint_t)p;

5016 break;

5017 case DW_EH_PE_sleb128:

                         result = getSLEB128(addr, end);

5019 break;

5020 case DW_EH_PE_sdata2:

                         result = (int16_t)get16(addr);

5022 p += 2;

5023 addr = (pint_t)p;

5024 break;

5025 case DW_EH_PE_sdata4:

                         result = (int32_t)get32(addr);

5027 p += 4;

5028 addr = (pint_t)p;

5029 break;

5030 case DW_EH_PE_sdata8:

5031 result = get64(addr);

5032 p += 8;

5033 addr = (pint_t)p;

5034 break;

5035 default:

                         throwf("ObjectFileAddressSpace<A>::getEncodedP() encoding 0x%08X not supported", encoding);

5037 }

5038

5039 // then add relative offset

         switch ( encoding & 0x70 ) {

5041 case DW_EH_PE_absptr:

5042 // do nothing

5043 break;

5044 case DW_EH_PE_pcrel:

5045 result += startAddr;

5046 break;

5047 case DW_EH_PE_textrel:

5048 throw "DW_EH_PE_textrel pointer encoding not supported";

5049 break;

5050 case DW_EH_PE_datarel:

5051 throw "DW_EH_PE_datarel pointer encoding not supported";

5052 break;

5053 case DW_EH_PE_funcrel:

5054 throw "DW_EH_PE_funcrel pointer encoding not supported";

5055 break;

5056 case DW_EH_PE_aligned:

5057 throw "DW_EH_PE_aligned pointer encoding not supported";

5058 break;

5059 default:

                         throwf("ObjectFileAddressSpace<A>::getEncodedP() encoding 0x%08X not supported", encoding);

5061 break;

5062 }

5063

5064 // Note: DW_EH_PE_indirect is only used in CIEs to refernce the personality pointer

5065 // When parsing .o files that pointer contains zero, so we don't to return that.

5066 // Instead we skip the dereference and return the address of the pointer.

5067 // if ( encoding & DW_EH_PE_indirect )

5068 // result = getP(result);

5069

5070 return result;

5071 }

5072

5073 template <>

 const char* CUSection<x86_64>::personalityName(class Parser<x86_64>& parser, const macho_relocation_info<x86_64::P>* reloc)

5075 {

         if ( reloc->r_extern() ) {

                 assert((reloc->r_type() == X86_64_RELOC_UNSIGNED) && "wrong reloc type on personality column in __compact_unwind section");

                 const macho_nlist<P>& sym = parser.symbolFromIndex(reloc->r_symbolnum());

                 return parser.nameFromSymbol(sym);

5080 }

5081 else {

                 const pint_t* content = (pint_t*)(this->file().fileContent() + this->_machOSection->offset() + reloc->r_address());

5083 pint_t personalityAddr = *content;

                 assert((parser.sectionForAddress(personalityAddr)->type() == ld::Section::typeCode) && "personality column in __compact_unwind section is not pointer to function");

5085 // atoms may not be constructed yet, so scan symbol table for labels

                 const char* name = parser.scanSymbolTableForAddress(personalityAddr);

5087 return name;

5088 }

5089 }

5090

5091 template <>

 const char* CUSection<x86>::personalityName(class Parser<x86>& parser, const macho_relocation_info<x86::P>* reloc)

5093 {

         if ( reloc->r_extern() ) {

                 assert((reloc->r_type() == GENERIC_RELOC_VANILLA) && "wrong reloc type on personality column in __compact_unwind section");

                 const macho_nlist<P>& sym = parser.symbolFromIndex(reloc->r_symbolnum());

                 return parser.nameFromSymbol(sym);

5098 }

5099 else {

5100 // support __LD, __compact_unwind personality entries which are pointer to personality non-lazy pointer

                 const pint_t* content = (pint_t*)(this->file().fileContent() + this->_machOSection->offset() + reloc->r_address());

5102 pint_t nlPointerAddr = *content;

                 Section<x86>* nlSection = parser.sectionForAddress(nlPointerAddr);

                 if ( nlSection->type() == ld::Section::typeCode ) {

5105 // personality function is defined in this .o file, so this is a direct reference to it

5106 // atoms may not be constructed yet, so scan symbol table for labels

                         const char* name = parser.scanSymbolTableForAddress(nlPointerAddr);

5108 return name;

5109 }

5110 else {

                         uint32_t symIndex = parser.symbolIndexFromIndirectSectionAddress(nlPointerAddr, nlSection->machoSection());

                         const macho_nlist<P>& nlSymbol = parser.symbolFromIndex(symIndex);

                         return parser.nameFromSymbol(nlSymbol);

5114 }

5115 }

5116 }

5117

#if SUPPORT_ARCH_arm64
// Returns the name of the personality function referenced by a relocation on
// the personality column of __compact_unwind (arm64).
// An extern relocation names the symbol directly; otherwise the pointer stored
// in the section content is used to scan the symbol table for a label.
template <>
const char* CUSection<arm64>::personalityName(class Parser<arm64>& parser, const macho_relocation_info<arm64::P>* reloc)
{
	if ( !reloc->r_extern() ) {
		const pint_t* content = (pint_t*)(this->file().fileContent() + this->_machOSection->offset() + reloc->r_address());
		pint_t personalityAddr = *content;
		Section<arm64>* personalitySection = parser.sectionForAddress(personalityAddr);
		(void)personalitySection;	// only referenced by the assert below
		assert((personalitySection->type() == ld::Section::typeCode) && "personality column in __compact_unwind section is not pointer to function");
		// atoms may not be constructed yet, so scan symbol table for labels
		return parser.scanSymbolTableForAddress(personalityAddr);
	}

	assert((reloc->r_type() == ARM64_RELOC_UNSIGNED) && "wrong reloc type on personality column in __compact_unwind section");
	const macho_nlist<P>& personalitySym = parser.symbolFromIndex(reloc->r_symbolnum());
	return parser.nameFromSymbol(personalitySym);
}
#endif

5139

5140

#if SUPPORT_ARCH_arm_any
// Returns the name of the personality routine referenced by one relocation on the
// personality column of a __compact_unwind entry (arm specialization).
//  - extern reloc: the name is taken from the symbol the relocation names.
//  - local reloc:  the column content is an address.  If that address is in a code
//    section it is the personality function itself and its label is looked up in
//    the symbol table; otherwise it is treated as a non-lazy pointer and the name
//    comes from that pointer's indirect symbol table entry.
template <>
const char* CUSection<arm>::personalityName(class Parser<arm>& parser, const macho_relocation_info<arm::P>* reloc)
{
	if ( reloc->r_extern() ) {
		assert((reloc->r_type() == ARM_RELOC_VANILLA) && "wrong reloc type on personality column in __compact_unwind section");
		const macho_nlist<P>& sym = parser.symbolFromIndex(reloc->r_symbolnum());
		return parser.nameFromSymbol(sym);
	}

	// support __LD, __compact_unwind personality entries which are pointer to personality non-lazy pointer
	const pint_t* content = (pint_t*)(this->file().fileContent() + this->_machOSection->offset() + reloc->r_address());
	// Decode the stored pointer with P::getP(), the same accessor NonLazyPointerSection<A>::makeFixups()
	// uses for pointer-sized file content, instead of trusting a raw host-order load.
	const pint_t nlPointerAddr = P::getP(*content);
	Section<arm>* nlSection = parser.sectionForAddress(nlPointerAddr);
	if ( nlSection->type() == ld::Section::typeCode ) {
		// personality function is defined in this .o file, so this is a direct reference to it
		// atoms may not be constructed yet, so scan symbol table for labels
		return parser.scanSymbolTableForAddress(nlPointerAddr);
	}

	// pointer lives in a non-code section: resolve it through the indirect symbol table
	const uint32_t symIndex = parser.symbolIndexFromIndirectSectionAddress(nlPointerAddr, nlSection->machoSection());
	const macho_nlist<P>& nlSymbol = parser.symbolFromIndex(symIndex);
	return parser.nameFromSymbol(nlSymbol);
}
#endif

5169

5170

5171 template <typename A>

 const char* CUSection<A>::personalityName(class Parser<A>& parser, const macho_relocation_info<P>* reloc)

5173 {

5174 return NULL;

5175 }

5176

5177 template <>

 bool CUSection<x86>::encodingMeansUseDwarf(compact_unwind_encoding_t enc)

5179 {

         return ((enc & UNWIND_X86_MODE_MASK) == UNWIND_X86_MODE_DWARF);

5181 }

5182

5183 template <>

 bool CUSection<x86_64>::encodingMeansUseDwarf(compact_unwind_encoding_t enc)

5185 {

         return ((enc & UNWIND_X86_64_MODE_MASK) == UNWIND_X86_64_MODE_DWARF);

5187 }

5188

#if SUPPORT_ARCH_arm_any
// True when the mode bits of an arm compact unwind encoding select the DWARF mode.
template <>
bool CUSection<arm>::encodingMeansUseDwarf(compact_unwind_encoding_t enc)
{
	const compact_unwind_encoding_t mode = (enc & UNWIND_ARM_MODE_MASK);
	return ( mode == UNWIND_ARM_MODE_DWARF );
}
#endif

5196

#if SUPPORT_ARCH_arm64
// True when the mode bits of an arm64 compact unwind encoding select the DWARF mode.
template <>
bool CUSection<arm64>::encodingMeansUseDwarf(compact_unwind_encoding_t enc)
{
	const compact_unwind_encoding_t mode = (enc & UNWIND_ARM64_MODE_MASK);
	return ( mode == UNWIND_ARM64_MODE_DWARF );
}
#endif

5204

5205

5206 template <typename A>

 int CUSection<A>::infoSorter(const void* l, const void* r)

5208 {

5209 // sort references by symbol index, then address

         const Info* left = (Info*)l;

         const Info* right = (Info*)r;

         if ( left->functionSymbolIndex == right->functionSymbolIndex )

                 return (left->functionStartAddress - right->functionStartAddress);

5214 else

                 return (left->functionSymbolIndex - right->functionSymbolIndex);

5216 }

5217

5218 template <typename A>

 void CUSection<A>::parse(class Parser<A>& parser, uint32_t cnt, Info array[])

5220 {

5221 // walk section content and copy to Info array

         const macho_compact_unwind_entry<P>* const entries = (macho_compact_unwind_entry<P>*)(this->file().fileContent() + this->_machOSection->offset());

         for (uint32_t i=0; i < cnt; ++i) {

5224 Info* info = &array[i];

                 const macho_compact_unwind_entry<P>* entry = &entries[i];

                 info->functionStartAddress      = entry->codeStart();

5227 info->functionSymbolIndex = 0xFFFFFFFF;

                 info->rangeLength                       = entry->codeLen();

                 info->compactUnwindInfo         = entry->compactUnwindInfo();

5230 info->personality = NULL;

                 info->lsdaAddress                       = entry->lsda();

5232 info->function = NULL;

5233 info->lsda = NULL;

                 if ( (info->compactUnwindInfo & UNWIND_PERSONALITY_MASK) != 0 )

5235 warning("no bits should be set in UNWIND_PERSONALITY_MASK of compact unwind encoding in __LD,__compact_unwind section");

                 if ( info->lsdaAddress != 0 ) {

5237 info->compactUnwindInfo |= UNWIND_HAS_LSDA;

5238 }

5239 }

5240

5241 // scan relocs, extern relocs are needed for personality references (possibly for function/lsda refs??)

         const uint32_t sectionSize = this->_machOSection->size();

         const macho_relocation_info<P>* relocs = (macho_relocation_info<P>*)(this->file().fileContent() + this->_machOSection->reloff());

         const macho_relocation_info<P>* relocsEnd = &relocs[this->_machOSection->nreloc()];

         for (const macho_relocation_info<P>* reloc = relocs; reloc < relocsEnd; ++reloc) {

                 if ( reloc->r_address() & R_SCATTERED )

5247 continue;

                 if ( reloc->r_address() > sectionSize )

                         throwf("malformed __compact_unwind relocation, offset (0x%08X) is beyond end of section,", reloc->r_address());

                 if ( reloc->r_extern() ) {

5251 // only expect external relocs on some colummns

                         if ( (reloc->r_address() % sizeof(macho_compact_unwind_entry<P>)) == macho_compact_unwind_entry<P>::personalityFieldOffset() ) {

                                 uint32_t entryIndex = reloc->r_address() / sizeof(macho_compact_unwind_entry<P>);

                                 array[entryIndex].personality = this->personalityName(parser, reloc);

5255 }

                         else if ( (reloc->r_address() % sizeof(macho_compact_unwind_entry<P>)) == macho_compact_unwind_entry<P>::lsdaFieldOffset() ) {

                                 uint32_t entryIndex = reloc->r_address() / sizeof(macho_compact_unwind_entry<P>);

                                 const macho_nlist<P>& lsdaSym = parser.symbolFromIndex(reloc->r_symbolnum());

                                 if ( (lsdaSym.n_type() & N_TYPE) == N_SECT ) 

                                         array[entryIndex].lsdaAddress = lsdaSym.n_value();

5261 else

5262 warning("unexpected extern relocation to lsda in __compact_unwind section");

5263 }

                         else if ( (reloc->r_address() % sizeof(macho_compact_unwind_entry<P>)) == macho_compact_unwind_entry<P>::codeStartFieldOffset() ) {

                                 uint32_t entryIndex = reloc->r_address() / sizeof(macho_compact_unwind_entry<P>);

                                 array[entryIndex].functionSymbolIndex = reloc->r_symbolnum();

                                 array[entryIndex].functionStartAddress += parser.symbolFromIndex(reloc->r_symbolnum()).n_value();

5268 }

5269 else {

5270 warning("unexpected extern relocation in __compact_unwind section");

5271 }

5272 }

5273 else {

                         if ( (reloc->r_address() % sizeof(macho_compact_unwind_entry<P>)) == macho_compact_unwind_entry<P>::personalityFieldOffset() ) {

                                 uint32_t entryIndex = reloc->r_address() / sizeof(macho_compact_unwind_entry<P>);

                                 array[entryIndex].personality = this->personalityName(parser, reloc);

5277 }

5278 }

5279 }

5280

5281 // sort array by function start address so unwind infos will be contiguous for a given function

         ::qsort(array, cnt, sizeof(Info), infoSorter);

5283 }

5284

5285 template <typename A>

 uint32_t CUSection<A>::count()

5287 {

         const macho_section<P>* machoSect =     this->machoSection();

         if ( (machoSect->size() % sizeof(macho_compact_unwind_entry<P>)) != 0 )

5290 throw "malformed __LD,__compact_unwind section, bad length";

5291

         return machoSect->size() / sizeof(macho_compact_unwind_entry<P>);

5293 }

5294

5295 template <typename A>

 void CUSection<A>::makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays& cus)

5297 {

         Info* const arrayStart = cus.cuArray;

         Info* const arrayEnd = &cus.cuArray[cus.cuCount];

         for (Info* info=arrayStart; info < arrayEnd; ++info) {

5301 // find function atom from address

                 info->function = parser.findAtomByAddress(info->functionStartAddress);  

5303 // find lsda atom from address

                 if ( info->lsdaAddress != 0 ) {

                         info->lsda = parser.findAtomByAddress(info->lsdaAddress);               

5306 // add lsda subordinate

                         typename Parser<A>::SourceLocation src(info->function, info->functionStartAddress - info->function->objectAddress());

                         parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindNoneGroupSubordinateLSDA, info->lsda);

5309 }

                 if ( info->personality != NULL ) {

5311 // add personality subordinate

                         typename Parser<A>::SourceLocation src(info->function, info->functionStartAddress - info->function->objectAddress());

                         parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindNoneGroupSubordinatePersonality, false, info->personality);

5314 }

5315 }

5316

5317 }

5318

5319 template <typename A>

 SymboledSection<A>::SymboledSection(Parser<A>& parser, File<A>& f, const macho_section<typename A::P>* s)

         : Section<A>(f, s), _type(ld::Atom::typeUnclassified) 

5322 {

         switch ( s->flags() & SECTION_TYPE ) {

5324 case S_ZEROFILL:

                         _type = ld::Atom::typeZeroFill;

5326 break;

5327 case S_MOD_INIT_FUNC_POINTERS:

                         _type = ld::Atom::typeInitializerPointers;

5329 break;

5330 case S_MOD_TERM_FUNC_POINTERS:

                         _type = ld::Atom::typeTerminatorPointers;

5332 break;

5333 case S_THREAD_LOCAL_VARIABLES:

                         _type = ld::Atom::typeTLV;

5335 break;

5336 case S_THREAD_LOCAL_ZEROFILL:

                         _type = ld::Atom::typeTLVZeroFill;

5338 break;

5339 case S_THREAD_LOCAL_REGULAR:

                         _type = ld::Atom::typeTLVInitialValue;

5341 break;

5342 case S_THREAD_LOCAL_INIT_FUNCTION_POINTERS:

                         _type = ld::Atom::typeTLVInitializerPointers;

5344 break;

5345 case S_REGULAR:

                         if ( strncmp(s->sectname(), "__gcc_except_tab", 16) == 0 )

                                 _type = ld::Atom::typeLSDA;

                         else if ( this->type() == ld::Section::typeInitializerPointers )

                                 _type = ld::Atom::typeInitializerPointers;

5350 // <rdar://problem/34716321> don't warn about static initializers in dylibs built for profiling

                         if ( strncmp(s->sectname(), "__llvm_prf_", 11) == 0 )

                                 this->_file.setHasllvmProfiling();

5353 break;

5354 }

5355 }

5356

5357

5358 template <typename A>

 bool SymboledSection<A>::dontDeadStrip() 

5360 {

5361 switch ( _type ) {

                 case ld::Atom::typeInitializerPointers:

                 case ld::Atom::typeTerminatorPointers:

5364 return true;

5365 default:

5366 // model an object file without MH_SUBSECTIONS_VIA_SYMBOLS as one in which nothing can be dead stripped

                         if ( ! this->_file.canScatterAtoms() )

5368 return true;

5369 // call inherited

                         return Section<A>::dontDeadStrip();

5371 }

5372 return false;

5373 }

5374

5375

5376 template <typename A>

 uint32_t SymboledSection<A>::computeAtomCount(class Parser<A>& parser, 

                                                                                                 struct Parser<A>::LabelAndCFIBreakIterator& it, 

5379 const struct Parser<A>::CFI_CU_InfoArrays&)

5380 {

         const pint_t startAddr = this->_machOSection->addr();

         const pint_t endAddr = startAddr + this->_machOSection->size();

         const uint32_t sectNum = this->sectionNum(parser);

5384

5385 uint32_t count = 0;

5386 pint_t addr;

5387 pint_t size;

5388 const macho_nlist* sym;

         while ( it.next(parser, *this, sectNum, startAddr, endAddr, &addr, &size, &sym) ) {

5390 ++count;

5391 }

5392 //fprintf(stderr, "computeAtomCount(%s,%s) => %d\n", this->segmentName(), this->sectionName(), count);

5393 return count;

5394 }

5395

5396 template <typename A>

 uint32_t SymboledSection<A>::appendAtoms(class Parser<A>& parser, uint8_t* p, 

                                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it,

5399 const struct Parser<A>::CFI_CU_InfoArrays&)

5400 {

         this->_beginAtoms = (Atom<A>*)p;

5402

5403 //fprintf(stderr, "SymboledSection::appendAtoms() in section %s\n", this->_machOSection->sectname());

         const pint_t startAddr = this->_machOSection->addr();

         const pint_t endAddr = startAddr + this->_machOSection->size();

         const uint32_t sectNum = this->sectionNum(parser);

5407

5408 uint32_t count = 0;

5409 pint_t addr;

5410 pint_t size;

5411 const macho_nlist* label;

         while ( it.next(parser, *this, sectNum, startAddr, endAddr, &addr, &size, &label) ) {

                 Atom<A>* allocatedSpace = (Atom<A>*)p;

5414 // is break because of label or CFI?

5415 if ( label != NULL ) {

5416 // The size is computed based on the address of the next label (or the end of the section for the last label)

5417 // If there are two labels at the same address, we want them one to be an alias of the other.

5418 // If the label is at the end of a section, it is has zero size, but is not an alias

                         const bool isAlias = ( (size == 0) && (addr <  endAddr) );

                         new (allocatedSpace) Atom<A>(*this, parser, *label, size, isAlias);

5421 if ( isAlias )

                                 this->_hasAliases = true;

                         if ( parser.altEntryFromSymbol(*label) )

                                 this->_altEntries.insert(allocatedSpace);

5425 }

5426 else {

                         ld::Atom::SymbolTableInclusion inclusion = ld::Atom::symbolTableNotIn;

                         ld::Atom::ContentType ctype = this->contentType();

                         if ( ctype == ld::Atom::typeLSDA )

                                 inclusion = ld::Atom::symbolTableInWithRandomAutoStripLabel;

                         new (allocatedSpace) Atom<A>(*this, "anon", addr, size, ld::Atom::definitionRegular, ld::Atom::combineNever,

                                                                                 ld::Atom::scopeTranslationUnit, ctype, inclusion, 

                                                                                 this->dontDeadStrip(), false, false, this->alignmentForAddress(addr));

5434 }

                 p += sizeof(Atom<A>);

5436 ++count;

5437 }

5438

         this->_endAtoms = (Atom<A>*)p;

5440 return count;

5441 }

5442

5443

5444 template <>

 ld::Atom::SymbolTableInclusion ImplicitSizeSection<arm64>::symbolTableInclusion()

5446 {

         return ld::Atom::symbolTableInWithRandomAutoStripLabel;

5448 }

5449

5450

5451 template <typename A>

 ld::Atom::SymbolTableInclusion ImplicitSizeSection<A>::symbolTableInclusion()

5453 {

         return ld::Atom::symbolTableNotIn;

5455 }

5456

5457

5458 template <typename A>

 uint32_t ImplicitSizeSection<A>::computeAtomCount(class Parser<A>& parser, 

                                                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it, 

5461 const struct Parser<A>::CFI_CU_InfoArrays&)

5462 {

5463 uint32_t count = 0;

         const macho_section<P>* sect = this->machoSection();

         const pint_t startAddr = sect->addr();

         const pint_t endAddr = startAddr + sect->size();

         for (pint_t addr = startAddr; addr < endAddr; addr += elementSizeAtAddress(addr) ) {

                 if ( useElementAt(parser, it, addr) ) 

5469 ++count;

5470 }

         if ( it.fileHasOverlappingSymbols && (sect->size() != 0) && (this->combine(parser, startAddr) == ld::Atom::combineByNameAndContent) ) {

5472 // if there are multiple labels in this section for the same address, then clone them into multi atoms

5473 pint_t prevSymbolAddr = (pint_t)(-1);

5474 uint8_t prevSymbolSectNum = 0;

5475 bool prevIgnore = false;

                 for(uint32_t i=0; i < it.sortedSymbolCount; ++i) {

                         const macho_nlist<P>& sym = parser.symbolFromIndex(it.sortedSymbolIndexes[i]);

                         const pint_t symbolAddr = sym.n_value();

                         const uint8_t symbolSectNum = sym.n_sect();

                         const bool ignore = this->ignoreLabel(parser.nameFromSymbol(sym));

                         if ( !ignore && !prevIgnore && (symbolAddr == prevSymbolAddr) && (prevSymbolSectNum == symbolSectNum) && (symbolSectNum == this->sectionNum(parser)) ) { 

5482 ++count;

5483 }

5484 prevSymbolAddr = symbolAddr;

5485 prevSymbolSectNum = symbolSectNum;

5486 prevIgnore = ignore;

5487 }

5488 }

5489 return count;

5490 }

5491

5492 template <typename A>

 uint32_t ImplicitSizeSection<A>::appendAtoms(class Parser<A>& parser, uint8_t* p, 

                                                                                         struct Parser<A>::LabelAndCFIBreakIterator& it, 

5495 const struct Parser<A>::CFI_CU_InfoArrays&)

5496 {

         this->_beginAtoms = (Atom<A>*)p;

5498

         const macho_section<P>* sect = this->machoSection();

         const pint_t startAddr = sect->addr();

         const pint_t endAddr = startAddr + sect->size();

         const uint32_t sectNum = this->sectionNum(parser);

5503 //fprintf(stderr, "ImplicitSizeSection::appendAtoms() in section %s\n", sect->sectname());

5504 uint32_t count = 0;

5505 pint_t foundAddr;

5506 pint_t size;

5507 const macho_nlist* foundLabel;

5508 Atom<A>* allocatedSpace;

         while ( it.next(parser, *this, sectNum, startAddr, endAddr, &foundAddr, &size, &foundLabel) ) {

5510 if ( foundLabel != NULL ) {

5511 bool skip = false;

                         pint_t labeledAtomSize = this->elementSizeAtAddress(foundAddr);

5513 allocatedSpace = (Atom<A>*)p;

                         if ( this->ignoreLabel(parser.nameFromSymbol(*foundLabel)) ) {

                                 if ( size == 0 ) {

5516 // <rdar://problem/10018737>

5517 // a size of zero means there is another label at same location

5518 // and we are supposed to ignore this label

5519 skip = true;

5520 }

5521 else {

5522 //fprintf(stderr, " 0x%08llX make annon, size=%lld\n", (uint64_t)foundAddr, (uint64_t)size);

                                         new (allocatedSpace) Atom<A>(*this, this->unlabeledAtomName(parser, foundAddr), foundAddr, 

                                                                                         this->elementSizeAtAddress(foundAddr), this->definition(), 

                                                                                         this->combine(parser, foundAddr), this->scopeAtAddress(parser, foundAddr), 

                                                                                         this->contentType(), this->symbolTableInclusion(), 

                                                                                         this->dontDeadStrip(), false, false, this->alignmentForAddress(foundAddr));

5528 }

5529 }

5530 else {

5531 // make named atom for label

5532 //fprintf(stderr, " 0x%08llX make labeled: %s\n", (uint64_t)foundAddr, parser.nameFromSymbol(*foundLabel));

                                 new (allocatedSpace) Atom<A>(*this, parser, *foundLabel, labeledAtomSize);

5534 }

5535 if ( !skip ) {

5536 ++count;

                                 p += sizeof(Atom<A>);

5538 foundAddr += labeledAtomSize;

5539 size -= labeledAtomSize;

5540 }

5541 }

5542 // some number of anonymous atoms

                 for (pint_t addr = foundAddr; addr < (foundAddr+size); addr += elementSizeAtAddress(addr) ) {

5544 // make anon atoms for area before label

                         if ( this->useElementAt(parser, it, addr) ) {

5546 //fprintf(stderr, " 0x%08llX make annon, size=%lld\n", (uint64_t)addr, (uint64_t)elementSizeAtAddress(addr));

5547 allocatedSpace = (Atom<A>*)p;

                                 new (allocatedSpace) Atom<A>(*this, this->unlabeledAtomName(parser, addr), addr, this->elementSizeAtAddress(addr), 

                                                                                         this->definition(), this->combine(parser, addr), this->scopeAtAddress(parser, addr), 

                                                                                         this->contentType(), this->symbolTableInclusion(), 

                                                                                         this->dontDeadStrip(), false, false, this->alignmentForAddress(addr));

5552 ++count;

                                 p += sizeof(Atom<A>);

5554 }

5555 }

5556 }

5557

         this->_endAtoms = (Atom<A>*)p;

5559

5560 return count;

5561 }

5562

5563 template <typename A>

 bool Literal4Section<A>::ignoreLabel(const char* label) const

5565 {

         return (label[0] == 'L') || (label[0] == 'l');

5567 }

5568

5569 template <typename A>

 unsigned long Literal4Section<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

5571 {

         const uint32_t* literalContent = (uint32_t*)atom->contentPointer();

5573 return *literalContent;

5574 }

5575

5576 template <typename A>

 bool Literal4Section<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const

5579 {

         assert(this->type() == rhs.section().type());

         const uint32_t* literalContent = (uint32_t*)atom->contentPointer();

5582

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

5584 assert(rhsAtom != NULL);

5585 if ( rhsAtom != NULL ) {

                 const uint32_t* rhsLiteralContent = (uint32_t*)rhsAtom->contentPointer();

5587 return (*literalContent == *rhsLiteralContent);

5588 }

5589 return false;

5590 }

5591

5592

5593 template <typename A>

 bool Literal8Section<A>::ignoreLabel(const char* label) const

5595 {

         return (label[0] == 'L') || (label[0] == 'l');

5597 }

5598

5599 template <typename A>

 unsigned long Literal8Section<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

5601 {

5602 #if __LP64__

         const uint64_t* literalContent = (uint64_t*)atom->contentPointer();

5604 return *literalContent;

5605 #else

5606 unsigned long hash = 5381;

         const uint8_t* byteContent = atom->contentPointer();

         for (int i=0; i < 8; ++i) {

                 hash = hash * 33 + byteContent[i];

5610 }

5611 return hash;

5612 #endif

5613 }

5614

5615 template <typename A>

 bool Literal8Section<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const

5618 {

         if ( rhs.section().type() != ld::Section::typeLiteral8 )

5620 return false;

         assert(this->type() == rhs.section().type());

         const uint64_t* literalContent = (uint64_t*)atom->contentPointer();

5623

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

5625 assert(rhsAtom != NULL);

5626 if ( rhsAtom != NULL ) {

                 const uint64_t* rhsLiteralContent = (uint64_t*)rhsAtom->contentPointer();

5628 return (*literalContent == *rhsLiteralContent);

5629 }

5630 return false;

5631 }

5632

5633 template <typename A>

 bool Literal16Section<A>::ignoreLabel(const char* label) const

5635 {

         return (label[0] == 'L') || (label[0] == 'l');

5637 }

5638

5639 template <typename A>

 unsigned long Literal16Section<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

5641 {

5642 unsigned long hash = 5381;

         const uint8_t* byteContent = atom->contentPointer();

         for (int i=0; i < 16; ++i) {

                 hash = hash * 33 + byteContent[i];

5646 }

5647 return hash;

5648 }

5649

5650 template <typename A>

 bool Literal16Section<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const

5653 {

         if ( rhs.section().type() != ld::Section::typeLiteral16 )

5655 return false;

         assert(this->type() == rhs.section().type());

         const uint64_t* literalContent = (uint64_t*)atom->contentPointer();

5658

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

5660 assert(rhsAtom != NULL);

5661 if ( rhsAtom != NULL ) {

                 const uint64_t* rhsLiteralContent = (uint64_t*)rhsAtom->contentPointer();

                 return ((literalContent[0] == rhsLiteralContent[0]) && (literalContent[1] == rhsLiteralContent[1]));

5664 }

5665 return false;

5666 }

5667

5668

5669

5670 template <typename A>

 typename A::P::uint_t CStringSection<A>::elementSizeAtAddress(pint_t addr)

5672 {

         const macho_section<P>* sect = this->machoSection();

         const char* stringContent = (char*)(this->file().fileContent() + sect->offset() + addr - sect->addr());

         return strlen(stringContent) + 1;

5676 }

5677

5678 template <typename A>

 bool CStringSection<A>::useElementAt(Parser<A>& parser, struct Parser<A>::LabelAndCFIBreakIterator& it, pint_t addr)

5680 {

5681 return true;

5682 }

5683

5684 template <typename A>

 bool CStringSection<A>::ignoreLabel(const char* label) const

5686 {

         return (label[0] == 'L') || (label[0] == 'l'); 

5688 }

5689

5690

5691 template <typename A>

 Atom<A>* CStringSection<A>::findAtomByAddress(pint_t addr)

5693 {

         Atom<A>* result = this->findContentAtomByAddress(addr, this->_beginAtoms, this->_endAtoms);

5695 return result;

5696 }

5697

5698 template <typename A>

 unsigned long CStringSection<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

5700 {

5701 unsigned long hash = 5381;

         const char* stringContent = (char*)atom->contentPointer();

         for (const char* s = stringContent; *s != '\0'; ++s) {

                 hash = hash * 33 + *s;

5705 }

5706 return hash;

5707 }

5708

5709

5710 template <typename A>

 bool CStringSection<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const

5713 {

         if ( rhs.section().type() != ld::Section::typeCString )

5715 return false;

         assert(this->type() == rhs.section().type());

         assert(strcmp(this->sectionName(), rhs.section().sectionName())== 0);

         assert(strcmp(this->segmentName(), rhs.section().segmentName())== 0);

         const char* stringContent = (char*)atom->contentPointer();

5720

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

5722 assert(rhsAtom != NULL);

5723 if ( rhsAtom != NULL ) {

                 if ( atom->_size != rhsAtom->_size )

5725 return false;

                 const char* rhsStringContent = (char*)rhsAtom->contentPointer();

                 return (strcmp(stringContent, rhsStringContent) == 0);

5728 }

5729 return false;

5730 }

5731

5732

5733 template <>

 ld::Fixup::Kind NonLazyPointerSection<x86>::fixupKind()

5735 {

         return ld::Fixup::kindStoreLittleEndian32;

5737 }

5738

5739 template <>

 ld::Fixup::Kind NonLazyPointerSection<arm>::fixupKind()

5741 {

         return ld::Fixup::kindStoreLittleEndian32;

5743 }

5744

5745 template <>

 ld::Fixup::Kind NonLazyPointerSection<arm64>::fixupKind()

5747 {

         return ld::Fixup::kindStoreLittleEndian64;

5749 }

5750

5751

5752 template <>

 void NonLazyPointerSection<x86_64>::makeFixups(class Parser<x86_64>& parser, const struct Parser<x86_64>::CFI_CU_InfoArrays&)

5754 {

         assert(0 && "x86_64 should not have non-lazy-pointer sections in .o files");

5756 }

5757

5758 template <typename A>

 void NonLazyPointerSection<A>::makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&)

5760 {

5761 // add references for each NLP atom based on indirect symbol table

         const macho_section<P>* sect = this->machoSection();

         const pint_t endAddr = sect->addr() + sect->size();

         for( pint_t addr = sect->addr(); addr < endAddr; addr += sizeof(pint_t)) {

5765 typename Parser<A>::SourceLocation src;

5766 typename Parser<A>::TargetDesc target;

                 src.atom = this->findAtomByAddress(addr);

5768 src.offsetInAtom = 0;

                 uint32_t symIndex = parser.symbolIndexFromIndirectSectionAddress(addr, sect);

5770 target.atom = NULL;

5771 target.name = NULL;

5772 target.weakImport = false;

5773 target.addend = 0;

5774 if ( symIndex == INDIRECT_SYMBOL_LOCAL ) {

5775 // use direct reference for local symbols

                         const pint_t* nlpContent = (pint_t*)(this->file().fileContent() + sect->offset() + addr - sect->addr());

                         pint_t targetAddr = P::getP(*nlpContent);

                         target.atom = parser.findAtomByAddress(targetAddr);

5779 target.weakImport = false;

                         target.addend = (targetAddr - target.atom->objectAddress());

5781 // <rdar://problem/8385011> if pointer to thumb function, mask of thumb bit (not an addend of +1)

                         if ( target.atom->isThumb() )

5783 target.addend &= (-2);

                         assert(src.atom->combine() == ld::Atom::combineNever);

5785 }

5786 else {

                         const macho_nlist<P>& sym = parser.symbolFromIndex(symIndex);

5788 // use direct reference for local symbols

                         if ( ((sym.n_type() & N_TYPE) == N_SECT) && ((sym.n_type() & N_EXT) == 0) ) {

                                 parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), target);

                                 assert(src.atom->combine() == ld::Atom::combineNever);

5792 }

5793 else {

                                 target.name = parser.nameFromSymbol(sym);

                                 target.weakImport = parser.weakImportFromSymbol(sym);

                                 assert(src.atom->combine() == ld::Atom::combineByNameAndReferences);

5797 }

5798 }

                 parser.addFixups(src, this->fixupKind(), target);

5800 }

5801 }

5802

5803 template <typename A>

 ld::Atom::Combine NonLazyPointerSection<A>::combine(Parser<A>& parser, pint_t addr)

5805 {

         const macho_section<P>* sect = this->machoSection();

         uint32_t symIndex = parser.symbolIndexFromIndirectSectionAddress(addr, sect);

5808 if ( symIndex == INDIRECT_SYMBOL_LOCAL)

                 return ld::Atom::combineNever;

5810

5811 // don't coalesce non-lazy-pointers to local symbols

         const macho_nlist<P>& sym = parser.symbolFromIndex(symIndex);

         if ( ((sym.n_type() & N_TYPE) == N_SECT) && ((sym.n_type() & N_EXT) == 0) ) 

                 return ld::Atom::combineNever;

5815

         return ld::Atom::combineByNameAndReferences;

5817 }

5818

5819 template <typename A>

 const char* NonLazyPointerSection<A>::targetName(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) 

5821 {

         assert(atom->combine() == ld::Atom::combineByNameAndReferences);

         assert(atom->fixupCount() == 1);

         ld::Fixup::iterator fit = atom->fixupsBegin();

5825 const char* name = NULL;

5826 switch ( fit->binding ) {

                 case ld::Fixup::bindingByNameUnbound:

5828 name = fit->u.name;

5829 break;

                 case ld::Fixup::bindingByContentBound:

                         name = fit->u.target->name();

5832 break;

                 case ld::Fixup::bindingsIndirectlyBound:

                         name = ind.indirectName(fit->u.bindingIndex);

5835 break;

5836 default:

5837 assert(0);

5838 }

5839 assert(name != NULL);

5840 return name;

5841 }

5842

5843 template <typename A>

 unsigned long NonLazyPointerSection<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

5845 {

         assert(atom->combine() == ld::Atom::combineByNameAndReferences);

5847 unsigned long hash = 9508;

         for (const char* s = this->targetName(atom, ind); *s != '\0'; ++s) {

                 hash = hash * 33 + *s;

5850 }

5851 return hash;

5852 }

5853

5854 template <typename A>

 bool NonLazyPointerSection<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& indirectBindingTable) const

5857 {

         if ( rhs.section().type() != ld::Section::typeNonLazyPointer )

5859 return false;

         assert(this->type() == rhs.section().type());

5861 // there can be many non-lazy pointer in different section names

5862 // we only want to coalesce in same section name

         if ( *this != rhs.section() )

5864 return false;

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

5866 assert(rhsAtom != NULL);

         const char* thisName = this->targetName(atom, indirectBindingTable);

         const char* rhsName = this->targetName(rhsAtom, indirectBindingTable);

         return (strcmp(thisName, rhsName) == 0);

5870 }

5871

5872 template <typename A>

 ld::Atom::Scope NonLazyPointerSection<A>::scopeAtAddress(Parser<A>& parser, pint_t addr)

5874 {

         const macho_section<P>* sect = this->machoSection();

         uint32_t symIndex = parser.symbolIndexFromIndirectSectionAddress(addr, sect);

5877 if ( symIndex == INDIRECT_SYMBOL_LOCAL)

                 return ld::Atom::scopeTranslationUnit;

5879 else

                 return ld::Atom::scopeLinkageUnit; 

5881 }

5882

5883

5884

5885 template <typename A>

 ld::Atom::Combine TLVPointerSection<A>::combine(Parser<A>& parser, pint_t addr)

5887 {

         return ld::Atom::combineByNameAndReferences;

5889 }

5890

5891 template <>

 void TLVPointerSection<arm>::makeFixups(class Parser<arm>& parser, const struct Parser<arm>::CFI_CU_InfoArrays&)

5893 {

5894 // add references for each thread local pointer atom based on indirect symbol table

         const macho_section<P>* sect = this->machoSection();

         const pint_t endAddr = sect->addr() + sect->size();

         for (pint_t addr = sect->addr(); addr < endAddr; addr += sizeof(pint_t)) {

5898 typename Parser<arm>::SourceLocation src;

5899 typename Parser<arm>::TargetDesc target;

                 src.atom = this->findAtomByAddress(addr);

5901 src.offsetInAtom = 0;

                 uint32_t symIndex = parser.symbolIndexFromIndirectSectionAddress(addr, sect);

5903 target.atom = NULL;

5904 target.name = NULL;

5905 target.weakImport = false;

5906 target.addend = 0;

5907 if ( symIndex == INDIRECT_SYMBOL_LOCAL ) {

                         throwf("unexpected INDIRECT_SYMBOL_LOCAL in section %s", this->sectionName());

5909 }

5910 else {

                         const macho_nlist<P>& sym = parser.symbolFromIndex(symIndex);

5912 // use direct reference for local symbols

                         if ( ((sym.n_type() & N_TYPE) == N_SECT) && ((sym.n_type() & N_EXT) == 0) ) {

                                 throwf("unexpected pointer to local symbol in section %s", this->sectionName());

5915 }

5916 else {

                                 target.name = parser.nameFromSymbol(sym);

                                 target.weakImport = parser.weakImportFromSymbol(sym);

                                 assert(src.atom->combine() == ld::Atom::combineByNameAndReferences);

5920 }

5921 }

                 parser.addFixups(src, ld::Fixup::kindStoreLittleEndian32, target);

5923 }

5924 }

5925

5926 template <typename A>

 void TLVPointerSection<A>::makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&)

5928 {

         assert(0 && "should not have thread-local-pointer sections in .o files");

5930 }

5931

5932

5933 template <typename A>

 const char* TLVPointerSection<A>::targetName(const class Atom<A>* atom, const ld::IndirectBindingTable& ind, bool* isStatic)

5935 {

         assert(atom->combine() == ld::Atom::combineByNameAndReferences);

         assert(atom->fixupCount() == 1);

5938 *isStatic = false;

         ld::Fixup::iterator fit = atom->fixupsBegin();

5940 const char* name = NULL;

5941 switch ( fit->binding ) {

                 case ld::Fixup::bindingByNameUnbound:

5943 name = fit->u.name;

5944 break;

                 case ld::Fixup::bindingByContentBound:

                         name = fit->u.target->name();

5947 break;

                 case ld::Fixup::bindingsIndirectlyBound:

                         name = ind.indirectName(fit->u.bindingIndex);

5950 break;

                 case ld::Fixup::bindingDirectlyBound:

                         name = fit->u.target->name();

                         *isStatic = (fit->u.target->scope() == ld::Atom::scopeTranslationUnit);

5954 break;

5955 default:

5956 assert(0);

5957 }

5958 assert(name != NULL);

5959 return name;

5960 }

5961

5962 template <typename A>

 unsigned long TLVPointerSection<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

5964 {

         assert(atom->combine() == ld::Atom::combineByNameAndReferences);

5966 unsigned long hash = 9508;

5967 bool isStatic;

         for (const char* s = this->targetName(atom, ind, &isStatic); *s != '\0'; ++s) {

                 hash = hash * 33 + *s;

5970 }

5971 return hash;

5972 }

5973

5974 template <typename A>

 bool TLVPointerSection<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs,

                                                                                                         const ld::IndirectBindingTable& indirectBindingTable) const

5977 {

         if ( rhs.section().type() != ld::Section::typeTLVPointers )

5979 return false;

         assert(this->type() == rhs.section().type());

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

5982 assert(rhsAtom != NULL);

5983 bool thisIsStatic;

5984 bool rhsIsStatic;

         const char* thisName = this->targetName(atom, indirectBindingTable, &thisIsStatic);

         const char* rhsName = this->targetName(rhsAtom, indirectBindingTable, &rhsIsStatic);

         return !thisIsStatic && !rhsIsStatic && (strcmp(thisName, rhsName) == 0);

5988 }

5989

5990

5991 template <typename A>

 const uint8_t* CFStringSection<A>::targetContent(const class Atom<A>* atom, const ld::IndirectBindingTable& ind,

                                                                                                         ContentType* ct, unsigned int* count)

5994 {

5995 *ct = contentUnknown;

         for (ld::Fixup::iterator fit=atom->fixupsBegin(), end=atom->fixupsEnd(); fit != end; ++fit) {

                 const ld::Atom* targetAtom = NULL;

5998 switch ( fit->binding ) {

                         case ld::Fixup::bindingByNameUnbound:

6000 // ignore reference to ___CFConstantStringClassReference

6001 // we are just looking for reference to backing string data

                                 assert(fit->offsetInAtom == 0);

                                 assert(strcmp(fit->u.name, "___CFConstantStringClassReference") == 0);

6004 break;

                         case ld::Fixup::bindingDirectlyBound:

                         case ld::Fixup::bindingByContentBound:

6007 targetAtom = fit->u.target;

6008 break;

                         case ld::Fixup::bindingsIndirectlyBound:

                                 targetAtom = ind.indirectAtom(fit->u.bindingIndex);

6011 break;

6012 default:

                                 assert(0 && "bad binding type");

6014 }

6015 assert(targetAtom != NULL);

                 const Atom<A>* target = dynamic_cast<const Atom<A>*>(targetAtom);

                 if ( targetAtom->section().type() == ld::Section::typeCString ) {

6018 *ct = contentUTF8;

                         *count = targetAtom->size();

6020 }

                 else if ( targetAtom->section().type() == ld::Section::typeUTF16Strings ) {

6022 *ct = contentUTF16;

                         *count = (targetAtom->size()+1)/2; // round up incase of buggy compiler that has only one trailing zero byte

6024 }

6025 else {

6026 *ct = contentUnknown;

6027 *count = 0;

6028 return NULL;

6029 }

6030 return target->contentPointer();

6031 }

6032 assert(0);

6033 return NULL;

6034 }

6035

6036 template <typename A>

 unsigned long CFStringSection<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

6038 {

6039 // base hash of CFString on hash of cstring it wraps

6040 ContentType cType;

6041 unsigned long hash;

6042 unsigned int charCount;

         const uint8_t* content = this->targetContent(atom, ind, &cType, &charCount);

6044 switch ( cType ) {

6045 case contentUTF8:

6046 hash = 9408;

                         for (const char* s = (char*)content; *s != '\0'; ++s) {

                                 hash = hash * 33 + *s;

6049 }

6050 return hash;

6051 case contentUTF16:

6052 hash = 407955;

6053 --charCount; // don't add last 0x0000 to hash because some buggy compilers only have trailing single byte

                         for (const uint16_t* s = (uint16_t*)content; charCount > 0; ++s, --charCount) {

                                 hash = hash * 1025 + *s;

6056 }

6057 return hash;

6058 case contentUnknown:

6059 // <rdar://problem/14134211> For malformed CFStrings, hash to address of atom so they have unique hashes

                         return ULONG_MAX - (unsigned long)(atom);

6061 }

6062 return 0;

6063 }

6064

6065

6066 template <typename A>

 bool CFStringSection<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& indirectBindingTable) const

6069 {

6070 if ( atom == &rhs )

6071 return true;

         if ( rhs.section().type() != ld::Section::typeCFString)

6073 return false;

         assert(this->type() == rhs.section().type());

         assert(strcmp(this->sectionName(), "__cfstring") == 0);

6076

6077 ContentType thisType;

6078 unsigned int charCount;

         const uint8_t* cstringContent = this->targetContent(atom, indirectBindingTable, &thisType, &charCount);

6080 ContentType rhsType;

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

6082 assert(rhsAtom != NULL);

6083 unsigned int rhsCharCount;

         const uint8_t* rhsStringContent = this->targetContent(rhsAtom, indirectBindingTable, &rhsType, &rhsCharCount);

6085

6086 if ( thisType != rhsType )

6087 return false;

6088

6089 if ( thisType == contentUnknown )

6090 return false;

6091

6092 if ( rhsType == contentUnknown )

6093 return false;

6094

6095 // no need to compare content of pointers are already the same

6096 if ( cstringContent == rhsStringContent )

6097 return true;

6098

6099 // no need to compare content if size is different

6100 if ( charCount != rhsCharCount )

6101 return false;

6102

6103 switch ( thisType ) {

6104 case contentUTF8:

                         return (strcmp((char*)cstringContent, (char*)rhsStringContent) == 0);

6106 case contentUTF16:

6107 {

                                 const uint16_t* cstringContent16 = (uint16_t*)cstringContent;

                                 const uint16_t* rhsStringContent16 = (uint16_t*)rhsStringContent;

                                 for (unsigned int i = 0; i < charCount; ++i) {

                                         if ( cstringContent16[i] != rhsStringContent16[i] )

6112 return false;

6113 }

6114 return true;

6115 }

6116 case contentUnknown:

6117 return false;

6118 }

6119 return false;

6120 }

6121

6122

6123 template <typename A>

 typename A::P::uint_t ObjC1ClassSection<A>::elementSizeAtAddress(pint_t addr)

6125 {

6126 // nominal size for each class is 48 bytes, but sometimes the compiler

6127 // over aligns and there is padding after class data

         const macho_section<P>* sct = this->machoSection();

         uint32_t align = 1 << sct->align();

         uint32_t size = ((12 * sizeof(pint_t)) + align-1) & (-align);

6131 return size;

6132 }

6133

6134 template <typename A>

 const char* ObjC1ClassSection<A>::unlabeledAtomName(Parser<A>& parser, pint_t addr)

6136 {

6137 // 8-bytes into class object is pointer to class name

         const macho_section<P>* sct = this->machoSection();

         uint32_t classObjcFileOffset = sct->offset() - sct->addr() + addr;

         const uint8_t* mappedFileContent = this->file().fileContent();

         pint_t nameAddr = P::getP(*((pint_t*)(mappedFileContent+classObjcFileOffset+2*sizeof(pint_t))));

6142

6143 // find section containing string address to get string bytes

         const macho_section<P>* const sections = parser.firstMachOSection();

         const uint32_t sectionCount = parser.machOSectionCount();

         for (uint32_t i=0; i < sectionCount; ++i) {

                 const macho_section<P>* aSect = &sections[i];

                 if ( (aSect->addr() <= nameAddr) && (nameAddr < (aSect->addr()+aSect->size())) ) {

                         assert((aSect->flags() & SECTION_TYPE) == S_CSTRING_LITERALS);

                         uint32_t nameFileOffset = aSect->offset() - aSect->addr() + nameAddr;

                         const char* name = (char*)mappedFileContent + nameFileOffset;

6152 // spin through symbol table to find absolute symbol corresponding to this class

                         for (uint32_t s=0; s < parser.symbolCount(); ++s) {

                                 const macho_nlist<P>& sym =     parser.symbolFromIndex(s);

                                 if ( (sym.n_type() & N_TYPE) != N_ABS )

6156 continue;

                                 const char* absName = parser.nameFromSymbol(sym);

                                 if ( strncmp(absName, ".objc_class_name_", 17) == 0 ) {

                                         if ( strcmp(&absName[17], name) == 0 )

6160 return absName;

6161 }

6162 }

                         assert(0 && "obj class name not found in symbol table");

6164 }

6165 }

         assert(0 && "obj class name not found");

6167 return "unknown objc class";

6168 }

6169

6170

6171 template <typename A>

 const char* ObjC2ClassRefsSection<A>::targetClassName(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

6173 {

         assert(atom->fixupCount() == 1);

         ld::Fixup::iterator fit = atom->fixupsBegin();

6176 const char* className = NULL;

6177 switch ( fit->binding ) {

                 case ld::Fixup::bindingByNameUnbound:

6179 className = fit->u.name;

6180 break;

                 case ld::Fixup::bindingDirectlyBound:

                 case ld::Fixup::bindingByContentBound:

                         className = fit->u.target->name();

6184 break;

                 case ld::Fixup::bindingsIndirectlyBound:

                         className = ind.indirectName(fit->u.bindingIndex);

6187 break;

6188 default:

                         assert(0 && "unsupported binding in objc2 class ref section");

6190 }

6191 assert(className != NULL);

6192 return className;

6193 }

6194

6195

6196 template <typename A>

 unsigned long ObjC2ClassRefsSection<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

6198 {

6199 unsigned long hash = 978;

         for (const char* s = targetClassName(atom, ind); *s != '\0'; ++s) {

                 hash = hash * 33 + *s;

6202 }

6203 return hash;

6204 }

6205

6206 template <typename A>

 bool ObjC2ClassRefsSection<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& indirectBindingTable) const

6209 {

         assert(this->type() == rhs.section().type());

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

6212 assert(rhsAtom != NULL);

         const char* thisClassName = targetClassName(atom, indirectBindingTable);

         const char* rhsClassName = targetClassName(rhsAtom, indirectBindingTable);

         return (strcmp(thisClassName, rhsClassName) == 0);

6216 }

6217

6218

6219 template <typename A>

 const char* Objc1ClassReferences<A>::targetCString(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

6221 {

         assert(atom->fixupCount() == 2);

         ld::Fixup::iterator fit = atom->fixupsBegin();

         if ( fit->kind == ld::Fixup::kindSetTargetAddress )

6225 ++fit;

         const ld::Atom* targetAtom = NULL;

6227 switch ( fit->binding ) {

                 case ld::Fixup::bindingByContentBound:

6229 targetAtom = fit->u.target;

6230 break;

                 case ld::Fixup::bindingsIndirectlyBound:

                         targetAtom = ind.indirectAtom(fit->u.bindingIndex);

6233 if ( targetAtom == NULL ) {

                                 fprintf(stderr, "missing target named %s\n", ind.indirectName(fit->u.bindingIndex));

6235 }

6236 break;

6237 default:

6238 assert(0);

6239 }

6240 assert(targetAtom != NULL);

         const Atom<A>* target = dynamic_cast<const Atom<A>*>(targetAtom);

6242 assert(target != NULL);

         return (char*)target->contentPointer();

6244 }

6245

6246

6247 template <typename A>

 const char* PointerToCStringSection<A>::targetCString(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

6249 {

         assert(atom->fixupCount() == 1);

         ld::Fixup::iterator fit = atom->fixupsBegin();

         const ld::Atom* targetAtom = NULL;

6253 switch ( fit->binding ) {

                 case ld::Fixup::bindingByContentBound:

6255 targetAtom = fit->u.target;

6256 break;

                 case ld::Fixup::bindingsIndirectlyBound:

                         targetAtom = ind.indirectAtom(fit->u.bindingIndex);

6259 break;

                 case ld::Fixup::bindingDirectlyBound:

6261 targetAtom = fit->u.target;

6262 break;

6263 default:

                         assert(0 && "unsupported reference to selector");

6265 }

6266 assert(targetAtom != NULL);

         const Atom<A>* target = dynamic_cast<const Atom<A>*>(targetAtom);

6268 assert(target != NULL);

         assert(target->contentType() == ld::Atom::typeCString);

         return (char*)target->contentPointer();

6271 }

6272

6273 template <typename A>

 unsigned long PointerToCStringSection<A>::contentHash(const class Atom<A>* atom, 

                                                                                                         const ld::IndirectBindingTable& indirectBindingTable) const

6276 {

6277 // make hash from section name and target cstring name

6278 unsigned long hash = 123;

         for (const char* s = this->sectionName(); *s != '\0'; ++s) {

                 hash = hash * 33 + *s;

6281 }

         for (const char* s = this->targetCString(atom, indirectBindingTable); *s != '\0'; ++s) {

                 hash = hash * 33 + *s;

6284 }

6285 return hash;

6286 }

6287

6288 template <typename A>

 bool PointerToCStringSection<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& indirectBindingTable) const

6291 {

         assert(this->type() == rhs.section().type());

6293 // there can be pointers-to-cstrings in different section names

6294 // we only want to coalesce in same section name

         if ( *this != rhs.section() )

6296 return false;

6297

6298 // get string content for this

         const char* cstringContent = this->targetCString(atom, indirectBindingTable);

         const Atom<A>* rhsAtom = dynamic_cast<const Atom<A>*>(&rhs);

6301 assert(rhsAtom != NULL);

         const char* rhsCstringContent = this->targetCString(rhsAtom, indirectBindingTable);

6303

6304 assert(cstringContent != NULL);

6305 assert(rhsCstringContent != NULL);

         return (strcmp(cstringContent, rhsCstringContent) == 0);

6307 }

6308

6309

6310

6311 template <typename A>

 unsigned long UTF16StringSection<A>::contentHash(const class Atom<A>* atom, const ld::IndirectBindingTable& ind) const

6313 {

6314 unsigned long hash = 5381;

         const uint16_t* stringContent = (uint16_t*)atom->contentPointer();

6316 // some buggy compilers end utf16 data with single byte, so don't use last word in hash computation

         unsigned int count = (atom->size()/2) - 1;

         for (const uint16_t* s = stringContent; count > 0; ++s, --count) {

                 hash = hash * 33 + *s;

6320 }

6321 return hash;

6322 }

6323

6324 template <typename A>

 bool UTF16StringSection<A>::canCoalesceWith(const class Atom<A>* atom, const ld::Atom& rhs, 

                                                                                                         const ld::IndirectBindingTable& ind) const

6327 {

         if ( rhs.section().type() != ld::Section::typeUTF16Strings )

6329 return false;

6330 assert(0);

6331 return false;

6332 }

6340 template <>

 uint32_t Section<x86_64>::x86_64PcRelOffset(uint8_t r_type)

6342 {

6343 switch ( r_type ) {

6344 case X86_64_RELOC_SIGNED:

6345 return 4;

6346 case X86_64_RELOC_SIGNED_1:

6347 return 5;

6348 case X86_64_RELOC_SIGNED_2:

6349 return 6;

6350 case X86_64_RELOC_SIGNED_4:

6351 return 8;

6352 }

6353 return 0;

6354 }

6355

6356

6357 template <>

 bool Section<x86_64>::addRelocFixup(class Parser<x86_64>& parser, const macho_relocation_info<P>* reloc)

6359 {

         const macho_section<P>* sect = this->machoSection();

6361 if ( sect == NULL ) {

                 warning("malformed mach-o, relocations not supported on section %s", this->sectionName());

6363 return false;

6364 }

         uint64_t srcAddr = sect->addr() + reloc->r_address();

6366 Parser<x86_64>::SourceLocation src;

6367 Parser<x86_64>::TargetDesc target;

6368 Parser<x86_64>::TargetDesc toTarget;

         src.atom = this->findAtomByAddress(srcAddr);

         if ( src.atom == NULL )

                 throwf("malformed mach-o, reloc addr 0x%llX not in any atom", srcAddr);

         src.offsetInAtom = srcAddr - src.atom->_objAddress;

         const uint8_t* fixUpPtr = file().fileContent() + sect->offset() + reloc->r_address();

6374 uint64_t contentValue = 0;

         const macho_relocation_info<x86_64::P>* nextReloc = &reloc[1];

6376 bool result = false;

6377 bool useDirectBinding;

         switch ( reloc->r_length() ) {

6379 case 0:

6380 contentValue = *fixUpPtr;

6381 break;

6382 case 1:

                         contentValue = (int64_t)(int16_t)E::get16(*((uint16_t*)fixUpPtr));

6384 break;

6385 case 2:

                         contentValue = (int64_t)(int32_t)E::get32(*((uint32_t*)fixUpPtr));

6387 break;

6388 case 3:

                         contentValue = E::get64(*((uint64_t*)fixUpPtr));

6390 break;

6391 }

6392 target.atom = NULL;

6393 target.name = NULL;

6394 target.weakImport = false;

6395 target.addend = 0;

         if ( reloc->r_extern() ) {

                 const macho_nlist<P>& sym = parser.symbolFromIndex(reloc->r_symbolnum());

6398 // use direct reference for local symbols

                 if ( ((sym.n_type() & N_TYPE) == N_SECT) && (((sym.n_type() & N_EXT) == 0) || (parser.nameFromSymbol(sym)[0] == 'L')) ) {

                         parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), target);

6401 target.addend += contentValue;

6402 }

6403 else {

                         target.name = parser.nameFromSymbol(sym);

                         target.weakImport = parser.weakImportFromSymbol(sym);

6406 target.addend = contentValue;

6407 }

6408 // cfstrings should always use direct reference to backing store

                 if ( (this->type() == ld::Section::typeCFString) && (src.offsetInAtom != 0) ) {

                         parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), target);

6411 target.addend = contentValue;

6412 }

6413 }

6414 else {

                 if ( reloc->r_pcrel()  )

                         contentValue += srcAddr + x86_64PcRelOffset(reloc->r_type());

                 parser.findTargetFromAddressAndSectionNum(contentValue, reloc->r_symbolnum(), target);

6418 }

         switch ( reloc->r_type() ) {

6420 case X86_64_RELOC_UNSIGNED:

                         if ( reloc->r_pcrel() )

6422 throw "pcrel and X86_64_RELOC_UNSIGNED not supported";

                         switch ( reloc->r_length() ) {

6424 case 0:

6425 case 1:

6426 throw "length < 2 and X86_64_RELOC_UNSIGNED not supported";

6427 case 2:

                                         parser.addFixups(src, ld::Fixup::kindStoreLittleEndian32, target);

6429 break;

6430 case 3:

                                         parser.addFixups(src, ld::Fixup::kindStoreLittleEndian64, target);

6432 break;

6433 }

6434 break;

6435 case X86_64_RELOC_SIGNED:

6436 case X86_64_RELOC_SIGNED_1:

6437 case X86_64_RELOC_SIGNED_2:

6438 case X86_64_RELOC_SIGNED_4:

                         if ( ! reloc->r_pcrel() )

6440 throw "not pcrel and X86_64_RELOC_SIGNED* not supported";

                         if ( reloc->r_length() != 2 ) 

6442 throw "length != 2 and X86_64_RELOC_SIGNED* not supported";

                         switch ( reloc->r_type() ) {

6444 case X86_64_RELOC_SIGNED:

                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32, target);

6446 break;

6447 case X86_64_RELOC_SIGNED_1:

                                         if ( reloc->r_extern() )

6449 target.addend += 1;

                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32_1, target);

6451 break;

6452 case X86_64_RELOC_SIGNED_2:

                                         if ( reloc->r_extern() )

6454 target.addend += 2;

                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32_2, target);

6456 break;

6457 case X86_64_RELOC_SIGNED_4:

                                         if ( reloc->r_extern() )

6459 target.addend += 4;

                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32_4, target);

6461 break;

6462 }

6463 break;

6464 case X86_64_RELOC_BRANCH:

                         if ( ! reloc->r_pcrel() )

6466 throw "not pcrel and X86_64_RELOC_BRANCH not supported";

                         switch ( reloc->r_length() ) {

6468 case 2:

                                         if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_probe$", 16) == 0) ) {

                                                 parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindStoreX86DtraceCallSiteNop, false, target.name);

                                                 parser.addDtraceExtraInfos(src, &target.name[16]);

6472 }

                                         else if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_isenabled$", 20) == 0) ) {

                                                 parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindStoreX86DtraceIsEnableSiteClear, false, target.name);

                                                 parser.addDtraceExtraInfos(src, &target.name[20]);

6476 }

6477 else {

                                                 parser.addFixups(src, ld::Fixup::kindStoreX86BranchPCRel32, target);

6479 }

6480 break;

6481 case 0:

                                         parser.addFixups(src, ld::Fixup::kindStoreX86BranchPCRel8, target);

6483 break;

6484 default:

                                         throwf("length=%d and X86_64_RELOC_BRANCH not supported", reloc->r_length());

6486 }

6487 break;

6488 case X86_64_RELOC_GOT:

                         if ( ! reloc->r_extern() ) 

6490 throw "not extern and X86_64_RELOC_GOT not supported";

                         if ( ! reloc->r_pcrel() )

6492 throw "not pcrel and X86_64_RELOC_GOT not supported";

                         if ( reloc->r_length() != 2 ) 

6494 throw "length != 2 and X86_64_RELOC_GOT not supported";

                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32GOT, target);

6496 break;

6497 case X86_64_RELOC_GOT_LOAD:

                         if ( ! reloc->r_extern() ) 

6499 throw "not extern and X86_64_RELOC_GOT_LOAD not supported";

                         if ( ! reloc->r_pcrel() )

6501 throw "not pcrel and X86_64_RELOC_GOT_LOAD not supported";

                         if ( reloc->r_length() != 2 ) 

6503 throw "length != 2 and X86_64_RELOC_GOT_LOAD not supported";

                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32GOTLoad, target);

6505 break;

6506 case X86_64_RELOC_SUBTRACTOR:

                         if ( reloc->r_pcrel() )

6508 throw "X86_64_RELOC_SUBTRACTOR cannot be pc-relative";

                         if ( reloc->r_length() < 2 )

6510 throw "X86_64_RELOC_SUBTRACTOR must have r_length of 2 or 3";

                         if ( !reloc->r_extern() )

6512 throw "X86_64_RELOC_SUBTRACTOR must have r_extern=1";

                         if ( nextReloc->r_type() != X86_64_RELOC_UNSIGNED )

6514 throw "X86_64_RELOC_SUBTRACTOR must be followed by X86_64_RELOC_UNSIGNED";

6515 result = true;

                         if ( nextReloc->r_pcrel() )

6517 throw "X86_64_RELOC_UNSIGNED following a X86_64_RELOC_SUBTRACTOR cannot be pc-relative";

                         if ( nextReloc->r_length() != reloc->r_length() )

6519 throw "X86_64_RELOC_UNSIGNED following a X86_64_RELOC_SUBTRACTOR must have same r_length";

                         if ( nextReloc->r_extern() ) {

                                 const macho_nlist<P>& sym = parser.symbolFromIndex(nextReloc->r_symbolnum());

6522 // use direct reference for local symbols

                                 if ( ((sym.n_type() & N_TYPE) == N_SECT) && (((sym.n_type() & N_EXT) == 0) || (parser.nameFromSymbol(sym)[0] == 'L')) ) {

                                         parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), toTarget);

6525 toTarget.addend = contentValue;

6526 useDirectBinding = true;

6527 }

6528 else {

                                         toTarget.name = parser.nameFromSymbol(sym);

                                         toTarget.weakImport = parser.weakImportFromSymbol(sym);

6531 toTarget.addend = contentValue;

6532 useDirectBinding = false;

6533 }

6534 }

6535 else {

                                 parser.findTargetFromAddressAndSectionNum(contentValue, nextReloc->r_symbolnum(), toTarget);

                                 useDirectBinding = (toTarget.atom->scope() == ld::Atom::scopeTranslationUnit) || ((toTarget.atom->combine() == ld::Atom::combineByNameAndContent) || (toTarget.atom->combine() == ld::Atom::combineByNameAndReferences));

6538 }

6539 if ( useDirectBinding ) {

                                 if ( (toTarget.atom->combine() == ld::Atom::combineByNameAndContent) || (toTarget.atom->combine() == ld::Atom::combineByNameAndReferences) )

                                         parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, toTarget.atom);

6542 else

                                         parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, toTarget.atom);

6544 }

6545 else

                                 parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, toTarget.weakImport, toTarget.name);

                         parser.addFixup(src, ld::Fixup::k2of4, ld::Fixup::kindAddAddend, toTarget.addend);

                         if ( target.atom == NULL )

                                 parser.addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindSubtractTargetAddress, false, target.name);

6550 else

                                 parser.addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindSubtractTargetAddress, target.atom);

                         if ( reloc->r_length() == 2 )

                                 parser.addFixup(src, ld::Fixup::k4of4, ld::Fixup::kindStoreLittleEndian32);

6554 else

                                 parser.addFixup(src, ld::Fixup::k4of4, ld::Fixup::kindStoreLittleEndian64);

6556 break;

6557 case X86_64_RELOC_TLV:

                         if ( ! reloc->r_extern() ) 

6559 throw "not extern and X86_64_RELOC_TLV not supported";

                         if ( ! reloc->r_pcrel() )

6561 throw "not pcrel and X86_64_RELOC_TLV not supported";

                         if ( reloc->r_length() != 2 ) 

6563 throw "length != 2 and X86_64_RELOC_TLV not supported";

                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32TLVLoad, target);

6565 break;

6566 default:

                         throwf("unknown relocation type %d", reloc->r_type());

6568 }

6569 return result;

6570 }

6571

6572

6573

6574 template <>

 bool Section<x86>::addRelocFixup(class Parser<x86>& parser, const macho_relocation_info<P>* reloc)

6576 {

         const macho_section<P>* sect = this->machoSection();

6578 uint32_t srcAddr;

6579 const uint8_t* fixUpPtr;

6580 uint32_t contentValue = 0;

         ld::Fixup::Kind kind = ld::Fixup::kindNone;

6582 Parser<x86>::SourceLocation src;

6583 Parser<x86>::TargetDesc target;

6584

         if ( (reloc->r_address() & R_SCATTERED) == 0 ) {

                 srcAddr = sect->addr() + reloc->r_address();

                 src.atom = this->findAtomByAddress(srcAddr);

                 src.offsetInAtom = srcAddr - src.atom->_objAddress;

                 fixUpPtr = file().fileContent() + sect->offset() + reloc->r_address();

                 switch ( reloc->r_type() ) {

6591 case GENERIC_RELOC_VANILLA:

                         switch ( reloc->r_length() ) {

6593 case 0:

                                         contentValue = (int32_t)(int8_t)*fixUpPtr;

                                         if ( reloc->r_pcrel() ) {

                                                 kind = ld::Fixup::kindStoreX86BranchPCRel8;

                                                 contentValue += srcAddr + sizeof(uint8_t);

6598 }

6599 else

6600 throw "r_length=0 and r_pcrel=0 not supported";

6601 break;

6602 case 1:

                                         contentValue = (int32_t)(int16_t)E::get16(*((uint16_t*)fixUpPtr));

                                         if ( reloc->r_pcrel() ) {

                                                 kind = ld::Fixup::kindStoreX86PCRel16;

                                                 contentValue += srcAddr + sizeof(uint16_t);

6607 }

6608 else

                                                 kind = ld::Fixup::kindStoreLittleEndian16;

6610 break;

6611 case 2:

                                         contentValue = E::get32(*((uint32_t*)fixUpPtr));

                                         if ( reloc->r_pcrel() ) {

                                                 kind = ld::Fixup::kindStoreX86BranchPCRel32;

                                                 contentValue += srcAddr + sizeof(uint32_t);

6616 }

6617 else

                                                 kind = ld::Fixup::kindStoreLittleEndian32;

6619 break;

6620 case 3:

6621 throw "r_length=3 not supported";

6622 }

                         if ( reloc->r_extern() ) {

6624 target.atom = NULL;

                                 const macho_nlist<P>& targetSymbol = parser.symbolFromIndex(reloc->r_symbolnum());

                                 target.name = parser.nameFromSymbol(targetSymbol);

                                 target.weakImport = parser.weakImportFromSymbol(targetSymbol);

                                 target.addend = (int32_t)contentValue;

6629 }

6630 else {

                                 parser.findTargetFromAddressAndSectionNum(contentValue, reloc->r_symbolnum(), target);

6632 }

                         if ( (kind == ld::Fixup::kindStoreX86BranchPCRel32) && (target.name != NULL) ) {

                                 if ( strncmp(target.name, "___dtrace_probe$", 16) == 0 ) {

                                         parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindStoreX86DtraceCallSiteNop, false, target.name);

                                         parser.addDtraceExtraInfos(src, &target.name[16]);

6637 return false;

6638 }

                                 else if ( strncmp(target.name, "___dtrace_isenabled$", 20) == 0 ) {

                                         parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindStoreX86DtraceIsEnableSiteClear, false, target.name);

                                         parser.addDtraceExtraInfos(src, &target.name[20]);

6642 return false;

6643 }

6644 }

                         parser.addFixups(src, kind, target);

6646 return false;

6647 break;

6648 case GENERIC_RLEOC_TLV:

6649 {

                                 if ( !reloc->r_extern() )

6651 throw "r_extern=0 and r_type=GENERIC_RLEOC_TLV not supported";

                                 if ( reloc->r_length() != 2 )

6653 throw "r_length!=2 and r_type=GENERIC_RLEOC_TLV not supported";

                                 const macho_nlist<P>& sym = parser.symbolFromIndex(reloc->r_symbolnum());

6655 // use direct reference for local symbols

                                 if ( ((sym.n_type() & N_TYPE) == N_SECT) && ((sym.n_type() & N_EXT) == 0) ) {

                                         parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), target);

6658 }

6659 else {

6660 target.atom = NULL;

                                         target.name = parser.nameFromSymbol(sym);

                                         target.weakImport = parser.weakImportFromSymbol(sym);

6663 }

                                 target.addend = (int64_t)(int32_t)E::get32(*((uint32_t*)fixUpPtr));

                                 if ( reloc->r_pcrel() ) {

                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32TLVLoad, target);

6667 }

6668 else {

                                         parser.addFixups(src, ld::Fixup::kindStoreX86Abs32TLVLoad, target);

6670 }

6671 return false;

6672 }

6673 break;

6674 default:

                         throwf("unsupported i386 relocation type (%d)", reloc->r_type());

6676 }

6677 }

6678 else {

6679 // scattered relocation

                 const macho_scattered_relocation_info<P>* sreloc = (macho_scattered_relocation_info<P>*)reloc;

                 srcAddr = sect->addr() + sreloc->r_address();

                 src.atom = this->findAtomByAddress(srcAddr);

                 assert(src.atom != NULL);

                 src.offsetInAtom = srcAddr - src.atom->_objAddress;

                 fixUpPtr = file().fileContent() + sect->offset() + sreloc->r_address();

                 uint32_t relocValue = sreloc->r_value();

6687 bool result = false;

6688 // file format allows pair to be scattered or not

                 const macho_scattered_relocation_info<P>* nextSReloc = &sreloc[1];

                 const macho_relocation_info<P>* nextReloc = &reloc[1];

6691 bool nextRelocIsPair = false;

6692 uint32_t nextRelocAddress = 0;

6693 uint32_t nextRelocValue = 0;

                 if ( (nextReloc->r_address() & R_SCATTERED) == 0 ) {

                         if ( nextReloc->r_type() == GENERIC_RELOC_PAIR ) {

6696 nextRelocIsPair = true;

6697 nextRelocAddress = nextReloc->r_address();

6698 result = true; // iterator should skip next reloc, since we've consumed it here

6699 }

6700 }

6701 else {

                         if ( nextSReloc->r_type() == GENERIC_RELOC_PAIR ) {

6703 nextRelocIsPair = true;

6704 nextRelocAddress = nextSReloc->r_address();

6705 nextRelocValue = nextSReloc->r_value();

6706 }

6707 }

                 switch (sreloc->r_type()) {

6709 case GENERIC_RELOC_VANILLA:

6710 // with a scattered relocation we get both the target (sreloc->r_value()) and the target+offset (*fixUpPtr)

                                 target.atom = parser.findAtomByAddress(relocValue);

                                 if ( sreloc->r_pcrel() ) {

                                         switch ( sreloc->r_length() ) {

6714 case 0:

                                                         contentValue = srcAddr + 1 + *fixUpPtr;

                                                         target.addend = (int32_t)contentValue - (int32_t)relocValue;

                                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel8, target);

6718 break;

6719 case 1:

                                                         contentValue = srcAddr + 2 + LittleEndian::get16(*((uint16_t*)fixUpPtr));

                                                         target.addend = (int32_t)contentValue - (int32_t)relocValue;

                                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel16, target);

6723 break;

6724 case 2:

                                                         contentValue = srcAddr + 4 + LittleEndian::get32(*((uint32_t*)fixUpPtr));

                                                         target.addend = (int32_t)contentValue - (int32_t)relocValue;

                                                         parser.addFixups(src, ld::Fixup::kindStoreX86PCRel32, target);

6728 break;

6729 case 3:

6730 throw "unsupported r_length=3 for scattered pc-rel vanilla reloc";

6731 break;

6732 }

6733 }

6734 else {

                                         if ( sreloc->r_length() != 2 )

                                                 throwf("unsupported r_length=%d for scattered vanilla reloc", sreloc->r_length());

                                         contentValue = LittleEndian::get32(*((uint32_t*)fixUpPtr));

                                         target.addend = (int32_t)contentValue - (int32_t)(target.atom->objectAddress());

                                         parser.addFixups(src, ld::Fixup::kindStoreLittleEndian32, target);

6740 }

6741 break;

6742 case GENERIC_RELOC_SECTDIFF:

6743 case GENERIC_RELOC_LOCAL_SECTDIFF:

6744 {

6745 if ( !nextRelocIsPair )

6746 throw "GENERIC_RELOC_SECTDIFF missing following pair";

                                         switch ( sreloc->r_length() ) {

6748 case 0:

6749 case 3:

6750 throw "bad length for GENERIC_RELOC_SECTDIFF";

6751 case 1:

                                                         contentValue = (int32_t)(int16_t)LittleEndian::get16(*((uint16_t*)fixUpPtr));

                                                         kind = ld::Fixup::kindStoreLittleEndian16;

6754 break;

6755 case 2:

                                                         contentValue = LittleEndian::get32(*((uint32_t*)fixUpPtr));

                                                         kind = ld::Fixup::kindStoreLittleEndian32;

6758 break;

6759 }

                                         Atom<x86>* fromAtom  = parser.findAtomByAddress(nextRelocValue);

                                         uint32_t offsetInFrom = nextRelocValue - fromAtom->_objAddress;

                                         parser.findTargetFromAddress(sreloc->r_value(), target);

6763 // check for addend encoded in the section content

                                         int64_t addend = (int32_t)contentValue - (int32_t)(sreloc->r_value() - nextRelocValue);

                                         if ( addend < 0 ) {

6766 // switch binding base on coalescing

                                                 if ( target.atom == NULL ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, false, target.name);

6769 }

                                                 else if ( target.atom->scope() == ld::Atom::scopeTranslationUnit ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, target.atom);

6772 }

                                                 else if ( (target.atom->combine() == ld::Atom::combineByNameAndContent) || (target.atom->combine() == ld::Atom::combineByNameAndReferences) ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, target.atom);

6775 }

6776 else {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, false, target.atom->name());

6778 }

                                                 parser.addFixup(src, ld::Fixup::k2of5, ld::Fixup::kindAddAddend, target.addend);

                                                 parser.addFixup(src, ld::Fixup::k3of5, ld::Fixup::kindSubtractTargetAddress, fromAtom);

                                                 parser.addFixup(src, ld::Fixup::k4of5, ld::Fixup::kindSubtractAddend, offsetInFrom-addend);

                                                 parser.addFixup(src, ld::Fixup::k5of5, kind);

6783 }

6784 else {

6785 // switch binding base on coalescing

                                                 if ( target.atom == NULL ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, false, target.name);

6788 }

                                                 else if ( target.atom->scope() == ld::Atom::scopeTranslationUnit ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, target.atom);

6791 }

                                                 else if ( (target.atom->combine() == ld::Atom::combineByNameAndContent) || (target.atom->combine() == ld::Atom::combineByNameAndReferences) ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, target.atom);

6794 }

6795 else {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, false, target.atom->name());

6797 }

                                                 parser.addFixup(src, ld::Fixup::k2of5, ld::Fixup::kindAddAddend, target.addend+addend);

                                                 parser.addFixup(src, ld::Fixup::k3of5, ld::Fixup::kindSubtractTargetAddress, fromAtom);

                                                 parser.addFixup(src, ld::Fixup::k4of5, ld::Fixup::kindSubtractAddend, offsetInFrom);

                                                 parser.addFixup(src, ld::Fixup::k5of5, kind);

6802 }

6803 }

6804 break;

6805 }

6806 return result;

6807 }

6808 }

6811

6814 #if SUPPORT_ARCH_arm_any

6815 template <>

 bool Section<arm>::addRelocFixup(class Parser<arm>& parser, const macho_relocation_info<P>* reloc)

6817 {

         const macho_section<P>* sect = this->machoSection();

6819 bool result = false;

6820 uint32_t srcAddr;

6821 uint32_t dstAddr;

6822 uint32_t* fixUpPtr;

6823 int32_t displacement = 0;

6824 uint32_t instruction = 0;

6825 pint_t contentValue = 0;

6826 Parser<arm>::SourceLocation src;

6827 Parser<arm>::TargetDesc target;

6828 const macho_relocation_info* nextReloc;

6829

         if ( (reloc->r_address() & R_SCATTERED) == 0 ) {

6831 bool externSymbolIsThumbDef = false;

                 srcAddr = sect->addr() + reloc->r_address();

                 src.atom = this->findAtomByAddress(srcAddr);

                 src.offsetInAtom = srcAddr - src.atom->_objAddress;

                 fixUpPtr = (uint32_t*)(file().fileContent() + sect->offset() + reloc->r_address());

                 if ( reloc->r_type() != ARM_RELOC_PAIR )

                         instruction = LittleEndian::get32(*fixUpPtr);

                 if ( reloc->r_extern() ) {

                         const macho_nlist<P>& targetSymbol = parser.symbolFromIndex(reloc->r_symbolnum());

6840 // use direct reference for local symbols

                         if ( ((targetSymbol.n_type() & N_TYPE) == N_SECT) && (((targetSymbol.n_type() & N_EXT) == 0) || (parser.nameFromSymbol(targetSymbol)[0] == 'L')) ) {

                                 parser.findTargetFromAddressAndSectionNum(targetSymbol.n_value(), targetSymbol.n_sect(), target);

6843 }

6844 else {

6845 target.atom = NULL;

                                 target.name = parser.nameFromSymbol(targetSymbol);

                                 target.weakImport = parser.weakImportFromSymbol(targetSymbol);

                                 if ( ((targetSymbol.n_type() & N_TYPE) == N_SECT) &&  (targetSymbol.n_desc() & N_ARM_THUMB_DEF) )

6849 externSymbolIsThumbDef = true;

6850 }

6851 }

                 switch ( reloc->r_type() ) {

6853 case ARM_RELOC_BR24:

6854 // Sign-extend displacement

                                 displacement = (instruction & 0x00FFFFFF) << 2;

                                 if ( (displacement & 0x02000000) != 0 )

6857 displacement |= 0xFC000000;

6858 // The pc added will be +8 from the pc

6859 displacement += 8;

6860 // If this is BLX add H << 1

                                 if ((instruction & 0xFE000000) == 0xFA000000)

                                         displacement += ((instruction & 0x01000000) >> 23);

                                 if ( reloc->r_extern() ) {

6864 dstAddr = srcAddr + displacement;

6865 // <rdar://problem/16652542> support large .o files

                                         if ( srcAddr > 0x2000000 ) {

                                                 dstAddr -= ((srcAddr + 0x1FFFFFF) & 0xFC000000);

6868 }

6869 target.addend = dstAddr;

6870 if ( externSymbolIsThumbDef )

                                                 target.addend &= -2; // remove thumb bit

6872 }

6873 else {

6874 dstAddr = srcAddr + displacement;

                                         parser.findTargetFromAddressAndSectionNum(dstAddr, reloc->r_symbolnum(), target);

6876 }

6877 // special case "calls" for dtrace

                                 if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_probe$", 16) == 0) ) {

                                         parser.addFixup(src, ld::Fixup::k1of1,

                                                                                                                         ld::Fixup::kindStoreARMDtraceCallSiteNop, false, target.name);

                                         parser.addDtraceExtraInfos(src, &target.name[16]);

6882 }

                                 else if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_isenabled$", 20) == 0) ) {

                                         parser.addFixup(src, ld::Fixup::k1of1, 

                                                                                                                         ld::Fixup::kindStoreARMDtraceIsEnableSiteClear, false, target.name);

                                         parser.addDtraceExtraInfos(src, &target.name[20]);

6887 }

6888 else {

                                         parser.addFixups(src, ld::Fixup::kindStoreARMBranch24, target);

6890 }

6891 break;

6892 case ARM_THUMB_RELOC_BR22:

6893 // thumb2 added two more bits to displacement, complicating the displacement decoding

6894 {

                                         uint32_t s = (instruction >> 10) & 0x1;

                                         uint32_t j1 = (instruction >> 29) & 0x1;

                                         uint32_t j2 = (instruction >> 27) & 0x1;

                                         uint32_t imm10 = instruction & 0x3FF;

                                         uint32_t imm11 = (instruction >> 16) & 0x7FF;

6900 uint32_t i1 = (j1 == s);

6901 uint32_t i2 = (j2 == s);

                                         uint32_t dis = (s << 24) | (i1 << 23) | (i2 << 22) | (imm10 << 12) | (imm11 << 1);

6903 int32_t sdis = dis;

6904 if ( s )

6905 sdis |= 0xFE000000;

6906 displacement = sdis;

6907 }

6908 // The pc added will be +4 from the pc

6909 displacement += 4;

6910 // If the instruction was blx, force the low 2 bits to be clear

6911 dstAddr = srcAddr + displacement;

                                 if ((instruction & 0xD0000000) == 0xC0000000)

6913 dstAddr &= 0xFFFFFFFC;

6914

                                 if ( reloc->r_extern() ) {

6916 // <rdar://problem/16652542> support large .o files

                                         if ( srcAddr > 0x1000000 ) {

                                                 dstAddr -= ((srcAddr + 0xFFFFFF) & 0xFE000000);

6919 }

                                         target.addend = (int64_t)(int32_t)dstAddr;

6921 }

6922 else {

                                         parser.findTargetFromAddressAndSectionNum(dstAddr, reloc->r_symbolnum(), target);

6924 }

6925 // special case "calls" for dtrace

                                 if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_probe$", 16) == 0) ) {

                                         parser.addFixup(src, ld::Fixup::k1of1,

                                                                                                                         ld::Fixup::kindStoreThumbDtraceCallSiteNop, false, target.name);

                                         parser.addDtraceExtraInfos(src, &target.name[16]);

6930 }

                                 else if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_isenabled$", 20) == 0) ) {

                                         parser.addFixup(src, ld::Fixup::k1of1, 

                                                                                                                         ld::Fixup::kindStoreThumbDtraceIsEnableSiteClear, false, target.name);

                                         parser.addDtraceExtraInfos(src, &target.name[20]);

6935 }

6936 else {

                                         parser.addFixups(src, ld::Fixup::kindStoreThumbBranch22, target);

6938 }

6939 break;

6940 case ARM_RELOC_VANILLA:

                                 if ( reloc->r_length() != 2 )

6942 throw "bad length for ARM_RELOC_VANILLA";

                                 contentValue = LittleEndian::get32(*fixUpPtr);

                                 if ( reloc->r_extern() ) {

                                         target.addend = (int32_t)contentValue;

6946 if ( externSymbolIsThumbDef )

                                                 target.addend &= -2; // remove thumb bit

6948 }

6949 else {

                                         parser.findTargetFromAddressAndSectionNum(contentValue, reloc->r_symbolnum(), target);

6951 // possible non-extern relocation turned into by-name ref because target is a weak-def

                                         if ( target.atom != NULL ) {

                                                 if ( target.atom->isThumb() )

                                                         target.addend &= -2; // remove thumb bit

6955 // if reference to LSDA, add group subordinate fixup

                                                 if ( target.atom->contentType() == ld::Atom::typeLSDA ) {

6957 Parser<arm>::SourceLocation src2;

6958 src2.atom = src.atom;

6959 src2.offsetInAtom = 0;

                                                         parser.addFixup(src2, ld::Fixup::k1of1, ld::Fixup::kindNoneGroupSubordinateLSDA, target.atom);

6961 }

6962 }

6963 }

                                 parser.addFixups(src, ld::Fixup::kindStoreLittleEndian32, target);

6965 break;

6966 case ARM_THUMB_32BIT_BRANCH:

6967 // silently ignore old unnecessary reloc

6968 break;

6969 case ARM_RELOC_HALF:

6970 nextReloc = &reloc[1];

                                 if ( nextReloc->r_type() == ARM_RELOC_PAIR ) {

6972 uint32_t instruction16;

                                         uint32_t other16 = (nextReloc->r_address() & 0xFFFF);

6974 bool isThumb;

                                         if ( reloc->r_length() & 2 ) {

6976 isThumb = true;

                                                 uint32_t i =    ((instruction & 0x00000400) >> 10);

                                                 uint32_t imm4 =  (instruction & 0x0000000F);

                                                 uint32_t imm3 = ((instruction & 0x70000000) >> 28);

                                                 uint32_t imm8 = ((instruction & 0x00FF0000) >> 16);

                                                 instruction16 = (imm4 << 12) | (i << 11) | (imm3 << 8) | imm8;

6982 }

6983 else {

6984 isThumb = false;

                                                 uint32_t imm4 = ((instruction & 0x000F0000) >> 16);

                                                 uint32_t imm12 = (instruction & 0x00000FFF);

                                                 instruction16 = (imm4 << 12) | imm12;

6988 }

                                         if ( reloc->r_length() & 1 ) {

6990 // high 16

                                                 dstAddr = ((instruction16 << 16) | other16);

                         if ( reloc->r_extern() ) {

6993 target.addend = dstAddr;

6994 if ( externSymbolIsThumbDef )

                                                                 target.addend &= -2; // remove thumb bit

6996 }

6997 else {

                             parser.findTargetFromAddress(dstAddr, target);

                             if ( target.atom->isThumb() )

                                 target.addend &= (-2); // remove thumb bit

7001 }

                                                 parser.addFixups(src, (isThumb ? ld::Fixup::kindStoreThumbHigh16 : ld::Fixup::kindStoreARMHigh16), target);

7003 }

7004 else {

7005 // low 16

                                                 dstAddr = (other16 << 16) | instruction16;

                         if ( reloc->r_extern() ) {

7008 target.addend = dstAddr;

7009 if ( externSymbolIsThumbDef )

                                                                 target.addend &= -2; // remove thumb bit

7011 }

7012 else {

                             parser.findTargetFromAddress(dstAddr, target);

                             if ( target.atom->isThumb() )

                                 target.addend &= (-2); // remove thumb bit

7016 }

                                                 parser.addFixups(src, (isThumb ? ld::Fixup::kindStoreThumbLow16 : ld::Fixup::kindStoreARMLow16), target);

7018 }

7019 result = true;

7020 }

7021 else

7022 throw "for ARM_RELOC_HALF, next reloc is not ARM_RELOC_PAIR";

7023 break;

7024 default:

                                 throwf("unknown relocation type %d", reloc->r_type());

7026 break;

7027 }

7028 }

7029 else {

                 const macho_scattered_relocation_info<P>* sreloc = (macho_scattered_relocation_info<P>*)reloc;

7031 // file format allows pair to be scattered or not

                 const macho_scattered_relocation_info<P>* nextSReloc = &sreloc[1];

7033 nextReloc = &reloc[1];

                 srcAddr = sect->addr() + sreloc->r_address();

7035 dstAddr = sreloc->r_value();

                 fixUpPtr = (uint32_t*)(file().fileContent() + sect->offset() + sreloc->r_address());

                 instruction = LittleEndian::get32(*fixUpPtr);

                 src.atom = this->findAtomByAddress(srcAddr);

                 src.offsetInAtom = srcAddr - src.atom->_objAddress;

7040 bool nextRelocIsPair = false;

7041 uint32_t nextRelocAddress = 0;

7042 uint32_t nextRelocValue = 0;

                 if ( (nextReloc->r_address() & R_SCATTERED) == 0 ) {

                         if ( nextReloc->r_type() == ARM_RELOC_PAIR ) {

7045 nextRelocIsPair = true;

7046 nextRelocAddress = nextReloc->r_address();

7047 result = true;

7048 }

7049 }

7050 else {

                         if ( nextSReloc->r_type() == ARM_RELOC_PAIR ) {

7052 nextRelocIsPair = true;

7053 nextRelocAddress = nextSReloc->r_address();

7054 nextRelocValue = nextSReloc->r_value();

7055 result = true;

7056 }

7057 }

                 switch ( sreloc->r_type() ) {

7059 case ARM_RELOC_VANILLA:

7060 // with a scattered relocation we get both the target (sreloc->r_value()) and the target+offset (*fixUpPtr)

                                 if ( sreloc->r_length() != 2 )

7062 throw "bad length for ARM_RELOC_VANILLA";

                                 target.atom = parser.findAtomByAddress(sreloc->r_value());

                                 if ( target.atom == NULL )

                                         throwf("bad r_value (0x%08X) for ARM_RELOC_VANILLA\n", sreloc->r_value());

                                 contentValue = LittleEndian::get32(*fixUpPtr);

                                 target.addend = contentValue - target.atom->_objAddress;

                                 if ( target.atom->isThumb() )

                                         target.addend &= -2; // remove thumb bit

                                 parser.addFixups(src, ld::Fixup::kindStoreLittleEndian32, target);

7071 break;

7072 case ARM_RELOC_BR24:

7073 // Sign-extend displacement

                                 displacement = (instruction & 0x00FFFFFF) << 2;

                                 if ( (displacement & 0x02000000) != 0 )

7076 displacement |= 0xFC000000;

7077 // The pc added will be +8 from the pc

7078 displacement += 8;

7079 // If this is BLX add H << 1

                                 if ((instruction & 0xFE000000) == 0xFA000000)

                                         displacement += ((instruction & 0x01000000) >> 23);

                                 target.atom = parser.findAtomByAddress(sreloc->r_value());

                                 target.addend = (int64_t)(srcAddr + displacement) - (int64_t)(target.atom->_objAddress);

                                 parser.addFixups(src, ld::Fixup::kindStoreARMBranch24, target);

7085 break;

7086 case ARM_THUMB_RELOC_BR22:

7087 // thumb2 added two more bits to displacement, complicating the displacement decoding

7088 {

                                         uint32_t s = (instruction >> 10) & 0x1;

                                         uint32_t j1 = (instruction >> 29) & 0x1;

                                         uint32_t j2 = (instruction >> 27) & 0x1;

                                         uint32_t imm10 = instruction & 0x3FF;

                                         uint32_t imm11 = (instruction >> 16) & 0x7FF;

7094 uint32_t i1 = (j1 == s);

7095 uint32_t i2 = (j2 == s);

                                         uint32_t dis = (s << 24) | (i1 << 23) | (i2 << 22) | (imm10 << 12) | (imm11 << 1);

7097 int32_t sdis = dis;

7098 if ( s )

7099 sdis |= 0xFE000000;

7100 displacement = sdis;

7101 }

7102 // The pc added will be +4 from the pc

7103 displacement += 4;

7104 dstAddr = srcAddr+displacement;

7105 // If the instruction was blx, force the low 2 bits to be clear

                                 if ((instruction & 0xF8000000) == 0xE8000000)

7107 dstAddr &= 0xFFFFFFFC;

                                 target.atom = parser.findAtomByAddress(sreloc->r_value());

                                 target.addend = dstAddr - target.atom->_objAddress;

                                 parser.addFixups(src, ld::Fixup::kindStoreThumbBranch22, target);

7111 break;

7112 case ARM_RELOC_SECTDIFF:

7113 case ARM_RELOC_LOCAL_SECTDIFF:

7114 {

7115 if ( ! nextRelocIsPair )

7116 throw "ARM_RELOC_SECTDIFF missing following pair";

                                         if ( sreloc->r_length() != 2 )

7118 throw "bad length for ARM_RELOC_SECTDIFF";

                                         contentValue = LittleEndian::get32(*fixUpPtr);

                                         Atom<arm>* fromAtom  = parser.findAtomByAddress(nextRelocValue);

                                         uint32_t offsetInFrom = nextRelocValue - fromAtom->_objAddress;

7122 uint32_t offsetInTarget;

                                         Atom<arm>* targetAtom = parser.findAtomByAddressOrLocalTargetOfStub(sreloc->r_value(), &offsetInTarget);

7124 // check for addend encoded in the section content

                     int64_t addend = (int32_t)contentValue - (int32_t)(sreloc->r_value() - nextRelocValue);

                                         if ( targetAtom->isThumb() )

7127 addend &= -2; // remove thumb bit

7128 // if reference to LSDA, add group subordinate fixup

                                         if ( targetAtom->contentType() == ld::Atom::typeLSDA ) {

7130 Parser<arm>::SourceLocation src2;

7131 src2.atom = src.atom;

7132 src2.offsetInAtom = 0;

                                                 parser.addFixup(src2, ld::Fixup::k1of1, ld::Fixup::kindNoneGroupSubordinateLSDA, targetAtom);

7134 }

                                         if ( addend < 0 ) { 

7136 // switch binding base on coalescing

                                                 if ( targetAtom->scope() == ld::Atom::scopeTranslationUnit ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, targetAtom);

7139 }

                                                 else if ( (targetAtom->combine() == ld::Atom::combineByNameAndContent) || (targetAtom->combine() == ld::Atom::combineByNameAndReferences) ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, targetAtom);

7142 }

7143 else {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, false, targetAtom->name());

7145 }

                                                 parser.addFixup(src, ld::Fixup::k2of5, ld::Fixup::kindAddAddend, offsetInTarget);

                                                 parser.addFixup(src, ld::Fixup::k3of5, ld::Fixup::kindSubtractTargetAddress, fromAtom);

                                                 parser.addFixup(src, ld::Fixup::k4of5, ld::Fixup::kindSubtractAddend, offsetInFrom-addend);

                                                 parser.addFixup(src, ld::Fixup::k5of5, ld::Fixup::kindStoreLittleEndian32);

7150 }

7151 else {

                                                 if ( targetAtom->scope() == ld::Atom::scopeTranslationUnit ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, targetAtom);

7154 }

                                                 else if ( (targetAtom->combine() == ld::Atom::combineByNameAndContent) || (targetAtom->combine() == ld::Atom::combineByNameAndReferences) ) {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, targetAtom);

7157 }

7158 else {

                                                         parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, false, targetAtom->name());

7160 }

                                                 parser.addFixup(src, ld::Fixup::k2of5, ld::Fixup::kindAddAddend, (uint32_t)(offsetInTarget+addend));

                                                 parser.addFixup(src, ld::Fixup::k3of5, ld::Fixup::kindSubtractTargetAddress, fromAtom);

                                                 parser.addFixup(src, ld::Fixup::k4of5, ld::Fixup::kindSubtractAddend, offsetInFrom);

                                                 parser.addFixup(src, ld::Fixup::k5of5, ld::Fixup::kindStoreLittleEndian32);

7165 }

7166 }

7167 break;

7168 case ARM_RELOC_HALF_SECTDIFF:

7169 if ( nextRelocIsPair ) {

                                         instruction = LittleEndian::get32(*fixUpPtr);

                                         Atom<arm>* fromAtom  = parser.findAtomByAddress(nextRelocValue);

                                         uint32_t offsetInFrom = nextRelocValue - fromAtom->_objAddress;

                                         Atom<arm>* targetAtom  = parser.findAtomByAddress(sreloc->r_value());

                                         uint32_t offsetInTarget = sreloc->r_value() - targetAtom->_objAddress;

7175 uint32_t instruction16;

                                         uint32_t other16 = (nextRelocAddress & 0xFFFF);

7177 bool isThumb;

                                         if ( sreloc->r_length() & 2 ) {

7179 isThumb = true;

                                                 uint32_t i =    ((instruction & 0x00000400) >> 10);

                                                 uint32_t imm4 =  (instruction & 0x0000000F);

                                                 uint32_t imm3 = ((instruction & 0x70000000) >> 28);

                                                 uint32_t imm8 = ((instruction & 0x00FF0000) >> 16);

                                                 instruction16 = (imm4 << 12) | (i << 11) | (imm3 << 8) | imm8;

7185 }

7186 else {

7187 isThumb = false;

                                                 uint32_t imm4 = ((instruction & 0x000F0000) >> 16);

                                                 uint32_t imm12 = (instruction & 0x00000FFF);

                                                 instruction16 = (imm4 << 12) | imm12;

7191 }

                                         if ( sreloc->r_length() & 1 )

                                                 dstAddr = ((instruction16 << 16) | other16);

7194 else

                                                 dstAddr = (other16 << 16) | instruction16;

                                         if ( targetAtom->isThumb() )

7197 dstAddr &= (-2); // remove thumb bit

                     int32_t addend = dstAddr - (sreloc->r_value() - nextRelocValue);

                                         if ( targetAtom->scope() == ld::Atom::scopeTranslationUnit ) {

                                                 parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, targetAtom);

7201 }

                                         else if ( (targetAtom->combine() == ld::Atom::combineByNameAndContent) || (targetAtom->combine() == ld::Atom::combineByNameAndReferences) ) {

                                                 parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, targetAtom);

7204 }

7205 else {

                                                 parser.addFixup(src, ld::Fixup::k1of5, ld::Fixup::kindSetTargetAddress, false, targetAtom->name());

7207 }

                                         parser.addFixup(src, ld::Fixup::k2of5, ld::Fixup::kindAddAddend, (uint32_t)offsetInTarget+addend);

                                         parser.addFixup(src, ld::Fixup::k3of5, ld::Fixup::kindSubtractTargetAddress, fromAtom);

                                         parser.addFixup(src, ld::Fixup::k4of5, ld::Fixup::kindSubtractAddend, offsetInFrom);

                                         if ( sreloc->r_length() & 1 ) {

7212 // high 16

                                                 parser.addFixup(src, ld::Fixup::k5of5, (isThumb ? ld::Fixup::kindStoreThumbHigh16 : ld::Fixup::kindStoreARMHigh16));

7214 }

7215 else {

7216 // low 16

                                                 parser.addFixup(src, ld::Fixup::k5of5, (isThumb ? ld::Fixup::kindStoreThumbLow16 : ld::Fixup::kindStoreARMLow16));

7218 }

7219 result = true;

7220 }

7221 else

7222 throw "ARM_RELOC_HALF_SECTDIFF reloc missing following pair";

7223 break;

7224 case ARM_RELOC_HALF:

7225 if ( nextRelocIsPair ) {

                                         instruction = LittleEndian::get32(*fixUpPtr);

                                         Atom<arm>* targetAtom  = parser.findAtomByAddress(sreloc->r_value());

7228 uint32_t instruction16;

                                         uint32_t other16 = (nextRelocAddress & 0xFFFF);

7230 bool isThumb;

                                         if ( sreloc->r_length() & 2 ) {

7232 isThumb = true;

                                                 uint32_t i =    ((instruction & 0x00000400) >> 10);

                                                 uint32_t imm4 =  (instruction & 0x0000000F);

                                                 uint32_t imm3 = ((instruction & 0x70000000) >> 28);

                                                 uint32_t imm8 = ((instruction & 0x00FF0000) >> 16);

                                                 instruction16 = (imm4 << 12) | (i << 11) | (imm3 << 8) | imm8;

7238 }

7239 else {

7240 isThumb = false;

                                                 uint32_t imm4 = ((instruction & 0x000F0000) >> 16);

                                                 uint32_t imm12 = (instruction & 0x00000FFF);

                                                 instruction16 = (imm4 << 12) | imm12;

7244 }

                                         if ( sreloc->r_length() & 1 )

                                                 dstAddr = ((instruction16 << 16) | other16);

7247 else

                                                 dstAddr = (other16 << 16) | instruction16;

                                         if ( targetAtom->scope() == ld::Atom::scopeTranslationUnit ) {

                                                 parser.addFixup(src, ld::Fixup::k1of3, ld::Fixup::kindSetTargetAddress, targetAtom);

7251 }

                                         else if ( (targetAtom->combine() == ld::Atom::combineByNameAndContent) || (targetAtom->combine() == ld::Atom::combineByNameAndReferences) ) {

                                                 parser.addFixup(src, ld::Fixup::k1of3, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, targetAtom);

7254 }

7255 else {

                                                 parser.addFixup(src, ld::Fixup::k1of3, ld::Fixup::kindSetTargetAddress, false, targetAtom->name());

7257 }

                                         parser.addFixup(src, ld::Fixup::k2of3, ld::Fixup::kindAddAddend, dstAddr - targetAtom->_objAddress);

                                         if ( sreloc->r_length() & 1 ) {

7260 // high 16

                                                 parser.addFixup(src, ld::Fixup::k3of3, (isThumb ? ld::Fixup::kindStoreThumbHigh16 : ld::Fixup::kindStoreARMHigh16));

7262 }

7263 else {

7264 // low 16

                                                 parser.addFixup(src, ld::Fixup::k3of3, (isThumb ? ld::Fixup::kindStoreThumbLow16 : ld::Fixup::kindStoreARMLow16));

7266 }

7267 result = true;

7268 }

7269 else

7270 throw "scattered ARM_RELOC_HALF reloc missing following pair";

7271 break;

7272 default:

                                 throwf("unknown ARM scattered relocation type %d", sreloc->r_type());

7274 }

7275 }

7276 return result;

7277 }

7278 #endif

7279

7280

7281 #if SUPPORT_ARCH_arm64

7282 template <>

 bool Section<arm64>::addRelocFixup(class Parser<arm64>& parser, const macho_relocation_info<P>* reloc)

7284 {

7285 bool result = false;

7286 Parser<arm64>::SourceLocation src;

         Parser<arm64>::TargetDesc               target = { NULL, NULL, false, 0 };

7288 Parser<arm64>::TargetDesc toTarget;

7289 int32_t prefixRelocAddend = 0;

         if ( reloc->r_type() == ARM64_RELOC_ADDEND ) {

                 uint32_t rawAddend = reloc->r_symbolnum(); 

7292 prefixRelocAddend = rawAddend;

                 if ( rawAddend & 0x00800000 )

7294 prefixRelocAddend |= 0xFF000000; // sign extend 24-bit signed int to 32-bits

                 uint32_t addendAddress = reloc->r_address();

7296 ++reloc; //advance to next reloc record

7297 result = true;

                 if ( reloc->r_address() != addendAddress )

7299 throw "ARM64_RELOC_ADDEND r_address does not match next reloc's r_address";

7300 }

         const macho_section<P>* sect = this->machoSection();

         uint64_t srcAddr = sect->addr() + reloc->r_address();

         src.atom = this->findAtomByAddress(srcAddr);

         src.offsetInAtom = srcAddr - src.atom->_objAddress;

         const uint8_t* fixUpPtr = file().fileContent() + sect->offset() + reloc->r_address();

7306 uint64_t contentValue = 0;

         const macho_relocation_info<arm64::P>* nextReloc = &reloc[1];

7308 bool useDirectBinding;

7309 uint32_t instruction;

7310 uint32_t encodedAddend;

         switch ( reloc->r_length() ) {

7312 case 0:

7313 contentValue = *fixUpPtr;

7314 break;

7315 case 1:

                         contentValue = (int64_t)(int16_t)E::get16(*((uint16_t*)fixUpPtr));

7317 break;

7318 case 2:

                         contentValue = (int64_t)(int32_t)E::get32(*((uint32_t*)fixUpPtr));

7320 break;

7321 case 3:

                         contentValue = E::get64(*((uint64_t*)fixUpPtr));

7323 break;

7324 }

         if ( reloc->r_extern() ) {

                 const macho_nlist<P>& sym = parser.symbolFromIndex(reloc->r_symbolnum());

                 const char* symbolName = parser.nameFromSymbol(sym);

                 if ( ((sym.n_type() & N_TYPE) == N_SECT) && (((sym.n_type() & N_EXT) == 0) || (symbolName[0] == 'L') || (symbolName[0] == 'l')) ) {

7329 // use direct reference for local symbols

                         parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), target);

7331 //target.addend += contentValue;

7332 }

                 else if ( ((sym.n_type() & N_TYPE) == N_SECT) && (src.atom->_objAddress <= sym.n_value()) && (sym.n_value() < (src.atom->_objAddress+src.atom->size())) ) {

7334 // <rdar://problem/13700961> spurious warning when weak function has reference to itself

7335 // use direct reference when atom targets itself

7336 target.atom = src.atom;

7337 target.name = NULL;

7338 }

7339 else {

7340 target.name = symbolName;

                         target.weakImport = parser.weakImportFromSymbol(sym);

7342 //target.addend = contentValue;

7343 }

7344 // cfstrings should always use direct reference to backing store

                 if ( (this->type() == ld::Section::typeCFString) && (src.offsetInAtom != 0) ) {

                         parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), target);

7347 //target.addend = contentValue;

7348 }

7349 }

7350 else {

                 if ( reloc->r_pcrel()  )

7352 contentValue += srcAddr;

                 parser.findTargetFromAddressAndSectionNum(contentValue, reloc->r_symbolnum(), target);

7354 }

         switch ( reloc->r_type() ) {

7356 case ARM64_RELOC_UNSIGNED:

                         if ( reloc->r_pcrel() )

7358 throw "pcrel and ARM64_RELOC_UNSIGNED not supported";

                         if ( reloc->r_extern() )

7360 target.addend = contentValue;

                         switch ( reloc->r_length() ) {

7362 case 0:

7363 case 1:

7364 throw "length < 2 and ARM64_RELOC_UNSIGNED not supported";

7365 case 2:

                                         parser.addFixups(src, ld::Fixup::kindStoreLittleEndian32, target);

7367 break;

7368 case 3:

                                         parser.addFixups(src, ld::Fixup::kindStoreLittleEndian64, target);

7370 break;

7371 }

7372 break;

7373 case ARM64_RELOC_BRANCH26:

                         if ( ! reloc->r_pcrel() )

7375 throw "not pcrel and ARM64_RELOC_BRANCH26 not supported";

                         if ( ! reloc->r_extern() ) 

7377 throw "r_extern == 0 and ARM64_RELOC_BRANCH26 not supported";

                         if ( reloc->r_length() != 2 )

7379 throw "r_length != 2 and ARM64_RELOC_BRANCH26 not supported";

                         if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_probe$", 16) == 0) ) {

                                 parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindStoreARM64DtraceCallSiteNop, false, target.name);

                                 parser.addDtraceExtraInfos(src, &target.name[16]);

7383 }

                         else if ( (target.name != NULL) && (strncmp(target.name, "___dtrace_isenabled$", 20) == 0) ) {

                                 parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindStoreARM64DtraceIsEnableSiteClear, false, target.name);

                                 parser.addDtraceExtraInfos(src, &target.name[20]);

7387 }

7388 else {

7389 target.addend = prefixRelocAddend;

7390 instruction = contentValue;

                                 encodedAddend = (instruction & 0x03FFFFFF) << 2;

                                 if ( encodedAddend != 0 ) {

                                         if ( prefixRelocAddend == 0 ) {

                                                 warning("branch26 instruction at 0x%08X has embedded addend. ARM64_RELOC_ADDEND should be used instead", reloc->r_address());

7395 target.addend = encodedAddend;

7396 }

7397 else {

                                                 throwf("branch26 instruction at 0x%08X has embedded addend and ARM64_RELOC_ADDEND also used", reloc->r_address());

7399 }

7400 }

                                 parser.addFixups(src, ld::Fixup::kindStoreARM64Branch26, target);

7402 }

7403 break;

7404 case ARM64_RELOC_PAGE21:

                         if ( ! reloc->r_pcrel() )

7406 throw "not pcrel and ARM64_RELOC_PAGE21 not supported";

                         if ( ! reloc->r_extern() ) 

7408 throw "r_extern == 0 and ARM64_RELOC_PAGE21 not supported";

                         if ( reloc->r_length() != 2 ) 

7410 throw "length != 2 and ARM64_RELOC_PAGE21 not supported";

7411 target.addend = prefixRelocAddend;

7412 instruction = contentValue;

                         encodedAddend  = ((instruction & 0x60000000) >> 29) | ((instruction & 0x01FFFFE0) >> 3);

7414 encodedAddend *= 4096; // internally addend is in bytes, so scale

                         if ( encodedAddend != 0 ) {

                                 if ( prefixRelocAddend == 0 ) {

                                         warning("adrp instruction at 0x%08X has embedded addend. ARM64_RELOC_ADDEND should be used instead", reloc->r_address());

7418 target.addend = encodedAddend;

7419 }

7420 else {

                                         throwf("adrp instruction at 0x%08X has embedded addend and ARM64_RELOC_ADDEND also used", reloc->r_address());

7422 }

7423 }

                         parser.addFixups(src, ld::Fixup::kindStoreARM64Page21, target);

7425 break;

7426 case ARM64_RELOC_PAGEOFF12:

                         if ( reloc->r_pcrel() )

7428 throw "pcrel and ARM64_RELOC_PAGEOFF12 not supported";

                         if ( ! reloc->r_extern() ) 

7430 throw "r_extern == 0 and ARM64_RELOC_PAGEOFF12 not supported";

                         if ( reloc->r_length() != 2 ) 

7432 throw "length != 2 and ARM64_RELOC_PAGEOFF12 not supported";

7433 target.addend = prefixRelocAddend;

7434 instruction = contentValue;

                         encodedAddend = ((instruction & 0x003FFC00) >> 10);

7436 // internally addend is in bytes. Some instructions have an implicit scale factor

             if ( (instruction & 0x3B000000) == 0x39000000 ) {

                 switch ( instruction & 0xC0000000 ) {

7439 case 0x00000000:

7440 break;

7441 case 0x40000000:

7442 encodedAddend *= 2;

7443 break;

7444 case 0x80000000:

7445 encodedAddend *= 4;

7446 break;

7447 case 0xC0000000:

7448 encodedAddend *= 8;

7449 break;

7450 }

7451 }

                         if ( encodedAddend != 0 ) {

                                 if ( prefixRelocAddend == 0 ) {

                                         warning("pageoff12 instruction at 0x%08X has embedded addend. ARM64_RELOC_ADDEND should be used instead", reloc->r_address());

7455 target.addend = encodedAddend;

7456 }

7457 else {

                                         throwf("pageoff12 instruction at 0x%08X has embedded addend and ARM64_RELOC_ADDEND also used", reloc->r_address());

7459 }

7460 }

                         parser.addFixups(src, ld::Fixup::kindStoreARM64PageOff12, target);

7462 break;

7463 case ARM64_RELOC_GOT_LOAD_PAGE21:

                         if ( ! reloc->r_pcrel() )

7465 throw "not pcrel and ARM64_RELOC_GOT_LOAD_PAGE21 not supported";

                         if ( ! reloc->r_extern() ) 

7467 throw "r_extern == 0 and ARM64_RELOC_GOT_LOAD_PAGE21 not supported";

                         if ( reloc->r_length() != 2 ) 

7469 throw "length != 2 and ARM64_RELOC_GOT_LOAD_PAGE21 not supported";

                         if ( prefixRelocAddend != 0 )

7471 throw "ARM64_RELOC_ADDEND followed by ARM64_RELOC_GOT_LOAD_PAGE21 not supported";

7472 instruction = contentValue;

                         target.addend = ((instruction & 0x60000000) >> 29) | ((instruction & 0x01FFFFE0) >> 3);

             if ( target.addend != 0 )

7475 throw "non-zero addend with ARM64_RELOC_GOT_LOAD_PAGE21 is not supported";

                         parser.addFixups(src, ld::Fixup::kindStoreARM64GOTLoadPage21, target);

7477 break;

7478 case ARM64_RELOC_GOT_LOAD_PAGEOFF12:

                         if ( reloc->r_pcrel() )

7480 throw "pcrel and ARM64_RELOC_GOT_LOAD_PAGEOFF12 not supported";

                         if ( ! reloc->r_extern() ) 

7482 throw "r_extern == 0 and ARM64_RELOC_GOT_LOAD_PAGEOFF12 not supported";

                         if ( reloc->r_length() != 2 ) 

7484 throw "length != 2 and ARM64_RELOC_GOT_LOAD_PAGEOFF12 not supported";

                         if ( prefixRelocAddend != 0 )

7486 throw "ARM64_RELOC_ADDEND followed by ARM64_RELOC_GOT_LOAD_PAGEOFF12 not supported";

7487 instruction = contentValue;

                         target.addend = ((instruction & 0x003FFC00) >> 10);

                         parser.addFixups(src, ld::Fixup::kindStoreARM64GOTLoadPageOff12, target);

7490 break;

7491 case ARM64_RELOC_TLVP_LOAD_PAGE21:

                         if ( ! reloc->r_pcrel() )

7493 throw "not pcrel and ARM64_RELOC_TLVP_LOAD_PAGE21 not supported";

                         if ( ! reloc->r_extern() ) 

7495 throw "r_extern == 0 and ARM64_RELOC_TLVP_LOAD_PAGE21 not supported";

                         if ( reloc->r_length() != 2 ) 

7497 throw "length != 2 and ARM64_RELOC_TLVP_LOAD_PAGE21 not supported";

                         if ( prefixRelocAddend != 0 )

7499 throw "ARM64_RELOC_ADDEND followed by ARM64_RELOC_TLVP_LOAD_PAGE21 not supported";

7500 instruction = contentValue;

                         target.addend = ((instruction & 0x60000000) >> 29) | ((instruction & 0x01FFFFE0) >> 3);

             if ( target.addend != 0 )

7503 throw "non-zero addend with ARM64_RELOC_GOT_LOAD_PAGE21 is not supported";

                         parser.addFixups(src, ld::Fixup::kindStoreARM64TLVPLoadPage21, target);

7505 break;

7506 case ARM64_RELOC_TLVP_LOAD_PAGEOFF12:

                         if ( reloc->r_pcrel() )

7508 throw "pcrel and ARM64_RELOC_TLVP_LOAD_PAGEOFF12 not supported";

                         if ( ! reloc->r_extern() ) 

7510 throw "r_extern == 0 and ARM64_RELOC_TLVP_LOAD_PAGEOFF12 not supported";

                         if ( reloc->r_length() != 2 ) 

7512 throw "length != 2 and ARM64_RELOC_TLVP_LOAD_PAGEOFF12 not supported";

                         if ( prefixRelocAddend != 0 )

7514 throw "ARM64_RELOC_ADDEND followed by ARM64_RELOC_TLVP_LOAD_PAGEOFF12 not supported";

7515 instruction = contentValue;

                         target.addend = ((instruction & 0x003FFC00) >> 10);

                         parser.addFixups(src, ld::Fixup::kindStoreARM64TLVPLoadPageOff12, target);

7518 break;

7519 case ARM64_RELOC_SUBTRACTOR:

                         if ( reloc->r_pcrel() )

7521 throw "ARM64_RELOC_SUBTRACTOR cannot be pc-relative";

                         if ( reloc->r_length() < 2 )

7523 throw "ARM64_RELOC_SUBTRACTOR must have r_length of 2 or 3";

                         if ( !reloc->r_extern() )

7525 throw "ARM64_RELOC_SUBTRACTOR must have r_extern=1";

                         if ( nextReloc->r_type() != ARM64_RELOC_UNSIGNED )

7527 throw "ARM64_RELOC_SUBTRACTOR must be followed by ARM64_RELOC_UNSIGNED";

                         if ( prefixRelocAddend != 0 )

7529 throw "ARM64_RELOC_ADDEND followed by ARM64_RELOC_SUBTRACTOR not supported";

7530 result = true;

                         if ( nextReloc->r_pcrel() )

7532 throw "ARM64_RELOC_UNSIGNED following a ARM64_RELOC_SUBTRACTOR cannot be pc-relative";

                         if ( nextReloc->r_length() != reloc->r_length() )

7534 throw "ARM64_RELOC_UNSIGNED following a ARM64_RELOC_SUBTRACTOR must have same r_length";

                         if ( nextReloc->r_extern() ) {

                                 const macho_nlist<P>& sym = parser.symbolFromIndex(nextReloc->r_symbolnum());

7537 // use direct reference for local symbols

                                 if ( ((sym.n_type() & N_TYPE) == N_SECT) && (((sym.n_type() & N_EXT) == 0) || (parser.nameFromSymbol(sym)[0] == 'L')) ) {

                                         parser.findTargetFromAddressAndSectionNum(sym.n_value(), sym.n_sect(), toTarget);

7540 toTarget.addend = contentValue;

7541 useDirectBinding = true;

7542 }

7543 else {

                                         toTarget.name = parser.nameFromSymbol(sym);

                                         toTarget.weakImport = parser.weakImportFromSymbol(sym);

7546 toTarget.addend = contentValue;

7547 useDirectBinding = false;

7548 }

7549 }

7550 else {

                                 parser.findTargetFromAddressAndSectionNum(contentValue, nextReloc->r_symbolnum(), toTarget);

                                 useDirectBinding = (toTarget.atom->scope() == ld::Atom::scopeTranslationUnit);

7553 }

7554 if ( useDirectBinding ) {

                                 if ( (toTarget.atom->combine() == ld::Atom::combineByNameAndContent) || (toTarget.atom->combine() == ld::Atom::combineByNameAndReferences) )

                                         parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, ld::Fixup::bindingByContentBound, toTarget.atom);

7557 else

                                         parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, toTarget.atom);

7559 }

7560 else

                                 parser.addFixup(src, ld::Fixup::k1of4, ld::Fixup::kindSetTargetAddress, toTarget.weakImport, toTarget.name);

                         parser.addFixup(src, ld::Fixup::k2of4, ld::Fixup::kindAddAddend, toTarget.addend);

                         if ( target.atom == NULL )

                                 parser.addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindSubtractTargetAddress, false, target.name);

7565 else

                                 parser.addFixup(src, ld::Fixup::k3of4, ld::Fixup::kindSubtractTargetAddress, target.atom);

                         if ( reloc->r_length() == 2 )

                                 parser.addFixup(src, ld::Fixup::k4of4, ld::Fixup::kindStoreLittleEndian32);

7569 else

                                 parser.addFixup(src, ld::Fixup::k4of4, ld::Fixup::kindStoreLittleEndian64);

7571 break;

7572 case ARM64_RELOC_POINTER_TO_GOT:

                         if ( ! reloc->r_extern() ) 

7574 throw "r_extern == 0 and ARM64_RELOC_POINTER_TO_GOT not supported";

                         if ( prefixRelocAddend != 0 )

7576 throw "ARM64_RELOC_ADDEND followed by ARM64_RELOC_POINTER_TO_GOT not supported";

                         if ( reloc->r_pcrel() ) {

                 if ( reloc->r_length() != 2 ) 

7579 throw "r_length != 2 and r_extern = 1 and ARM64_RELOC_POINTER_TO_GOT not supported";

                 parser.addFixups(src, ld::Fixup::kindStoreARM64PCRelToGOT, target);

7581 }

7582 else {

                 if ( reloc->r_length() != 3 ) 

7584 throw "r_length != 3 and r_extern = 0 and ARM64_RELOC_POINTER_TO_GOT not supported";

                 parser.addFixups(src, ld::Fixup::kindStoreARM64PointerToGOT, target);

7586 }

7587 break;

7588 #if SUPPORT_ARCH_arm64e

7589 case ARM64_RELOC_AUTHENTICATED_POINTER: {

                         if ( reloc->r_pcrel() )

7591 throw "pcrel and ARM64_RELOC_AUTHENTICATED_POINTER not supported";

                         if ( ! reloc->r_extern() )

7593 throw "r_extern == 0 and ARM64_RELOC_AUTHENTICATED_POINTER not supported";

7594 // An authenticated pointer is:

7595 // {

7596 // int32_t addend;

7597 // uint16_t diversityData;

7598 // uint16_t hasAddressDiversity : 1;

7599 // uint16_t key : 2;

7600 // uint16_t zeroes : 11;

7601 // uint16_t zero : 1;

7602 // uint16_t authenticated : 1;

7603 // }

                         target.addend = (int32_t)(contentValue & 0xFFFFFFFF);

7605 if (parser._supportsAuthenticatedPointers) {

                                 target.authData.discriminator = (uint16_t)(contentValue >> 32);

                                 target.authData.hasAddressDiversity = (contentValue & (1ULL << 48)) != 0;

                                 target.authData.key = (ld::Fixup::AuthData::ptrauth_key)((contentValue >> 49) & 0x3);

7609 } else {

7610 static bool emittedWarning = false;

7611 if (!emittedWarning) {

7612 emittedWarning = true;

7613 warning("stripping authenticated relocation as image uses -preload or -static");

7614 }

7615 }

                         bool isAuthenticated = (contentValue & (1ULL << 63)) != 0;

7617 if (!isAuthenticated)

7618 throw "ARM64_RELOC_AUTHENTICATED_POINTER value must have authenticated bit set";

                         switch ( reloc->r_length() ) {

7620 case 0:

7621 case 1:

7622 case 2:

7623 throw "length < 3 and ARM64_RELOC_AUTHENTICATED_POINTER not supported";

7624 case 3:

7625 if (parser._supportsAuthenticatedPointers)

                                                 parser.addFixups(src, ld::Fixup::kindStoreLittleEndianAuth64, target);

7627 else

                                                 parser.addFixups(src, ld::Fixup::kindStoreLittleEndian64, target);

7629 break;

7630 }

7631 break;

7632 }

7633 #endif

7634 default:

                         throwf("unknown relocation type %d", reloc->r_type());

7636 }

7637 return result;

7638 }

7639 #endif

7640

7641

7642 template <typename A>

 bool ObjC1ClassSection<A>::addRelocFixup(class Parser<A>& parser, const macho_relocation_info<P>* reloc)

7644 {

7645 // inherited

         FixedSizeSection<A>::addRelocFixup(parser, reloc);

7647

         assert(0 && "needs template specialization");

7649 return false;

7650 }

7651

7652 template <>

 bool ObjC1ClassSection<x86>::addRelocFixup(class Parser<x86>& parser, const macho_relocation_info<x86::P>* reloc)

7654 {

7655 // if this is the reloc for the super class name string, add implicit reference to super class

         if ( ((reloc->r_address() & R_SCATTERED) == 0) && (reloc->r_type() == GENERIC_RELOC_VANILLA) ) {

                 assert( reloc->r_length() == 2 );

                 assert( ! reloc->r_pcrel() );

7659

                 const macho_section<P>* sect = this->machoSection();

7661 Parser<x86>::SourceLocation src;

                 uint32_t srcAddr = sect->addr() + reloc->r_address();

                 src.atom = this->findAtomByAddress(srcAddr);

                 src.offsetInAtom = srcAddr - src.atom->objectAddress();

                 if ( src.offsetInAtom == 4 ) {

7666 Parser<x86>::TargetDesc stringTarget;

                         const uint8_t* fixUpPtr = file().fileContent() + sect->offset() + reloc->r_address();

                         uint32_t contentValue = LittleEndian::get32(*((uint32_t*)fixUpPtr));

                         parser.findTargetFromAddressAndSectionNum(contentValue, reloc->r_symbolnum(), stringTarget);

7670

                         assert(stringTarget.atom != NULL);

                         assert(stringTarget.atom->contentType() == ld::Atom::typeCString);

                         const char* superClassBaseName = (char*)stringTarget.atom->rawContentPointer();

                         char* superClassName = new char[strlen(superClassBaseName) + 20];

                         strcpy(superClassName, ".objc_class_name_");

7676 strcat(superClassName, superClassBaseName);

7677

                         parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindSetTargetAddress, false, superClassName);

7679 }

7680 }

7681 // inherited

         return FixedSizeSection<x86>::addRelocFixup(parser, reloc);

7683 }

7684

7685

7686

7687 template <typename A>

 bool Objc1ClassReferences<A>::addRelocFixup(class Parser<A>& parser, const macho_relocation_info<P>* reloc)

7689 {

7690 // inherited

         PointerToCStringSection<A>::addRelocFixup(parser, reloc);

7692

         assert(0 && "needs template specialization");

7694 return false;

7695 }

7696

7697

7698

7699 template <>

 bool Objc1ClassReferences<x86>::addRelocFixup(class Parser<x86>& parser, const macho_relocation_info<x86::P>* reloc)

7701 {

7702 // add implict class refs, fixups not usable yet, so look at relocations

         assert( (reloc->r_address() & R_SCATTERED) == 0 );

         assert( reloc->r_type() == GENERIC_RELOC_VANILLA );

         assert( reloc->r_length() == 2 );

         assert( ! reloc->r_pcrel() );

7707

         const macho_section<P>* sect = this->machoSection();

7709 Parser<x86>::SourceLocation src;

         uint32_t srcAddr = sect->addr() + reloc->r_address();

         src.atom = this->findAtomByAddress(srcAddr);

         src.offsetInAtom = srcAddr - src.atom->objectAddress();

7713 Parser<x86>::TargetDesc stringTarget;

         const uint8_t* fixUpPtr = file().fileContent() + sect->offset() + reloc->r_address();

         uint32_t contentValue = LittleEndian::get32(*((uint32_t*)fixUpPtr));

         parser.findTargetFromAddressAndSectionNum(contentValue, reloc->r_symbolnum(), stringTarget);

7717

         assert(stringTarget.atom != NULL);

         assert(stringTarget.atom->contentType() == ld::Atom::typeCString);

         const char* baseClassName = (char*)stringTarget.atom->rawContentPointer();

         char* objcClassName = new char[strlen(baseClassName) + 20];

         strcpy(objcClassName, ".objc_class_name_");

7723 strcat(objcClassName, baseClassName);

7724

         parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindSetTargetAddress, false, objcClassName);

7726

7727 // inherited

         return PointerToCStringSection<x86>::addRelocFixup(parser, reloc);

7729 }

7730

#if SUPPORT_ARCH_arm64
//
// Converts one arm64 Linker Optimization Hint into a
// ld::Fixup::kindLinkerOptimizationHint fixup.
//
//   parser - parser that owns the atoms and receives the fixup
//   kind   - LOH_ARM64_* kind of the hint
//   count  - number of valid entries in addrs[]
//   addrs  - addresses of the instructions the hint refers to
//
// The hint is dropped (with a warning where the original code warned) when
// its addresses are not all inside one atom, are not 4-byte aligned, or are
// more than 0xFFFF bytes above the lowest address.  Hints with fewer than
// one or more than four addresses are dropped as well, because addrs[0] is
// always read and only delta1..delta4 can be encoded.
//
template <>
void Section<arm64>::addLOH(class Parser<arm64>& parser, int kind, int count, const uint64_t addrs[]) {
	switch (kind) {
		case LOH_ARM64_ADRP_ADRP:
		case LOH_ARM64_ADRP_LDR:
		case LOH_ARM64_ADRP_ADD:
		case LOH_ARM64_ADRP_LDR_GOT:
			if ( count != 2 )
				warning("arm64 Linker Optimiztion Hint %d has wrong number of arguments", kind);
			break;
		case LOH_ARM64_ADRP_ADD_LDR:
		case LOH_ARM64_ADRP_LDR_GOT_LDR:
		case LOH_ARM64_ADRP_ADD_STR:
		case LOH_ARM64_ADRP_LDR_GOT_STR:
			if ( count != 3 )
				warning("arm64 Linker Optimiztion Hint %d has wrong number of arguments", kind);
			break;
	}

	// Nothing sensible can be encoded without at least one address, and no
	// more than four deltas fit in the fixup; skip instead of reading
	// addrs[] entries the caller never provided.
	if ( (count < 1) || (count > 4) )
		return;

	// pick lowest address in tuple for use as offsetInAtom
	uint64_t lowestAddress = addrs[0];
	for(int i=1; i < count; ++i) {
		if ( addrs[i] < lowestAddress )
			lowestAddress = addrs[i];
	}
	// verify all other address are in same atom
	Atom<arm64>* inAtom = parser.findAtomByAddress(lowestAddress);
	const uint64_t atomStartAddr = inAtom->objectAddress();
	const uint64_t atomEndAddr = atomStartAddr + inAtom->size();
	for(int i=0; i < count; ++i) {
		if ( (addrs[i] < atomStartAddr) || (addrs[i] >= atomEndAddr) ) {
			warning("arm64 Linker Optimiztion Hint addresses are not in same atom: 0x%08llX and 0x%08llX",
					lowestAddress, addrs[i]);
			return; // skip this LOH
		}
		if ( (addrs[i] & 0x3) != 0 ) {
			warning("arm64 Linker Optimiztion Hint address is not 4-byte aligned: 0x%08llX", addrs[i]);
			return; // skip this LOH
		}
		if ( (addrs[i] - lowestAddress) > 0xFFFF ) {
			// too-far-apart hints are only reported when verbose hints are enabled
			if ( parser.verboseOptimizationHints() ) {
				warning("arm64 Linker Optimiztion Hint addresses are too far apart: 0x%08llX and 0x%08llX",
						lowestAddress, addrs[i]);
			}
			return; // skip this LOH
		}
	}

	// encoded kind, count, and address deltas in 64-bit addend
	// (deltas are stored in 4-byte units, hence the >> 2)
	ld::Fixup::LOH_arm64 extra;
	extra.addend = 0;
	extra.info.kind = kind;
	extra.info.count = count-1;
	extra.info.delta1 = (addrs[0] - lowestAddress) >> 2;
	extra.info.delta2 = (count > 1) ? ((addrs[1] - lowestAddress) >> 2) : 0;
	extra.info.delta3 = (count > 2) ? ((addrs[2] - lowestAddress) >> 2) : 0;
	extra.info.delta4 = (count > 3) ? ((addrs[3] - lowestAddress) >> 2) : 0;
	typename Parser<arm64>::SourceLocation src(inAtom, lowestAddress- inAtom->objectAddress());
	parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindLinkerOptimizationHint, extra.addend);
}
#endif

7792

7793

7794 template <typename A>

 void Section<A>::addLOH(class Parser<A>& parser, int kind, int count, const uint64_t addrs[]) {

7796

7797 }

7798

7799 template <typename A>

 void Section<A>::makeFixups(class Parser<A>& parser, const struct Parser<A>::CFI_CU_InfoArrays&)

7801 {

         const macho_section<P>* sect = this->machoSection();

         if ( sect->reloff() + (sect->nreloc() * sizeof(macho_relocation_info<P>)) > parser.fileLength() )

                 throwf("relocations for section %s/%s extends beyond end of file,", sect->segname(), Section<A>::makeSectionName(sect) );

         const macho_relocation_info<P>* relocs = (macho_relocation_info<P>*)(file().fileContent() + sect->reloff());

         const uint32_t relocCount = sect->nreloc();

         for (uint32_t r = 0; r < relocCount; ++r) {

7808 try {

                         if ( this->addRelocFixup(parser, &relocs[r]) )

7810 ++r; // skip next

7811 }

                 catch (const char* msg) {

                         throwf("in section %s,%s reloc %u: %s", sect->segname(), Section<A>::makeSectionName(sect), r, msg);

7814 }

7815 }

7816

7817 // add follow-on fixups if .o file is missing .subsections_via_symbols

         if ( this->addFollowOnFixups() ) {

                 Atom<A>* end = &_endAtoms[-1];

                 for(Atom<A>* p = _beginAtoms; p < end; ++p) {

                         typename Parser<A>::SourceLocation src(p, 0);

                         Atom<A>* nextAtom = &p[1];

                         parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindNoneFollowOn, nextAtom);

7824 }

7825 }

         else if ( this->type() == ld::Section::typeCode ) {

7827 // if FDE broke text not at a symbol, use followOn to keep code together

                 Atom<A>* end = &_endAtoms[-1];

                 for(Atom<A>* p = _beginAtoms; p < end; ++p) {

                         typename Parser<A>::SourceLocation src(p, 0);

                         Atom<A>* nextAtom = &p[1];

                         if ( (p->symbolTableInclusion() == ld::Atom::symbolTableIn) && (nextAtom->symbolTableInclusion() == ld::Atom::symbolTableNotIn) ) {

                                 parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindNoneFollowOn, nextAtom);

7834 }

7835 }

7836 }

         if ( !this->_altEntries.empty() && !this->addFollowOnFixups() ) {

                 if ( _altEntries.count(_beginAtoms) != 0 ) 

                         warning("N_ALT_ENTRY bit set on first atom in section %s/%s", sect->segname(), Section<A>::makeSectionName(sect));

7840

                 Atom<A>* end = &_endAtoms[-1];

                 for(Atom<A>* p = _beginAtoms; p < end; ++p) {

                         Atom<A>* nextAtom = &p[1];

7844 // <rdar://problem/22960070> support alt_entry aliases (alias process already added followOn, don't repeat)

                         if ( (_altEntries.count(nextAtom) != 0) && (p->_objAddress != nextAtom->_objAddress) ) {

                                 typename Parser<A>::SourceLocation src(p, 0);

                                 parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindNoneFollowOn, nextAtom);

                                 typename Parser<A>::SourceLocation src2(nextAtom, 0);

                                 parser.addFixup(src2, ld::Fixup::k1of1, ld::Fixup::kindNoneGroupSubordinate, p);

7850 }

7851 }

7852 }

7853

7854 // <rdar://problem/9218847> track data-in-code

         if ( parser.hasDataInCodeLabels() && (this->type() == ld::Section::typeCode) ) {

                 for (uint32_t i=0; i < parser.symbolCount(); ++i) {

                         const macho_nlist<P>& sym =     parser.symbolFromIndex(i);

7858 // ignore stabs

                         if ( (sym.n_type() & N_STAB) != 0 )

7860 continue;

7861 // ignore non-definitions

                         if ( (sym.n_type() & N_TYPE) != N_SECT )

7863 continue;

7864

7865 // 'L' labels do not denote atom breaks

                         const char* symbolName = parser.nameFromSymbol(sym);

                         if ( symbolName[0] == 'L' ) {

                                 if ( strncmp(symbolName, "L$start$", 8) == 0 ) {

                                         ld::Fixup::Kind kind = ld::Fixup::kindNone;

                                         if ( strncmp(&symbolName[8], "data$", 5) == 0 )

                                                 kind = ld::Fixup::kindDataInCodeStartData;

                                         else if ( strncmp(&symbolName[8], "code$", 5) == 0 )

                                                 kind = ld::Fixup::kindDataInCodeEnd;

                                         else if ( strncmp(&symbolName[8], "jt8$", 4) == 0 )

                                                 kind = ld::Fixup::kindDataInCodeStartJT8;

                                         else if ( strncmp(&symbolName[8], "jt16$", 4) == 0 )

                                                 kind = ld::Fixup::kindDataInCodeStartJT16;

                                         else if ( strncmp(&symbolName[8], "jt32$", 4) == 0 )

                                                 kind = ld::Fixup::kindDataInCodeStartJT32;

                                         else if ( strncmp(&symbolName[8], "jta32$", 4) == 0 )

                                                 kind = ld::Fixup::kindDataInCodeStartJTA32;

7882 else

                                                 warning("unknown L$start$ label %s in file %s", symbolName, this->file().path());

                                         if ( kind != ld::Fixup::kindNone ) {

                                                 Atom<A>* inAtom = parser.findAtomByAddress(sym.n_value());

                                                 typename Parser<A>::SourceLocation src(inAtom, sym.n_value() - inAtom->objectAddress());

                                                 parser.addFixup(src, ld::Fixup::k1of1, kind);

7888 }

7889 }

7890 }

7891 }

7892 }

7893

7894 // <rdar://problem/11150575> Handle LC_DATA_IN_CODE in object files

         if ( this->type() == ld::Section::typeCode ) {

                 const pint_t startAddr = this->_machOSection->addr();

                 const pint_t endAddr = startAddr + this->_machOSection->size();

                 for ( const macho_data_in_code_entry<P>* p = parser.dataInCodeStart(); p != parser.dataInCodeEnd(); ++p ) {

                         if ( (p->offset() >= startAddr) && (p->offset() < endAddr) ) {

                                 ld::Fixup::Kind kind = ld::Fixup::kindNone;

                                 switch ( p->kind() ) {

7902 case DICE_KIND_DATA:

                                                 kind = ld::Fixup::kindDataInCodeStartData;

7904 break;

7905 case DICE_KIND_JUMP_TABLE8:

                                                 kind = ld::Fixup::kindDataInCodeStartJT8;

7907 break;

7908 case DICE_KIND_JUMP_TABLE16:

                                                 kind = ld::Fixup::kindDataInCodeStartJT16;

7910 break;

7911 case DICE_KIND_JUMP_TABLE32:

                                                 kind = ld::Fixup::kindDataInCodeStartJT32;

7913 break;

7914 case DICE_KIND_ABS_JUMP_TABLE32:

                                                 kind = ld::Fixup::kindDataInCodeStartJTA32;

7916 break;

7917 default:

                                                 kind = ld::Fixup::kindDataInCodeStartData;

                                                 warning("uknown LC_DATA_IN_CODE kind (%d) at offset 0x%08X", p->kind(), p->offset());

7920 break;

7921 }

                                 Atom<A>* inAtom = parser.findAtomByAddress(p->offset());

                                 typename Parser<A>::SourceLocation srcStart(inAtom, p->offset() - inAtom->objectAddress());

                                 parser.addFixup(srcStart, ld::Fixup::k1of1, kind);

                                 typename Parser<A>::SourceLocation srcEnd(inAtom, p->offset() + p->length() - inAtom->objectAddress());

                                 parser.addFixup(srcEnd, ld::Fixup::k1of1, ld::Fixup::kindDataInCodeEnd);

7927 }

7928 }

7929 }

7930

7931 // <rdar://problem/11945700> convert linker optimization hints into internal format

         if ( this->type() == ld::Section::typeCode && parser.hasOptimizationHints() ) {

                 const pint_t startAddr = this->_machOSection->addr();

                 const pint_t endAddr = startAddr + this->_machOSection->size();

                 for (const uint8_t* p = parser.optimizationHintsStart(); p < parser.optimizationHintsEnd(); ) {

7936 uint64_t addrs[4];

                         int32_t kind = read_uleb128(&p, parser.optimizationHintsEnd());

                         if ( kind == 0 ) // padding at end of loh buffer

7939 break;

                         if ( kind == -1 ) {

7941 warning("malformed uleb128 kind in LC_LINKER_OPTIMIZATION_HINTS");

7942 break;

7943 }

                         int32_t count = read_uleb128(&p, parser.optimizationHintsEnd());

                         if ( count == -1 ) {

7946 warning("malformed uleb128 count in LC_LINKER_OPTIMIZATION_HINTS");

7947 break;

7948 }

                         if ( count > 3 ) {

7950 warning("address count > 3 in LC_LINKER_OPTIMIZATION_HINTS");

7951 break;

7952 }

                         for (int32_t i=0; i < count; ++i) {

                                 addrs[i] = read_uleb128(&p, parser.optimizationHintsEnd());

7955 }

                         if ( (startAddr <= addrs[0]) && (addrs[0] < endAddr) ) {

                                 this->addLOH(parser, kind, count, addrs);

7958 //fprintf(stderr, "kind=%d", kind);

7959 //for (int32_t i=0; i < count; ++i) {

7960 // fprintf(stderr, ", addr=0x%08llX", addrs[i]);

7961 //}

7962 //fprintf(stderr, "\n");

7963 }

7964 }

7965 }

7966

7967

7968 // add follow-on fixups for aliases

7969 if ( _hasAliases ) {

                 for(Atom<A>* p = _beginAtoms; p < _endAtoms; ++p) {

                         if ( p->isAlias() && ! this->addFollowOnFixups() ) {

                                 Atom<A>* targetOfAlias = &p[1];

                                 assert(p < &_endAtoms[-1]);

                                 assert(p->_objAddress == targetOfAlias->_objAddress);

                                 typename Parser<A>::SourceLocation src(p, 0);

                                 parser.addFixup(src, ld::Fixup::k1of1, ld::Fixup::kindNoneFollowOn, targetOfAlias);

7977 }

7978 }

7979 }

7980 }

7981

7982

7983

7984 //

7985 // main function used by linker to instantiate ld::Files

7986 //

 ld::relocatable::File* parse(const uint8_t* fileContent, uint64_t fileLength, 

                                                          const char* path, time_t modTime, ld::File::Ordinal ordinal, const ParserOptions& opts)

7989 {

7990 switch ( opts.architecture ) {

7991 #if SUPPORT_ARCH_x86_64

7992 case CPU_TYPE_X86_64:

                         if ( mach_o::relocatable::Parser<x86_64>::validFile(fileContent) )

                                 return mach_o::relocatable::Parser<x86_64>::parse(fileContent, fileLength, path, modTime, ordinal, opts);

7995 break;

7996 #endif

7997 #if SUPPORT_ARCH_i386

7998 case CPU_TYPE_I386:

                         if ( mach_o::relocatable::Parser<x86>::validFile(fileContent) )

                                 return mach_o::relocatable::Parser<x86>::parse(fileContent, fileLength, path, modTime, ordinal, opts);

8001 break;

8002 #endif

8003 #if SUPPORT_ARCH_arm_any

8004 case CPU_TYPE_ARM:

                         if ( mach_o::relocatable::Parser<arm>::validFile(fileContent, opts.objSubtypeMustMatch, opts.subType) )

                                 return mach_o::relocatable::Parser<arm>::parse(fileContent, fileLength, path, modTime, ordinal, opts);

8007 break;

8008 #endif

8009 #if SUPPORT_ARCH_arm64

8010 case CPU_TYPE_ARM64:

                         if ( mach_o::relocatable::Parser<arm64>::validFile(fileContent, opts.objSubtypeMustMatch, opts.subType) )

                                 return mach_o::relocatable::Parser<arm64>::parse(fileContent, fileLength, path, modTime, ordinal, opts);

8013 break;

8014 #endif

8015 }

8016 return NULL;

8017 }

8018

8019 //

8020 // used by archive reader to validate member object file

8021 //

 bool isObjectFile(const uint8_t* fileContent, uint64_t fileLength, const ParserOptions& opts)

8023 {

8024 switch ( opts.architecture ) {

8025 case CPU_TYPE_X86_64:

                         return ( mach_o::relocatable::Parser<x86_64>::validFile(fileContent) );

8027 case CPU_TYPE_I386:

                         return ( mach_o::relocatable::Parser<x86>::validFile(fileContent) );

8029 case CPU_TYPE_ARM:

                         return ( mach_o::relocatable::Parser<arm>::validFile(fileContent, opts.objSubtypeMustMatch, opts.subType) );

8031 case CPU_TYPE_ARM64:

                         return ( mach_o::relocatable::Parser<arm64>::validFile(fileContent, opts.objSubtypeMustMatch, opts.subType) );

8033 }

8034 return false;

8035 }

8036

8037 //

8038 // used by linker to infer architecture when no -arch is on command line

8039 //

 bool isObjectFile(const uint8_t* fileContent, cpu_type_t* result, cpu_subtype_t* subResult, ld::Platform* platform, uint32_t* minOsVers)

8041 {

         if ( mach_o::relocatable::Parser<x86_64>::validFile(fileContent) ) {

8043 *result = CPU_TYPE_X86_64;

                 const macho_header<Pointer64<LittleEndian> >* header = (const macho_header<Pointer64<LittleEndian> >*)fileContent;

                 *subResult = header->cpusubtype();

                 *platform = Parser<x86_64>::findPlatform(header, minOsVers);

8047 return true;

8048 }

         if ( mach_o::relocatable::Parser<x86>::validFile(fileContent) ) {

                 const macho_header<Pointer32<LittleEndian> >* header = (const macho_header<Pointer32<LittleEndian> >*)fileContent;

8051 *result = CPU_TYPE_I386;

8052 *subResult = CPU_SUBTYPE_X86_ALL;

                 *platform = Parser<x86>::findPlatform(header, minOsVers);

8054 return true;

8055 }

         if ( mach_o::relocatable::Parser<arm>::validFile(fileContent, false, 0) ) {

                 const macho_header<Pointer32<LittleEndian> >* header = (const macho_header<Pointer32<LittleEndian> >*)fileContent;

8058 *result = CPU_TYPE_ARM;

                 *subResult = header->cpusubtype();

                 *platform = Parser<arm>::findPlatform(header, minOsVers);

8061 return true;

8062 }

         if ( mach_o::relocatable::Parser<arm64>::validFile(fileContent, false, 0) ) {

                 const macho_header<Pointer64<LittleEndian> >* header = (const macho_header<Pointer64<LittleEndian> >*)fileContent;

8065 *result = CPU_TYPE_ARM64;

                 *subResult = header->cpusubtype();

                 *platform = Parser<arm64>::findPlatform(header, minOsVers);

8068 return true;

8069 }

8070 return false;

8071 }

8072

8073 //

8074 // used by linker is error messages to describe bad .o file

8075 //

 const char* archName(const uint8_t* fileContent)

8077 {

         if ( mach_o::relocatable::Parser<x86_64>::validFile(fileContent) ) {

                 return mach_o::relocatable::Parser<x86_64>::fileKind(fileContent);

8080 }

         if ( mach_o::relocatable::Parser<x86>::validFile(fileContent) ) {

                 return mach_o::relocatable::Parser<x86>::fileKind(fileContent);

8083 }

         if ( mach_o::relocatable::Parser<arm>::validFile(fileContent, false, 0) ) {

                 return mach_o::relocatable::Parser<arm>::fileKind(fileContent);

8086 }

8087 return NULL;

8088 }

8089

8090 //

8091 // Used by archive reader when -ObjC option is specified

8092 //

 bool hasObjC2Categories(const uint8_t* fileContent)

8094 {

         if ( mach_o::relocatable::Parser<x86_64>::validFile(fileContent) ) {

                 return mach_o::relocatable::Parser<x86_64>::hasObjC2Categories(fileContent);

8097 }

         else if ( mach_o::relocatable::Parser<arm>::validFile(fileContent, false, 0) ) {

                 return mach_o::relocatable::Parser<arm>::hasObjC2Categories(fileContent);

8100 }

         else if ( mach_o::relocatable::Parser<x86>::validFile(fileContent, false, 0) ) {

                 return mach_o::relocatable::Parser<x86>::hasObjC2Categories(fileContent);

8103 }

8104 #if SUPPORT_ARCH_arm64

     else if ( mach_o::relocatable::Parser<arm64>::validFile(fileContent, false, 0) ) {

         return mach_o::relocatable::Parser<arm64>::hasObjC2Categories(fileContent);

8107 }

8108 #endif

8109 return false;

8110 }

8111

8112 //

8113 // Used by archive reader when -ObjC option is specified

8114 //

 bool hasObjC1Categories(const uint8_t* fileContent)

8116 {

         if ( mach_o::relocatable::Parser<x86>::validFile(fileContent, false, 0) ) {

                 return mach_o::relocatable::Parser<x86>::hasObjC1Categories(fileContent);

8119 }

8120 return false;

8121 }

8122

8123 //

8124 // Used by bitcode obfuscator to get a list of non local symbols from object file

8125 //

 bool getNonLocalSymbols(const uint8_t* fileContent, std::vector<const char*> &syms)

8127 {

         if ( mach_o::relocatable::Parser<x86_64>::validFile(fileContent) ) {

                 return mach_o::relocatable::Parser<x86_64>::getNonLocalSymbols(fileContent, syms);

8130 }

         else if ( mach_o::relocatable::Parser<arm>::validFile(fileContent, false, 0) ) {

                 return mach_o::relocatable::Parser<arm>::getNonLocalSymbols(fileContent, syms);

8133 }

         else if ( mach_o::relocatable::Parser<x86>::validFile(fileContent, false, 0) ) {

                 return mach_o::relocatable::Parser<x86>::getNonLocalSymbols(fileContent, syms);

8136 }

8137 #if SUPPORT_ARCH_arm64

         else if ( mach_o::relocatable::Parser<arm64>::validFile(fileContent, false, 0) ) {

                 return mach_o::relocatable::Parser<arm64>::getNonLocalSymbols(fileContent, syms);

8140 }

8141 #endif

8142 return false;

8143 }

8144

8145

8146

8147 } // namespace relocatable

8148 } // namespace mach_o

8149

8150