darling-dyld/dyld3/MachOAnalyzerSet.h

203 lines
11 KiB
C
Raw Normal View History

2022-04-20 03:09:17 +00:00
/*
* Copyright (c) 2019 Apple Inc. All rights reserved.
*
* @APPLE_LICENSE_HEADER_START@
*
* This file contains Original Code and/or Modifications of Original Code
* as defined in and that are subject to the Apple Public Source License
* Version 2.0 (the 'License'). You may not use this file except in
* compliance with the License. Please obtain a copy of the License at
* http://www.opensource.apple.com/apsl/ and read it before using this
* file.
*
* The Original Code and all software distributed under the License are
* distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
* EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
* INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
* Please see the License for the specific language governing rights and
* limitations under the License.
*
* @APPLE_LICENSE_HEADER_END@
*/
#ifndef MachOAnalyzerSet_h
#define MachOAnalyzerSet_h
#include "MachOAnalyzer.h"
#include "Array.h"
namespace dyld3 {
//
// MachOAnalyzerSet is an abstraction to deal with sets of mach-o files. For instance,
// if a mach-o file A binds to a symbol in mach-o file B, the MachOAnalyzerSet lets you
// evaulate the bind such that you know where in B, the bind pointer in A needs to point.
//
// The goal of MachOAnalyzerSet is to be the one place for code that handles mach-o
// file interactions, such as two-level namespace binding, weak-def coalescing, and
// dyld cache patching.
//
// Conceptually, MachOAnalyzerSet is an ordered list of mach-o files. Each file is modeled
// as an WrappedMachO object. This is a lightweight POD struct of three pointers that
// can be copied around. A WrappedMachO consists of the MachOAnalyzer* that is represents,
// a pointer to the MachOAnalyzerSet it is in, and an abstract "other" pointer that the
// concrete implementation of MachOAnalyzerSet defines. All uses of mach-o files in
// the MachOAnalyzerSet method uses WrappedMachO types.
//
// // This is the key method on WrappedMachO. It is called during closure building to
// // compile down the fixups, as well as at runtime in dyld3 minimal closure mode
// // to parse LINKEDIT and rebase/bind pointers.
// void forEachFixup(Diagnostics& diag, FixUpHandler, CachePatchHandler) const;
//
//
// It would have been nice to have virtual methods on WrappedMachO, but C++ won't allow
// objects with vtables to be copied. So instead the methods on WrappedMachO simply
// forward to virtual methods in the owning MachOAnalyzerSet object. Therefore, there
// are two kinds of methods on MachOAnalyzerSet: methods for a WrappedMachO start with wmo_,
// whereas methods for the whole set start with mas_.
//
// // Walk all images in the set in order. "hidden" means the image was loaded with RTLD_LOCAL
// void mas_forEachImage(void (^handler)(const WrappedMachO& wmo, bool hidden, bool& stop)) const = 0;
//
// // fills in mainWmo with the WrappedMachO for the main executable in the set
// void mas_mainExecutable(WrappedMachO& mainWmo) const = 0;
//
// // returns a pointer to the start of the dyld cache used the mach-o files in the set
// void* mas_dyldCache() const = 0;
//
// // For weak-def coalescing. The file fromWmo needs to bind to symbolName. All files with weak-defs should be searched.
// // As a side effect of doing this binding, it may find that the symbol is bound overrides something in the dyld cache.
// // In that case, the CachePatchHandler function is called with info about how to patch the dyld cache.
// // This function has a default implementation. Only the dyld cache builder overrides this, because the set is all the
// // dylibs in the dyld cache, and coalescing should only look at files actually linked.
// bool mas_fromImageWeakDefLookup(const WrappedMachO& fromWmo, const char* symbolName, uint64_t addend,
// CachePatchHandler patcher, FixupTarget& target) const;
//
//
// // For a given WrappedMachO (fromWmo), find the nth dependent dylib. If depIndex is out of range, return false.
// // If child is weak-linked dylib that could not be loaded, set missingWeakDylib to true and return true.
// // Otherwise fill in childWmo and return true
// bool wmo_dependent(const WrappedMachO* fromWmo, uint32_t depIndex, WrappedMachO& childWmo, bool& missingWeakDylib) const = 0;
//
// // Returns the path to the specified WrappedMachO
// const char* wmo_path(const WrappedMachO* wmo) const = 0;
//
// // Called if a symbol cannot be found. If false is returned, then the symbol binding code will return an error.
// // If true is returned, then "target" must be set. It may be set to "NULL" as absolute/0.
// bool wmo_missingSymbolResolver(const WrappedMachO* fromWmo, bool weakImport, bool lazyBind, const char* symbolName,
// const char* expectedInDylibPath, const char* clientPath, FixupTarget& target) const = 0;
//
// // Returns the exports trie for the given binary. There is a default implementation which walks the load commands.
// // This should only be overriden if the MachOAnalyzerSet caches the export trie location.
// ExportsTrie wmo_getExportsTrie(const WrappedMachO* wmo) const;
//
// // This handles special symbols like C++ operator new which can exist in the main executable as non-weak but
// // coalesce with other weak implementations. It does not need to be overridden.
// void wmo_findExtraSymbolFrom(const WrappedMachO* fromWmo, CachePatchHandler ph) const;
//
// // This is core logic for two-level namespace symbol look ups. It does not need to be overridden.
// bool wmo_findSymbolFrom(const WrappedMachO* fromWmo, Diagnostics& diag, int libOrdinal, const char* symbolName,
// bool weakImport, bool lazyBind, uint64_t addend, CachePatchHandler ph, FixupTarget& target) const;
//
//
struct VIS_HIDDEN MachOAnalyzerSet
{
public:
#ifdef DARLING
MachOAnalyzerSet();
#endif
2022-04-20 03:09:17 +00:00
struct FixupTarget;
struct ExportsTrie { const uint8_t* start; const uint8_t* end; } ;
// Extra info needed when setting an actual pointer value at runtime
struct PointerMetaData
{
PointerMetaData();
PointerMetaData(const MachOLoaded::ChainedFixupPointerOnDisk* fixupLoc, uint16_t pointer_format);
uint32_t diversity : 16,
high8 : 8,
authenticated : 1,
key : 2,
usesAddrDiversity : 1;
};
typedef void (^FixUpHandler)(uint64_t fixupLocRuntimeOffset, PointerMetaData pmd, const FixupTarget& target, bool& stop);
typedef void (^CachePatchHandler)(uint32_t cachedDylibIndex, uint32_t exportCacheOffset, const FixupTarget& target);
struct WrappedMachO
{
const MachOAnalyzer* _mh;
const MachOAnalyzerSet* _set;
void* _other;
WrappedMachO() : _mh(nullptr), _set((nullptr)), _other((nullptr)) { }
WrappedMachO(const MachOAnalyzer* ma, const MachOAnalyzerSet* mas, void* o) : _mh(ma), _set(mas), _other(o) { }
~WrappedMachO() {}
// Used by: dyld cache building, dyld3s fixup applying, app closure building traditional format, dyldinfo tool
void forEachFixup(Diagnostics& diag, FixUpHandler, CachePatchHandler) const;
// convenience functions
bool dependent(uint32_t depIndex, WrappedMachO& childObj, bool& missingWeakDylib) const { return _set->wmo_dependent(this, depIndex, childObj, missingWeakDylib); }
const char* path() const { return (_set ? _set->wmo_path(this) : nullptr); }
ExportsTrie getExportsTrie() const { return _set->wmo_getExportsTrie(this); }
bool findSymbolFrom(Diagnostics& diag, int libOrdinal, const char* symbolName, bool weakImport, bool lazyBind, uint64_t addend, CachePatchHandler ph, FixupTarget& target) const
{ return _set->wmo_findSymbolFrom(this, diag, libOrdinal, symbolName, weakImport, lazyBind, addend, ph, target); }
bool missingSymbolResolver(bool weakImport, bool lazyBind, const char* symbolName, const char* expectedInDylibPath, const char* clientPath, FixupTarget& target) const
{ return _set->wmo_missingSymbolResolver(this, weakImport, lazyBind, symbolName, expectedInDylibPath, clientPath, target); }
bool findSymbolIn(Diagnostics& diag, const char* symbolName, uint64_t addend, FixupTarget& target) const;
private:
void forEachBind(Diagnostics& diag, FixUpHandler, CachePatchHandler) const;
};
struct FixupTarget
{
enum class Kind { rebase, bindToImage, bindAbsolute, bindMissingSymbol };
WrappedMachO foundInImage;
uint64_t offsetInImage = 0; // includes addend
const char* requestedSymbolName = nullptr;
const char* foundSymbolName = nullptr;
uint64_t addend = 0; // already added into offsetInImage
int libOrdinal = 0;
Kind kind = Kind::rebase;
bool isLazyBindRebase = false; // target is stub helper in same image
bool isWeakDef = false; // target symbol is a weak-def
bool weakCoalesced = false; // target found searching all images
bool weakBoundSameImage = false; // first weak-def was in same image as use
bool skippableWeakDef = false; // old binary that stripped symbol, so def will never be found
};
virtual void mas_forEachImage(void (^handler)(const WrappedMachO& wmo, bool hidden, bool& stop)) const = 0;
virtual bool mas_fromImageWeakDefLookup(const WrappedMachO& fromWmo, const char* symbolName, uint64_t addend, CachePatchHandler patcher, FixupTarget& target) const;
virtual void mas_mainExecutable(WrappedMachO& mainWmo) const = 0;
virtual void* mas_dyldCache() const = 0;
protected:
friend WrappedMachO;
virtual bool wmo_dependent(const WrappedMachO* fromWmo, uint32_t depIndex, WrappedMachO& childWmo, bool& missingWeakDylib) const = 0;
virtual const char* wmo_path(const WrappedMachO* wmo) const = 0;
virtual ExportsTrie wmo_getExportsTrie(const WrappedMachO* wmo) const;
virtual bool wmo_findSymbolFrom(const WrappedMachO* fromWmo, Diagnostics& diag, int libOrdinal, const char* symbolName, bool weakImport,
bool lazyBind, uint64_t addend, CachePatchHandler ph, FixupTarget& target) const;
virtual bool wmo_missingSymbolResolver(const WrappedMachO* fromWmo, bool weakImport, bool lazyBind, const char* symbolName,
const char* expectedInDylibPath, const char* clientPath, FixupTarget& target) const = 0;
virtual void wmo_findExtraSymbolFrom(const WrappedMachO* fromWmo, CachePatchHandler ph) const;
};
} // namespace dyld3
#endif /* MachOAnalyzerSet_h */