[Lldb-commits] [lldb] 96d1218 - Allow firmware binaries to be specified only by load address
Jason Molenda via lldb-commits
lldb-commits at lists.llvm.org
Tue Aug 2 14:14:22 PDT 2022
Author: Jason Molenda
Date: 2022-08-02T14:14:16-07:00
New Revision: 96d12187b3d28f63d29802a7af49dfe53cc306f3
URL: https://github.com/llvm/llvm-project/commit/96d12187b3d28f63d29802a7af49dfe53cc306f3
DIFF: https://github.com/llvm/llvm-project/commit/96d12187b3d28f63d29802a7af49dfe53cc306f3.diff
LOG: Allow firmware binaries to be specified only by load address
Add support to Mach-O corefiles and to live gdb remote serial protocol
connections for the corefile/remote stub to provide a list of load
addresses of binaries that should be found & loaded by lldb, and nothing
else. lldb will try to parse the binary out of memory, and if it can
find a UUID, try to find a binary & its debug information based on the
UUID, falling back to using the memory image if it must.
A bit of code unification from three parts of lldb that were loading
individual binaries already, so there is a shared method in
DynamicLoader to handle all of the variations they were doing.
Re-landing this with a uuid_is_null() implementation added to
Utility/UuidCompatibility.h for non-Darwin systems.
Differential Revision: https://reviews.llvm.org/D130813
rdar://94249937
rdar://94249384
Added:
lldb/test/API/macosx/lc-note/multiple-binary-corefile/Makefile
lldb/test/API/macosx/lc-note/multiple-binary-corefile/TestMultipleBinaryCorefile.py
lldb/test/API/macosx/lc-note/multiple-binary-corefile/create-multibin-corefile.cpp
lldb/test/API/macosx/lc-note/multiple-binary-corefile/main.c
lldb/test/API/macosx/lc-note/multiple-binary-corefile/one.c
lldb/test/API/macosx/lc-note/multiple-binary-corefile/two.c
Modified:
lldb/docs/lldb-gdb-remote.txt
lldb/include/lldb/Target/DynamicLoader.h
lldb/source/Core/DynamicLoader.cpp
lldb/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp
lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.cpp
lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.h
lldb/source/Plugins/Process/gdb-remote/ProcessGDBRemote.cpp
lldb/source/Plugins/Process/mach-core/ProcessMachCore.cpp
lldb/source/Utility/UuidCompatibility.h
Removed:
################################################################################
diff --git a/lldb/docs/lldb-gdb-remote.txt b/lldb/docs/lldb-gdb-remote.txt
index 820f3bd7bbc20..497980ed1229b 100644
--- a/lldb/docs/lldb-gdb-remote.txt
+++ b/lldb/docs/lldb-gdb-remote.txt
@@ -1073,6 +1073,12 @@ main-binary-uuid: is the UUID of a firmware type binary that the gdb stub knows
main-binary-address: is the load address of the firmware type binary
main-binary-slide: is the slide of the firmware type binary, if address isn't known
+binary-addresses: A comma-separated list of binary load addresses base16.
+ lldb will parse the binaries in memory to get UUIDs, then
+ try to find the binaries & debug info by UUID. Intended for
+ use with a small number of firmware type binaries where the
+ search for binary/debug info may be expensive.
+
//----------------------------------------------------------------------
// "qShlibInfoAddr"
//
diff --git a/lldb/include/lldb/Target/DynamicLoader.h b/lldb/include/lldb/Target/DynamicLoader.h
index 397b4aa303448..7e7a4218810b5 100644
--- a/lldb/include/lldb/Target/DynamicLoader.h
+++ b/lldb/include/lldb/Target/DynamicLoader.h
@@ -210,6 +210,52 @@ class DynamicLoader : public PluginInterface {
lldb::addr_t base_addr,
bool base_addr_is_offset);
+ /// Find/load a binary into lldb given a UUID and the address where it is
+ /// loaded in memory, or a slide to be applied to the file address.
+ /// May force an expensive search on the computer to find the binary by
+ /// UUID, should not be used for a large number of binaries - intended for
+ /// an environment where there may be one, or a few, binaries resident in
+ /// memory.
+ ///
+ /// Given a UUID, search for a binary and load it at the address provided,
+ /// or with the slide applied, or at the file address unslid.
+ ///
+ /// Given an address, try to read the binary out of memory, get the UUID,
+ /// find the file if possible and load it unslid, or add the memory module.
+ ///
+ /// \param[in] process
+ /// The process to add this binary to.
+ ///
+ /// \param[in] uuid
+ /// UUID of the binary to be loaded. UUID may be empty, and if a
+ /// load address is supplied, will read the binary from memory, get
+ /// a UUID and try to find a local binary. There is a performance
+ /// cost to doing this, it is not preferable.
+ ///
+ /// \param[in] value
+ /// Address where the binary should be loaded, or read out of memory.
+ /// Or a slide value, to be applied to the file addresses of the binary.
+ ///
+ /// \param[in] value_is_offset
+ /// A flag indicating that \p value is an address, or an offset to
+ /// be applied to the file addresses.
+ ///
+ /// \param[in] force_symbol_search
+ /// Allow the search to do a possibly expensive external search for
+ /// the ObjectFile and/or SymbolFile.
+ ///
+ /// \param[in] notify
+ /// Whether ModulesDidLoad should be called when a binary has been added
+ /// to the Target. The caller may prefer to batch up these when loading
+ /// multiple binaries.
+ ///
+ /// \return
+ /// Returns a shared pointer for the Module that has been added.
+ static lldb::ModuleSP
+ LoadBinaryWithUUIDAndAddress(Process *process, UUID uuid, lldb::addr_t value,
+ bool value_is_offset, bool force_symbol_search,
+ bool notify);
+
/// Get information about the shared cache for a process, if possible.
///
/// On some systems (e.g. Darwin based systems), a set of libraries that are
diff --git a/lldb/source/Core/DynamicLoader.cpp b/lldb/source/Core/DynamicLoader.cpp
index 96e0d4ec6555d..1fe60e000c6d5 100644
--- a/lldb/source/Core/DynamicLoader.cpp
+++ b/lldb/source/Core/DynamicLoader.cpp
@@ -13,11 +13,15 @@
#include "lldb/Core/ModuleSpec.h"
#include "lldb/Core/PluginManager.h"
#include "lldb/Core/Section.h"
+#include "lldb/Symbol/LocateSymbolFile.h"
#include "lldb/Symbol/ObjectFile.h"
#include "lldb/Target/MemoryRegionInfo.h"
+#include "lldb/Target/Platform.h"
#include "lldb/Target/Process.h"
#include "lldb/Target/Target.h"
#include "lldb/Utility/ConstString.h"
+#include "lldb/Utility/LLDBLog.h"
+#include "lldb/Utility/Log.h"
#include "lldb/lldb-private-interfaces.h"
#include "llvm/ADT/StringRef.h"
@@ -171,6 +175,100 @@ ModuleSP DynamicLoader::LoadModuleAtAddress(const FileSpec &file,
return nullptr;
}
+static ModuleSP ReadUnnamedMemoryModule(Process *process, addr_t addr) {
+ char namebuf[80];
+ snprintf(namebuf, sizeof(namebuf), "memory-image-0x%" PRIx64, addr);
+ return process->ReadModuleFromMemory(FileSpec(namebuf), addr);
+}
+
+ModuleSP DynamicLoader::LoadBinaryWithUUIDAndAddress(Process *process,
+ UUID uuid, addr_t value,
+ bool value_is_offset,
+ bool force_symbol_search,
+ bool notify) {
+ ModuleSP memory_module_sp;
+ ModuleSP module_sp;
+ PlatformSP platform_sp = process->GetTarget().GetPlatform();
+ Target &target = process->GetTarget();
+ Status error;
+ ModuleSpec module_spec;
+ module_spec.GetUUID() = uuid;
+
+ if (!uuid.IsValid() && !value_is_offset) {
+ memory_module_sp = ReadUnnamedMemoryModule(process, value);
+
+ if (memory_module_sp)
+ uuid = memory_module_sp->GetUUID();
+ }
+
+ if (uuid.IsValid()) {
+ ModuleSpec module_spec;
+ module_spec.GetUUID() = uuid;
+
+ if (!module_sp)
+ module_sp = target.GetOrCreateModule(module_spec, false, &error);
+
+ // If we haven't found a binary, or we don't have a SymbolFile, see
+ // if there is an external search tool that can find it.
+ if (force_symbol_search &&
+ (!module_sp || !module_sp->GetSymbolFileFileSpec())) {
+ Symbols::DownloadObjectAndSymbolFile(module_spec, error, true);
+ if (FileSystem::Instance().Exists(module_spec.GetFileSpec())) {
+ module_sp = std::make_shared<Module>(module_spec);
+ }
+ }
+ }
+
+ // If we couldn't find the binary anywhere else, as a last resort,
+ // read it out of memory.
+ if (!module_sp.get() && value != LLDB_INVALID_ADDRESS && !value_is_offset) {
+ if (!memory_module_sp)
+ memory_module_sp = ReadUnnamedMemoryModule(process, value);
+ if (memory_module_sp)
+ module_sp = memory_module_sp;
+ }
+
+ Log *log = GetLog(LLDBLog::DynamicLoader);
+ if (module_sp.get()) {
+ target.GetImages().AppendIfNeeded(module_sp, false);
+
+ bool changed = false;
+ if (module_sp->GetObjectFile()) {
+ if (value != LLDB_INVALID_ADDRESS) {
+ LLDB_LOGF(log, "Loading binary UUID %s at %s 0x%" PRIx64,
+ uuid.GetAsString().c_str(),
+ value_is_offset ? "offset" : "address", value);
+ module_sp->SetLoadAddress(target, value, value_is_offset, changed);
+ } else {
+ // No address/offset/slide, load the binary at file address,
+ // offset 0.
+ LLDB_LOGF(log, "Loading binary UUID %s at file address",
+ uuid.GetAsString().c_str());
+ module_sp->SetLoadAddress(target, 0, true /* value_is_slide */,
+ changed);
+ }
+ } else {
+ // In-memory image, load at its true address, offset 0.
+ LLDB_LOGF(log, "Loading binary UUID %s from memory at address 0x%" PRIx64,
+ uuid.GetAsString().c_str(), value);
+ module_sp->SetLoadAddress(target, 0, true /* value_is_slide */, changed);
+ }
+
+ if (notify) {
+ ModuleList added_module;
+ added_module.Append(module_sp, false);
+ target.ModulesDidLoad(added_module);
+ }
+ } else {
+ LLDB_LOGF(log, "Unable to find binary with UUID %s and load it at "
+ "%s 0x%" PRIx64,
+ uuid.GetAsString().c_str(),
+ value_is_offset ? "offset" : "address", value);
+ }
+
+ return module_sp;
+}
+
int64_t DynamicLoader::ReadUnsignedIntWithSizeInBytes(addr_t addr,
int size_in_bytes) {
Status error;
diff --git a/lldb/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp b/lldb/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp
index 5dc71fca36c25..15b06dbbfaec0 100644
--- a/lldb/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp
+++ b/lldb/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp
@@ -5600,7 +5600,8 @@ bool ObjectFileMachO::GetCorefileMainBinaryInfo(addr_t &value,
}
if (m_data.CopyData(offset, sizeof(uuid_t), raw_uuid) != 0) {
- uuid = UUID::fromOptionalData(raw_uuid, sizeof(uuid_t));
+ if (!uuid_is_null(raw_uuid))
+ uuid = UUID::fromOptionalData(raw_uuid, sizeof(uuid_t));
// convert the "main bin spec" type into our
// ObjectFile::BinaryType enum
switch (binspec_type) {
@@ -6901,7 +6902,8 @@ ObjectFileMachO::GetCorefileAllImageInfos() {
MachOCorefileImageEntry image_entry;
image_entry.filename = (const char *)m_data.GetCStr(&filepath_offset);
- image_entry.uuid = UUID::fromData(uuid, sizeof(uuid_t));
+ if (!uuid_is_null(uuid))
+ image_entry.uuid = UUID::fromData(uuid, sizeof(uuid_t));
image_entry.load_address = load_address;
image_entry.currently_executing = currently_executing;
@@ -6932,9 +6934,11 @@ ObjectFileMachO::GetCorefileAllImageInfos() {
MachOCorefileImageEntry image_entry;
image_entry.filename = filename;
- image_entry.uuid = UUID::fromData(uuid, sizeof(uuid_t));
+ if (!uuid_is_null(uuid))
+ image_entry.uuid = UUID::fromData(uuid, sizeof(uuid_t));
image_entry.load_address = load_address;
image_entry.slide = slide;
+ image_entry.currently_executing = true;
image_infos.all_image_infos.push_back(image_entry);
}
}
@@ -6951,42 +6955,41 @@ bool ObjectFileMachO::LoadCoreFileImages(lldb_private::Process &process) {
ModuleList added_modules;
for (const MachOCorefileImageEntry &image : image_infos.all_image_infos) {
- ModuleSpec module_spec;
- module_spec.GetUUID() = image.uuid;
- if (image.filename.empty()) {
- char namebuf[80];
- if (image.load_address != LLDB_INVALID_ADDRESS)
- snprintf(namebuf, sizeof(namebuf), "mem-image-0x%" PRIx64,
- image.load_address);
- else
- snprintf(namebuf, sizeof(namebuf), "mem-image+0x%" PRIx64, image.slide);
- module_spec.GetFileSpec() = FileSpec(namebuf);
- } else {
- module_spec.GetFileSpec() = FileSpec(image.filename.c_str());
- }
- if (image.currently_executing) {
+ ModuleSP module_sp;
+
+ if (!image.filename.empty()) {
Status error;
- Symbols::DownloadObjectAndSymbolFile(module_spec, error, true);
- if (FileSystem::Instance().Exists(module_spec.GetFileSpec())) {
- process.GetTarget().GetOrCreateModule(module_spec, false);
+ ModuleSpec module_spec;
+ module_spec.GetUUID() = image.uuid;
+ module_spec.GetFileSpec() = FileSpec(image.filename.c_str());
+ if (image.currently_executing) {
+ Symbols::DownloadObjectAndSymbolFile(module_spec, error, true);
+ if (FileSystem::Instance().Exists(module_spec.GetFileSpec())) {
+ process.GetTarget().GetOrCreateModule(module_spec, false);
+ }
}
- }
- Status error;
- ModuleSP module_sp =
- process.GetTarget().GetOrCreateModule(module_spec, false, &error);
- if (!module_sp.get() || !module_sp->GetObjectFile()) {
+ module_sp =
+ process.GetTarget().GetOrCreateModule(module_spec, false, &error);
+ process.GetTarget().GetImages().AppendIfNeeded(module_sp,
+ false /* notify */);
+ } else {
if (image.load_address != LLDB_INVALID_ADDRESS) {
- module_sp = process.ReadModuleFromMemory(module_spec.GetFileSpec(),
- image.load_address);
+ module_sp = DynamicLoader::LoadBinaryWithUUIDAndAddress(
+ &process, image.uuid, image.load_address,
+ false /* value_is_offset */, image.currently_executing,
+ false /* notify */);
+ } else if (image.slide != LLDB_INVALID_ADDRESS) {
+ module_sp = DynamicLoader::LoadBinaryWithUUIDAndAddress(
+ &process, image.uuid, image.slide, true /* value_is_offset */,
+ image.currently_executing, false /* notify */);
}
}
+
if (module_sp.get()) {
// Will call ModulesDidLoad with all modules once they've all
// been added to the Target with load addresses. Don't notify
// here, before the load address is set.
- const bool notify = false;
- process.GetTarget().GetImages().AppendIfNeeded(module_sp, notify);
- added_modules.Append(module_sp, notify);
+ added_modules.Append(module_sp, false /* notify */);
if (image.segment_load_addresses.size() > 0) {
if (log) {
std::string uuidstr = image.uuid.GetAsString();
diff --git a/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.cpp b/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.cpp
index 580cdde57d80f..8687175ee36c4 100644
--- a/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.cpp
+++ b/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.cpp
@@ -1033,6 +1033,13 @@ bool GDBRemoteCommunicationClient::GetProcessStandaloneBinary(
return true;
}
+std::vector<addr_t>
+GDBRemoteCommunicationClient::GetProcessStandaloneBinaries() {
+ if (m_qProcessInfo_is_valid == eLazyBoolCalculate)
+ GetCurrentProcessInfo();
+ return m_binary_addresses;
+}
+
bool GDBRemoteCommunicationClient::GetGDBServerVersion() {
if (m_qGDBServerVersion_is_valid == eLazyBoolCalculate) {
m_gdb_server_name.clear();
@@ -2192,6 +2199,14 @@ bool GDBRemoteCommunicationClient::GetCurrentProcessInfo(bool allow_lazy) {
m_process_standalone_value_is_offset = false;
++num_keys_decoded;
}
+ } else if (name.equals("binary-addresses")) {
+ addr_t addr;
+ while (!value.empty()) {
+ llvm::StringRef addr_str;
+ std::tie(addr_str, value) = value.split(',');
+ if (!addr_str.getAsInteger(16, addr))
+ m_binary_addresses.push_back(addr);
+ }
}
}
if (num_keys_decoded > 0)
diff --git a/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.h b/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.h
index 3d838d6d80747..3a62747603f6d 100644
--- a/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.h
+++ b/lldb/source/Plugins/Process/gdb-remote/GDBRemoteCommunicationClient.h
@@ -220,6 +220,8 @@ class GDBRemoteCommunicationClient : public GDBRemoteClientBase {
bool GetProcessStandaloneBinary(UUID &uuid, lldb::addr_t &value,
bool &value_is_offset);
+ std::vector<lldb::addr_t> GetProcessStandaloneBinaries();
+
void GetRemoteQSupported();
bool GetVContSupported(char flavor);
@@ -593,6 +595,7 @@ class GDBRemoteCommunicationClient : public GDBRemoteClientBase {
UUID m_process_standalone_uuid;
lldb::addr_t m_process_standalone_value = LLDB_INVALID_ADDRESS;
bool m_process_standalone_value_is_offset = false;
+ std::vector<lldb::addr_t> m_binary_addresses;
llvm::VersionTuple m_os_version;
llvm::VersionTuple m_maccatalyst_version;
std::string m_os_build;
diff --git a/lldb/source/Plugins/Process/gdb-remote/ProcessGDBRemote.cpp b/lldb/source/Plugins/Process/gdb-remote/ProcessGDBRemote.cpp
index b7de05d498aa9..e3dada1864da5 100644
--- a/lldb/source/Plugins/Process/gdb-remote/ProcessGDBRemote.cpp
+++ b/lldb/source/Plugins/Process/gdb-remote/ProcessGDBRemote.cpp
@@ -581,80 +581,31 @@ Status ProcessGDBRemote::DoConnectRemote(llvm::StringRef remote_url) {
ModuleSP module_sp;
if (standalone_uuid.IsValid()) {
- ModuleSpec module_spec;
- module_spec.GetUUID() = standalone_uuid;
-
- // Look up UUID in global module cache before attempting
- // a more expensive search.
- Status error = ModuleList::GetSharedModule(module_spec, module_sp,
- nullptr, nullptr, nullptr);
-
- if (!module_sp) {
- // Force a an external lookup, if that tool is available.
- if (!module_spec.GetSymbolFileSpec()) {
- Status error;
- Symbols::DownloadObjectAndSymbolFile(module_spec, error, true);
- }
-
- if (FileSystem::Instance().Exists(module_spec.GetFileSpec())) {
- module_sp = std::make_shared<Module>(module_spec);
- }
- }
-
- // If we couldn't find the binary anywhere else, as a last resort,
- // read it out of memory.
- if (!module_sp.get() && standalone_value != LLDB_INVALID_ADDRESS &&
- !standalone_value_is_offset) {
- char namebuf[80];
- snprintf(namebuf, sizeof(namebuf), "mem-image-0x%" PRIx64,
- standalone_value);
- module_sp =
- ReadModuleFromMemory(FileSpec(namebuf), standalone_value);
- }
-
- Log *log = GetLog(LLDBLog::DynamicLoader);
- if (module_sp.get()) {
- target.GetImages().AppendIfNeeded(module_sp, false);
-
- bool changed = false;
- if (module_sp->GetObjectFile()) {
- if (standalone_value != LLDB_INVALID_ADDRESS) {
- if (log)
- log->Printf("Loading binary UUID %s at %s 0x%" PRIx64,
- standalone_uuid.GetAsString().c_str(),
- standalone_value_is_offset ? "offset" : "address",
- standalone_value);
- module_sp->SetLoadAddress(target, standalone_value,
- standalone_value_is_offset, changed);
- } else {
- // No address/offset/slide, load the binary at file address,
- // offset 0.
- if (log)
- log->Printf("Loading binary UUID %s at file address",
- standalone_uuid.GetAsString().c_str());
- const bool value_is_slide = true;
- module_sp->SetLoadAddress(target, 0, value_is_slide, changed);
- }
- } else {
- // In-memory image, load at its true address, offset 0.
- if (log)
- log->Printf("Loading binary UUID %s from memory",
- standalone_uuid.GetAsString().c_str());
- const bool value_is_slide = true;
- module_sp->SetLoadAddress(target, 0, value_is_slide, changed);
- }
+ const bool force_symbol_search = true;
+ const bool notify = true;
+ DynamicLoader::LoadBinaryWithUUIDAndAddress(
+ this, standalone_uuid, standalone_value,
+ standalone_value_is_offset, force_symbol_search, notify);
+ }
+ }
- ModuleList added_module;
- added_module.Append(module_sp, false);
- target.ModulesDidLoad(added_module);
- } else {
- if (log)
- log->Printf("Unable to find binary with UUID %s and load it at "
- "%s 0x%" PRIx64,
- standalone_uuid.GetAsString().c_str(),
- standalone_value_is_offset ? "offset" : "address",
- standalone_value);
- }
+ // The remote stub may know about a list of binaries to
+ // force load into the process -- a firmware type situation
+ // where multiple binaries are present in virtual memory,
+ // and we are only given the addresses of the binaries.
+ // Not intended for use with userland debugging when we
+ // a DynamicLoader plugin that knows how to find the loaded
+ // binaries and will track updates as binaries are added.
+
+ std::vector<addr_t> bin_addrs = m_gdb_comm.GetProcessStandaloneBinaries();
+ if (bin_addrs.size()) {
+ UUID uuid;
+ const bool value_is_slide = false;
+ for (addr_t addr : bin_addrs) {
+ const bool force_symbol_search = true;
+ const bool notify = true;
+ DynamicLoader::LoadBinaryWithUUIDAndAddress(
+ this, uuid, addr, value_is_slide, force_symbol_search, notify);
}
}
diff --git a/lldb/source/Plugins/Process/mach-core/ProcessMachCore.cpp b/lldb/source/Plugins/Process/mach-core/ProcessMachCore.cpp
index 7f943a5258c40..68786e8d80b00 100644
--- a/lldb/source/Plugins/Process/mach-core/ProcessMachCore.cpp
+++ b/lldb/source/Plugins/Process/mach-core/ProcessMachCore.cpp
@@ -180,88 +180,6 @@ bool ProcessMachCore::GetDynamicLoaderAddress(lldb::addr_t addr) {
return false;
}
-// We have a hint about a binary -- a UUID, possibly a load address.
-// Try to load a file with that UUID into lldb, and if we have a load
-// address, set it correctly. Else assume that the binary was loaded
-// with no slide.
-static bool load_standalone_binary(UUID uuid, addr_t value,
- bool value_is_offset, Target &target) {
- if (uuid.IsValid()) {
- ModuleSpec module_spec;
- module_spec.GetUUID() = uuid;
-
- // Look up UUID in global module cache before attempting
- // dsymForUUID-like action.
- ModuleSP module_sp;
- Status error = ModuleList::GetSharedModule(module_spec, module_sp, nullptr,
- nullptr, nullptr);
-
- if (!module_sp.get()) {
- // Force a a dsymForUUID lookup, if that tool is available.
- if (!module_spec.GetSymbolFileSpec()) {
- Status error;
- Symbols::DownloadObjectAndSymbolFile(module_spec, error, true);
- }
-
- if (FileSystem::Instance().Exists(module_spec.GetFileSpec())) {
- module_sp = std::make_shared<Module>(module_spec);
- }
- }
-
- // If we couldn't find the binary anywhere else, as a last resort,
- // read it out of memory in the corefile.
- if (!module_sp.get() && value != LLDB_INVALID_ADDRESS && !value_is_offset) {
- char namebuf[80];
- snprintf(namebuf, sizeof(namebuf), "mem-image-0x%" PRIx64, value);
- module_sp =
- target.GetProcessSP()->ReadModuleFromMemory(FileSpec(namebuf), value);
- }
-
- if (module_sp.get()) {
- target.SetArchitecture(module_sp->GetObjectFile()->GetArchitecture());
- target.GetImages().AppendIfNeeded(module_sp, false);
-
- // TODO: Instead of using the load address as a value, if we create a
- // memory module from that address, we could get the correct segment
- // offset values from the in-memory load commands and set them correctly.
- // In case the load address we were given is not correct for all segments,
- // e.g. something in the shared cache. DynamicLoaderDarwinKernel does
- // something similar for kexts. In the context of a corefile, this would
- // be an inexpensive operation. Not all binaries in a corefile will have
- // a Mach-O header/load commands in memory, so this will not work in all
- // cases.
-
- bool changed = false;
- if (module_sp->GetObjectFile()) {
- if (value != LLDB_INVALID_ADDRESS) {
- module_sp->SetLoadAddress(target, value, value_is_offset, changed);
- } else {
- // No address/offset/slide, load the binary at file address,
- // offset 0.
- const bool value_is_slide = true;
- module_sp->SetLoadAddress(target, 0, value_is_slide, changed);
- }
- } else {
- // In-memory image, load at its true address, offset 0.
- const bool value_is_slide = true;
- module_sp->SetLoadAddress(target, 0, value_is_slide, changed);
- }
-
- ModuleList added_module;
- added_module.Append(module_sp, false);
- target.ModulesDidLoad(added_module);
-
- // Flush info in the process (stack frames, etc).
- ProcessSP process_sp(target.GetProcessSP());
- if (process_sp)
- process_sp->Flush();
-
- return true;
- }
- }
- return false;
-}
-
// Process Control
Status ProcessMachCore::DoLoadCore() {
Log *log(GetLog(LLDBLog::DynamicLoader | LLDBLog::Process));
@@ -359,28 +277,21 @@ Status ProcessMachCore::DoLoadCore() {
objfile_binary_uuid.GetAsString().c_str(), objfile_binary_value,
objfile_binary_value_is_offset, type);
}
- if (objfile_binary_value != LLDB_INVALID_ADDRESS &&
- !objfile_binary_value_is_offset) {
- if (type == ObjectFile::eBinaryTypeUser) {
- load_standalone_binary(objfile_binary_uuid, objfile_binary_value,
- objfile_binary_value_is_offset, GetTarget());
- m_dyld_addr = objfile_binary_value;
- m_dyld_plugin_name = DynamicLoaderMacOSXDYLD::GetPluginNameStatic();
- found_main_binary_definitively = true;
- }
- if (type == ObjectFile::eBinaryTypeKernel) {
- m_mach_kernel_addr = objfile_binary_value;
- m_dyld_plugin_name = DynamicLoaderDarwinKernel::GetPluginNameStatic();
- found_main_binary_definitively = true;
- }
+ const bool force_symbol_search = true;
+ const bool notify = true;
+ if (DynamicLoader::LoadBinaryWithUUIDAndAddress(
+ this, objfile_binary_uuid, objfile_binary_value,
+ objfile_binary_value_is_offset, force_symbol_search, notify)) {
+ found_main_binary_definitively = true;
+ m_dyld_plugin_name = DynamicLoaderStatic::GetPluginNameStatic();
}
- if (!found_main_binary_definitively) {
- // ObjectFile::eBinaryTypeStandalone, undeclared types
- if (load_standalone_binary(objfile_binary_uuid, objfile_binary_value,
- objfile_binary_value_is_offset, GetTarget())) {
- found_main_binary_definitively = true;
- m_dyld_plugin_name = DynamicLoaderStatic::GetPluginNameStatic();
- }
+ if (type == ObjectFile::eBinaryTypeUser) {
+ m_dyld_addr = objfile_binary_value;
+ m_dyld_plugin_name = DynamicLoaderMacOSXDYLD::GetPluginNameStatic();
+ }
+ if (type == ObjectFile::eBinaryTypeKernel) {
+ m_mach_kernel_addr = objfile_binary_value;
+ m_dyld_plugin_name = DynamicLoaderDarwinKernel::GetPluginNameStatic();
}
}
@@ -426,8 +337,11 @@ Status ProcessMachCore::DoLoadCore() {
// We have no address specified, only a UUID. Load it at the file
// address.
const bool value_is_offset = false;
- if (load_standalone_binary(ident_uuid, ident_binary_addr, value_is_offset,
- GetTarget())) {
+ const bool force_symbol_search = true;
+ const bool notify = true;
+ if (DynamicLoader::LoadBinaryWithUUIDAndAddress(
+ this, ident_uuid, ident_binary_addr, value_is_offset,
+ force_symbol_search, notify)) {
found_main_binary_definitively = true;
m_dyld_plugin_name = DynamicLoaderStatic::GetPluginNameStatic();
}
diff --git a/lldb/source/Utility/UuidCompatibility.h b/lldb/source/Utility/UuidCompatibility.h
index e992c0c79a1f8..fe4aed00a3514 100644
--- a/lldb/source/Utility/UuidCompatibility.h
+++ b/lldb/source/Utility/UuidCompatibility.h
@@ -14,4 +14,12 @@
// uuid_t is guaranteed to always be a 16-byte array
typedef unsigned char uuid_t[16];
+// Return 1 if uuid is null, that is, all zeroes.
+int uuid_is_null(uuid_t uuid) {
+ for (int i = 0; i < 16; i++)
+ if (uuid[i])
+ return 0;
+ return 1;
+}
+
#endif // utility_UUID_COMPATIBILITY_H
diff --git a/lldb/test/API/macosx/lc-note/multiple-binary-corefile/Makefile b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/Makefile
new file mode 100644
index 0000000000000..8e561f17383fe
--- /dev/null
+++ b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/Makefile
@@ -0,0 +1,20 @@
+MAKE_DSYM := NO
+C_SOURCES := main.c
+LD_EXTRAS := -L. -lone -ltwo
+
+.PHONY: libone.dylib libtwo.dylib
+all: libone.dylib libtwo.dylib a.out create-empty-corefile
+
+create-empty-corefile:
+ "$(MAKE)" -f "$(MAKEFILE_RULES)" EXE=create-multibin-corefile \
+ CXX_SOURCES=create-multibin-corefile.cpp
+
+libone.dylib: one.c
+ $(MAKE) -f $(MAKEFILE_RULES) \
+ DYLIB_ONLY=YES DYLIB_NAME=one DYLIB_C_SOURCES=one.c
+
+libtwo.dylib: two.c
+ $(MAKE) -f $(MAKEFILE_RULES) \
+ DYLIB_ONLY=YES DYLIB_NAME=two DYLIB_C_SOURCES=two.c
+
+include Makefile.rules
diff --git a/lldb/test/API/macosx/lc-note/multiple-binary-corefile/TestMultipleBinaryCorefile.py b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/TestMultipleBinaryCorefile.py
new file mode 100644
index 0000000000000..5e74f0c3f8bfa
--- /dev/null
+++ b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/TestMultipleBinaryCorefile.py
@@ -0,0 +1,187 @@
+"""Test corefiles with "main bin spec"/"load binary" with only addrs work."""
+
+
+import os
+import re
+import subprocess
+
+import lldb
+from lldbsuite.test.decorators import *
+from lldbsuite.test.lldbtest import *
+from lldbsuite.test import lldbutil
+
+
+class TestMultipleBinaryCorefile(TestBase):
+
+ def initial_setup(self):
+ self.build()
+ self.aout_exe_basename = "a.out"
+ self.libone_exe_basename = "libone.dylib"
+ self.libtwo_exe_basename = "libtwo.dylib"
+ self.aout_exe = self.getBuildArtifact(self.aout_exe_basename)
+ self.aout_slide = 0x5000
+ self.libone_exe = self.getBuildArtifact(self.libone_exe_basename)
+ self.libone_slide = 0x100840000
+ self.libtwo_exe = self.getBuildArtifact(self.libtwo_exe_basename)
+ self.libtwo_slide = 0
+ self.corefile = self.getBuildArtifact("multiple-binaries.core")
+ self.create_corefile = self.getBuildArtifact("create-multibin-corefile")
+ cmd="%s %s %s@%x %s@%x %s@%x" % (self.create_corefile, self.corefile,
+ self.aout_exe, self.aout_slide,
+ self.libone_exe, self.libone_slide,
+ self.libtwo_exe, self.libtwo_slide)
+ call(cmd, shell=True)
+
+
+ def load_corefile_and_test(self):
+ target = self.dbg.CreateTarget('')
+ err = lldb.SBError()
+ if self.TraceOn():
+ self.runCmd("script print('loading corefile %s')" % self.corefile)
+ process = target.LoadCore(self.corefile)
+ self.assertEqual(process.IsValid(), True)
+ if self.TraceOn():
+ self.runCmd("script print('image list after loading corefile:')")
+ self.runCmd("image list")
+
+ self.assertEqual(target.GetNumModules(), 3)
+ fspec = target.GetModuleAtIndex(0).GetFileSpec()
+ self.assertEqual(fspec.GetFilename(), self.aout_exe_basename)
+
+ # libone.dylib was never loaded into lldb, see that we added a memory module.
+ fspec = target.GetModuleAtIndex(1).GetFileSpec()
+ self.assertIn('memory-image', fspec.GetFilename())
+
+ dwarfdump_uuid_regex = re.compile(
+ 'UUID: ([-0-9a-fA-F]+) \(([^\(]+)\) .*')
+ dwarfdump_cmd_output = subprocess.check_output(
+ ('/usr/bin/dwarfdump --uuid "%s"' % self.libone_exe), shell=True).decode("utf-8")
+ libone_uuid = None
+ for line in dwarfdump_cmd_output.splitlines():
+ match = dwarfdump_uuid_regex.search(line)
+ if match:
+ libone_uuid = match.group(1)
+
+ memory_image_uuid = target.GetModuleAtIndex(1).GetUUIDString()
+ self.assertEqual(libone_uuid, memory_image_uuid)
+
+ fspec = target.GetModuleAtIndex(2).GetFileSpec()
+ self.assertEqual(fspec.GetFilename(), self.libtwo_exe_basename)
+
+ # Executables "always" have this base address
+ aout_load = target.GetModuleAtIndex(0).GetObjectFileHeaderAddress().GetLoadAddress(target)
+ self.assertEqual(aout_load, 0x100000000 + self.aout_slide)
+
+ # Value from Makefile
+ libone_load = target.GetModuleAtIndex(1).GetObjectFileHeaderAddress().GetLoadAddress(target)
+ self.assertEqual(libone_load, self.libone_slide)
+
+ # Value from Makefile
+ libtwo_load = target.GetModuleAtIndex(2).GetObjectFileHeaderAddress().GetLoadAddress(target)
+ self.assertEqual(libtwo_load, self.libtwo_slide)
+
+ self.dbg.DeleteTarget(target)
+ self.dbg.Clear()
+
+ NO_DEBUG_INFO_TESTCASE = True
+
+ @skipIf(archs=no_match(['x86_64', 'arm64', 'arm64e', 'aarch64']))
+ @skipIfRemote
+ @skipUnlessDarwin
+ def test_corefile_binaries_dsymforuuid(self):
+ self.initial_setup()
+
+ if self.TraceOn():
+ self.runCmd("log enable lldb dyld host")
+ self.addTearDownHook(lambda: self.runCmd("log disable lldb dyld host"))
+
+ ## We can hook in our dsym-for-uuid shell script to lldb with this env
+ ## var instead of requiring a defaults write.
+ dsym_for_uuid = self.getBuildArtifact("dsym-for-uuid.sh")
+ os.environ['LLDB_APPLE_DSYMFORUUID_EXECUTABLE'] = dsym_for_uuid
+ if self.TraceOn():
+ print("Setting env var LLDB_APPLE_DSYMFORUUID_EXECUTABLE=" + dsym_for_uuid)
+ self.addTearDownHook(lambda: os.environ.pop('LLDB_APPLE_DSYMFORUUID_EXECUTABLE', None))
+
+ self.runCmd("settings set target.load-script-from-symbol-file true")
+ self.addTearDownHook(lambda: self.runCmd("settings set target.load-script-from-symbol-file false"))
+
+ dwarfdump_uuid_regex = re.compile(
+ 'UUID: ([-0-9a-fA-F]+) \(([^\(]+)\) .*')
+ dwarfdump_cmd_output = subprocess.check_output(
+ ('/usr/bin/dwarfdump --uuid "%s"' % self.libtwo_exe), shell=True).decode("utf-8")
+ libtwo_uuid = None
+ for line in dwarfdump_cmd_output.splitlines():
+ match = dwarfdump_uuid_regex.search(line)
+ if match:
+ libtwo_uuid = match.group(1)
+ self.assertNotEqual(libtwo_uuid, None, "Could not get uuid of built libtwo.dylib")
+
+ ### Create our dsym-for-uuid shell script which returns aout_exe
+ shell_cmds = [
+ '#! /bin/sh',
+ '# the last argument is the uuid',
+ 'while [ $# -gt 1 ]',
+ 'do',
+ ' shift',
+ 'done',
+ 'ret=0',
+ 'echo "<?xml version=\\"1.0\\" encoding=\\"UTF-8\\"?>"',
+ 'echo "<!DOCTYPE plist PUBLIC \\"-//Apple//DTD PLIST 1.0//EN\\" \\"http://www.apple.com/DTDs/PropertyList-1.0.dtd\\">"',
+ 'echo "<plist version=\\"1.0\\">"',
+ '',
+ 'if [ "$1" != "%s" ]' % (libtwo_uuid),
+ 'then',
+ ' echo "<key>DBGError</key><string>not found</string>"',
+ ' echo "</plist>"',
+ ' exit 1',
+ 'fi',
+ ' uuid=%s' % libtwo_uuid,
+ ' bin=%s' % self.libtwo_exe,
+ ' dsym=%s.dSYM/Contents/Resources/DWARF/%s' % (self.libtwo_exe, os.path.basename(self.libtwo_exe)),
+ 'echo "<dict><key>$uuid</key><dict>"',
+ '',
+ 'echo "<key>DBGDSYMPath</key><string>$dsym</string>"',
+ 'echo "<key>DBGSymbolRichExecutable</key><string>$bin</string>"',
+ 'echo "</dict></dict></plist>"',
+ 'exit $ret'
+ ]
+
+ with open(dsym_for_uuid, "w") as writer:
+ for l in shell_cmds:
+ writer.write(l + '\n')
+
+ os.chmod(dsym_for_uuid, 0o755)
+
+ # Register TWO of our binaries, but require dsymForUUID to find the third.
+ target = self.dbg.CreateTarget(self.aout_exe, '', '', False, lldb.SBError())
+ self.dbg.DeleteTarget(target)
+
+ if self.TraceOn():
+ self.runCmd("script print('Global image list, before loading corefile:')")
+ self.runCmd("image list -g")
+
+ self.load_corefile_and_test()
+
+ @skipIf(archs=no_match(['x86_64', 'arm64', 'arm64e', 'aarch64']))
+ @skipIfRemote
+ @skipUnlessDarwin
+ def test_corefile_binaries_preloaded(self):
+ self.initial_setup()
+
+ if self.TraceOn():
+ self.runCmd("log enable lldb dyld host")
+ self.addTearDownHook(lambda: self.runCmd("log disable lldb dyld host"))
+
+ # Register all three binaries in lldb's global module
+ # cache, then throw the Targets away.
+ target = self.dbg.CreateTarget(self.aout_exe, '', '', False, lldb.SBError())
+ self.dbg.DeleteTarget(target)
+ target = self.dbg.CreateTarget(self.libtwo_exe, '', '', False, lldb.SBError())
+ self.dbg.DeleteTarget(target)
+
+ if self.TraceOn():
+ self.runCmd("script print('Global image list, before loading corefile:')")
+ self.runCmd("image list -g")
+
+ self.load_corefile_and_test()
diff --git a/lldb/test/API/macosx/lc-note/multiple-binary-corefile/create-multibin-corefile.cpp b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/create-multibin-corefile.cpp
new file mode 100644
index 0000000000000..ebe71606806dd
--- /dev/null
+++ b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/create-multibin-corefile.cpp
@@ -0,0 +1,484 @@
+#include <errno.h>
+#include <fcntl.h>
+#include <inttypes.h>
+#include <mach-o/loader.h>
+#include <mach/thread_status.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <string>
+#include <sys/errno.h>
+#include <sys/stat.h>
+#include <sys/types.h>
+#include <sys/uio.h>
+#include <unistd.h>
+#include <uuid/uuid.h>
+#include <vector>
+
+// Given a list of binaries, and optional slides to be applied,
+// create a corefile whose memory is those binaries laid at at
+// their slid addresses.
+//
+// Add a 'main bin spec' LC_NOTE for the first binary, and
+// 'load binary' LC_NOTEs for any additional binaries, and
+// these LC_NOTEs will ONLY have the vmaddr of the binary - no
+// UUID, no slide, no filename.
+//
+// Test that lldb can use the load addresses, find the UUIDs,
+// and load the binaries/dSYMs and put them at the correct load
+// address.
+
+struct main_bin_spec_payload {
+ uint32_t version;
+ uint32_t type;
+ uint64_t address;
+ uint64_t slide;
+ uuid_t uuid;
+ uint32_t log2_pagesize;
+ uint32_t platform;
+};
+
+struct load_binary_payload {
+ uint32_t version;
+ uuid_t uuid;
+ uint64_t address;
+ uint64_t slide;
+ const char name[4];
+};
+
+union uint32_buf {
+ uint8_t bytebuf[4];
+ uint32_t val;
+};
+
+union uint64_buf {
+ uint8_t bytebuf[8];
+ uint64_t val;
+};
+
+void add_uint64(std::vector<uint8_t> &buf, uint64_t val) {
+ uint64_buf conv;
+ conv.val = val;
+ for (int i = 0; i < 8; i++)
+ buf.push_back(conv.bytebuf[i]);
+}
+
+void add_uint32(std::vector<uint8_t> &buf, uint32_t val) {
+ uint32_buf conv;
+ conv.val = val;
+ for (int i = 0; i < 4; i++)
+ buf.push_back(conv.bytebuf[i]);
+}
+
+std::vector<uint8_t> lc_thread_load_command(cpu_type_t cputype) {
+ std::vector<uint8_t> data;
+ // Emit an LC_THREAD register context appropriate for the cputype
+ // of the binary we're embedded. The tests in this case do not
+ // use the register values, so 0's are fine, lldb needs to see at
+ // least one LC_THREAD in the corefile.
+#if defined(__x86_64__)
+ if (cputype == CPU_TYPE_X86_64) {
+ add_uint32(data, LC_THREAD); // thread_command.cmd
+ add_uint32(data,
+ 16 + (x86_THREAD_STATE64_COUNT * 4)); // thread_command.cmdsize
+ add_uint32(data, x86_THREAD_STATE64); // thread_command.flavor
+ add_uint32(data, x86_THREAD_STATE64_COUNT); // thread_command.count
+ for (int i = 0; i < x86_THREAD_STATE64_COUNT; i++) {
+ add_uint32(data, 0); // whatever, just some empty register values
+ }
+ }
+#endif
+#if defined(__arm64__) || defined(__aarch64__)
+ if (cputype == CPU_TYPE_ARM64) {
+ add_uint32(data, LC_THREAD); // thread_command.cmd
+ add_uint32(data,
+ 16 + (ARM_THREAD_STATE64_COUNT * 4)); // thread_command.cmdsize
+ add_uint32(data, ARM_THREAD_STATE64); // thread_command.flavor
+ add_uint32(data, ARM_THREAD_STATE64_COUNT); // thread_command.count
+ for (int i = 0; i < ARM_THREAD_STATE64_COUNT; i++) {
+ add_uint32(data, 0); // whatever, just some empty register values
+ }
+ }
+#endif
+ return data;
+}
+
+void add_lc_note_main_bin_spec_load_command(
+ std::vector<std::vector<uint8_t>> &loadcmds, std::vector<uint8_t> &payload,
+ int payload_file_offset, std::string uuidstr, uint64_t address,
+ uint64_t slide) {
+ std::vector<uint8_t> loadcmd_data;
+
+ add_uint32(loadcmd_data, LC_NOTE); // note_command.cmd
+ add_uint32(loadcmd_data, 40); // note_command.cmdsize
+ char lc_note_name[16];
+ memset(lc_note_name, 0, 16);
+ strcpy(lc_note_name, "main bin spec");
+
+ // lc_note.data_owner
+ for (int i = 0; i < 16; i++)
+ loadcmd_data.push_back(lc_note_name[i]);
+
+ // we start writing the payload at payload_file_offset to leave
+ // room at the start for the header & the load commands.
+ uint64_t current_payload_offset = payload.size() + payload_file_offset;
+
+ add_uint64(loadcmd_data, current_payload_offset); // note_command.offset
+ add_uint64(loadcmd_data,
+ sizeof(struct main_bin_spec_payload)); // note_command.size
+
+ loadcmds.push_back(loadcmd_data);
+
+ // Now write the "main bin spec" payload.
+ add_uint32(payload, 2); // version
+ add_uint32(payload, 3); // type == 3 [ firmware, standalone, etc ]
+ add_uint64(payload, address); // load address
+ add_uint64(payload, slide); // slide
+ uuid_t uuid;
+ uuid_parse(uuidstr.c_str(), uuid);
+ for (int i = 0; i < sizeof(uuid_t); i++)
+ payload.push_back(uuid[i]);
+ add_uint32(payload, 0); // log2_pagesize unspecified
+ add_uint32(payload, 0); // platform unspecified
+}
+
+void add_lc_note_load_binary_load_command(
+ std::vector<std::vector<uint8_t>> &loadcmds, std::vector<uint8_t> &payload,
+ int payload_file_offset, std::string uuidstr, uint64_t address,
+ uint64_t slide) {
+ std::vector<uint8_t> loadcmd_data;
+
+ add_uint32(loadcmd_data, LC_NOTE); // note_command.cmd
+ add_uint32(loadcmd_data, 40); // note_command.cmdsize
+ char lc_note_name[16];
+ memset(lc_note_name, 0, 16);
+ strcpy(lc_note_name, "load binary");
+
+ // lc_note.data_owner
+ for (int i = 0; i < 16; i++)
+ loadcmd_data.push_back(lc_note_name[i]);
+
+ // we start writing the payload at payload_file_offset to leave
+ // room at the start for the header & the load commands.
+ uint64_t current_payload_offset = payload.size() + payload_file_offset;
+
+ add_uint64(loadcmd_data, current_payload_offset); // note_command.offset
+ add_uint64(loadcmd_data,
+ sizeof(struct load_binary_payload)); // note_command.size
+
+ loadcmds.push_back(loadcmd_data);
+
+ // Now write the "load binary" payload.
+ add_uint32(payload, 1); // version
+ uuid_t uuid;
+ uuid_parse(uuidstr.c_str(), uuid);
+ for (int i = 0; i < sizeof(uuid_t); i++)
+ payload.push_back(uuid[i]);
+ add_uint64(payload, address); // load address
+ add_uint64(payload, slide); // slide
+ add_uint32(payload, 0); // name
+}
+
+void add_lc_segment(std::vector<std::vector<uint8_t>> &loadcmds,
+ std::vector<uint8_t> &payload, int payload_file_offset,
+ uint64_t vmaddr, uint64_t size) {
+ std::vector<uint8_t> loadcmd_data;
+ struct segment_command_64 seg;
+ seg.cmd = LC_SEGMENT_64;
+ seg.cmdsize = sizeof(struct segment_command_64); // no sections
+ memset(seg.segname, 0, 16);
+ seg.vmaddr = vmaddr;
+ seg.vmsize = size;
+ seg.fileoff = payload.size() + payload_file_offset;
+ seg.filesize = size;
+ seg.maxprot = 1;
+ seg.initprot = 1;
+ seg.nsects = 0;
+ seg.flags = 0;
+
+ uint8_t *p = (uint8_t *)&seg;
+ for (int i = 0; i < sizeof(struct segment_command_64); i++) {
+ loadcmd_data.push_back(*(p + i));
+ }
+ loadcmds.push_back(loadcmd_data);
+}
+
+std::string scan_binary(const char *fn, uint64_t &vmaddr, cpu_type_t &cputype,
+ cpu_subtype_t &cpusubtype) {
+ FILE *f = fopen(fn, "r");
+ if (f == nullptr) {
+ fprintf(stderr, "Unable to open binary '%s' to get uuid\n", fn);
+ exit(1);
+ }
+ uint32_t num_of_load_cmds = 0;
+ uint32_t size_of_load_cmds = 0;
+ std::string uuid;
+ off_t file_offset = 0;
+ vmaddr = UINT64_MAX;
+
+ uint8_t magic[4];
+ if (::fread(magic, 1, 4, f) != 4) {
+ fprintf(stderr, "Failed to read magic number from input file %s\n", fn);
+ exit(1);
+ }
+ uint8_t magic_32_be[] = {0xfe, 0xed, 0xfa, 0xce};
+ uint8_t magic_32_le[] = {0xce, 0xfa, 0xed, 0xfe};
+ uint8_t magic_64_be[] = {0xfe, 0xed, 0xfa, 0xcf};
+ uint8_t magic_64_le[] = {0xcf, 0xfa, 0xed, 0xfe};
+
+ if (memcmp(magic, magic_32_be, 4) == 0 ||
+ memcmp(magic, magic_64_be, 4) == 0) {
+ fprintf(stderr, "big endian corefiles not supported\n");
+ exit(1);
+ }
+
+ ::fseeko(f, 0, SEEK_SET);
+ if (memcmp(magic, magic_32_le, 4) == 0) {
+ struct mach_header mh;
+ if (::fread(&mh, 1, sizeof(mh), f) != sizeof(mh)) {
+ fprintf(stderr, "error reading mach header from input file\n");
+ exit(1);
+ }
+ if (mh.cputype != CPU_TYPE_X86_64 && mh.cputype != CPU_TYPE_ARM64) {
+ fprintf(stderr,
+ "This tool creates an x86_64/arm64 corefile but "
+ "the supplied binary '%s' is cputype 0x%x\n",
+ fn, (uint32_t)mh.cputype);
+ exit(1);
+ }
+ num_of_load_cmds = mh.ncmds;
+ size_of_load_cmds = mh.sizeofcmds;
+ file_offset += sizeof(struct mach_header);
+ cputype = mh.cputype;
+ cpusubtype = mh.cpusubtype;
+ } else {
+ struct mach_header_64 mh;
+ if (::fread(&mh, 1, sizeof(mh), f) != sizeof(mh)) {
+ fprintf(stderr, "error reading mach header from input file\n");
+ exit(1);
+ }
+ if (mh.cputype != CPU_TYPE_X86_64 && mh.cputype != CPU_TYPE_ARM64) {
+ fprintf(stderr,
+ "This tool creates an x86_64/arm64 corefile but "
+ "the supplied binary '%s' is cputype 0x%x\n",
+ fn, (uint32_t)mh.cputype);
+ exit(1);
+ }
+ num_of_load_cmds = mh.ncmds;
+ size_of_load_cmds = mh.sizeofcmds;
+ file_offset += sizeof(struct mach_header_64);
+ cputype = mh.cputype;
+ cpusubtype = mh.cpusubtype;
+ }
+
+ off_t load_cmds_offset = file_offset;
+
+ for (int i = 0; i < num_of_load_cmds &&
+ (file_offset - load_cmds_offset) < size_of_load_cmds;
+ i++) {
+ ::fseeko(f, file_offset, SEEK_SET);
+ uint32_t cmd;
+ uint32_t cmdsize;
+ ::fread(&cmd, sizeof(uint32_t), 1, f);
+ ::fread(&cmdsize, sizeof(uint32_t), 1, f);
+ if (vmaddr == UINT64_MAX && cmd == LC_SEGMENT_64) {
+ struct segment_command_64 segcmd;
+ ::fseeko(f, file_offset, SEEK_SET);
+ if (::fread(&segcmd, 1, sizeof(segcmd), f) != sizeof(segcmd)) {
+ fprintf(stderr, "Unable to read LC_SEGMENT_64 load command.\n");
+ exit(1);
+ }
+ if (strcmp("__TEXT", segcmd.segname) == 0)
+ vmaddr = segcmd.vmaddr;
+ }
+ if (cmd == LC_UUID) {
+ struct uuid_command uuidcmd;
+ ::fseeko(f, file_offset, SEEK_SET);
+ if (::fread(&uuidcmd, 1, sizeof(uuidcmd), f) != sizeof(uuidcmd)) {
+ fprintf(stderr, "Unable to read LC_UUID load command.\n");
+ exit(1);
+ }
+ uuid_string_t uuidstr;
+ uuid_unparse(uuidcmd.uuid, uuidstr);
+ uuid = uuidstr;
+ }
+ file_offset += cmdsize;
+ }
+ return uuid;
+}
+
+void slide_macho_binary(std::vector<uint8_t> &image, uint64_t slide) {
+ uint8_t *p = image.data();
+ struct mach_header_64 *mh = (struct mach_header_64 *)p;
+ p += sizeof(struct mach_header_64);
+ for (int lc_idx = 0; lc_idx < mh->ncmds; lc_idx++) {
+ struct load_command *lc = (struct load_command *)p;
+ if (lc->cmd == LC_SEGMENT_64) {
+ struct segment_command_64 *seg = (struct segment_command_64 *)p;
+ if (seg->maxprot != 0 && seg->nsects > 0) {
+ seg->vmaddr += slide;
+ uint8_t *j = p + sizeof(segment_command_64);
+ for (int sect_idx = 0; sect_idx < seg->nsects; sect_idx++) {
+ struct section_64 *sect = (struct section_64 *)j;
+ sect->addr += slide;
+ j += sizeof(struct section_64);
+ }
+ }
+ }
+ p += lc->cmdsize;
+ }
+}
+
+int main(int argc, char **argv) {
+ if (argc < 3) {
+ fprintf(stderr,
+ "usage: output-corefile binary1[@optional-slide] "
+ "[binary2[@optional-slide] [binary3[@optional-slide] ...]]\n");
+ exit(1);
+ }
+
+ // An array of load commands (in the form of byte arrays)
+ std::vector<std::vector<uint8_t>> load_commands;
+
+ // An array of corefile contents (page data, lc_note data, etc)
+ std::vector<uint8_t> payload;
+
+ std::vector<std::string> input_filenames;
+ std::vector<uint64_t> input_slides;
+ std::vector<uint64_t> input_filesizes;
+ std::vector<uint64_t> input_filevmaddrs;
+ uint64_t main_binary_cputype = CPU_TYPE_ARM64;
+ uint64_t vmaddr = UINT64_MAX;
+ cpu_type_t cputype;
+ cpu_subtype_t cpusubtype;
+ for (int i = 2; i < argc; i++) {
+ std::string filename;
+ std::string filename_and_opt_hex(argv[i]);
+ uint64_t slide = 0;
+ auto at_pos = filename_and_opt_hex.find_last_of('@');
+ if (at_pos == std::string::npos) {
+ filename = filename_and_opt_hex;
+ } else {
+ filename = filename_and_opt_hex.substr(0, at_pos);
+ std::string hexstr = filename_and_opt_hex.substr(at_pos + 1);
+ errno = 0;
+ slide = (uint64_t)strtoull(hexstr.c_str(), nullptr, 16);
+ if (errno != 0) {
+ fprintf(stderr, "Unable to parse hex slide value in %s\n", argv[i]);
+ exit(1);
+ }
+ }
+ struct stat stbuf;
+ if (stat(filename.c_str(), &stbuf) == -1) {
+ fprintf(stderr, "Unable to stat '%s', exiting.\n", filename.c_str());
+ exit(1);
+ }
+ input_filenames.push_back(filename);
+ input_slides.push_back(slide);
+ input_filesizes.push_back(stbuf.st_size);
+ scan_binary(filename.c_str(), vmaddr, cputype, cpusubtype);
+ input_filevmaddrs.push_back(vmaddr + slide);
+ if (i == 2) {
+ main_binary_cputype = cputype;
+ }
+ }
+
+ const char *output_corefile_name = argv[1];
+ std::string empty_uuidstr = "00000000-0000-0000-0000-000000000000";
+
+ // First add all the load commands / payload so we can figure out how large
+ // the load commands will actually be.
+ load_commands.push_back(lc_thread_load_command(cputype));
+
+ add_lc_note_main_bin_spec_load_command(load_commands, payload, 0,
+ empty_uuidstr, 0, UINT64_MAX);
+ for (int i = 1; i < input_filenames.size(); i++) {
+ add_lc_note_load_binary_load_command(load_commands, payload, 0,
+ empty_uuidstr, 0, UINT64_MAX);
+ }
+
+ for (int i = 0; i < input_filenames.size(); i++) {
+ add_lc_segment(load_commands, payload, 0, 0, 0);
+ }
+
+ int size_of_load_commands = 0;
+ for (const auto &lc : load_commands)
+ size_of_load_commands += lc.size();
+
+ int size_of_header_and_load_cmds =
+ sizeof(struct mach_header_64) + size_of_load_commands;
+
+ // Erase the load commands / payload now that we know how much space is
+ // needed, redo it.
+ load_commands.clear();
+ payload.clear();
+
+ // Push the LC_THREAD load command.
+ load_commands.push_back(lc_thread_load_command(main_binary_cputype));
+
+ const off_t payload_offset = size_of_header_and_load_cmds;
+
+ add_lc_note_main_bin_spec_load_command(load_commands, payload, payload_offset,
+ empty_uuidstr, input_filevmaddrs[0],
+ UINT64_MAX);
+
+ for (int i = 1; i < input_filenames.size(); i++) {
+ add_lc_note_load_binary_load_command(load_commands, payload, payload_offset,
+ empty_uuidstr, input_filevmaddrs[i],
+ UINT64_MAX);
+ }
+
+ for (int i = 0; i < input_filenames.size(); i++) {
+ add_lc_segment(load_commands, payload, payload_offset, input_filevmaddrs[i],
+ input_filesizes[i]);
+
+ // Copy the contents of the binary into payload.
+ int fd = open(input_filenames[i].c_str(), O_RDONLY);
+ if (fd == -1) {
+ fprintf(stderr, "Unable to open %s for reading\n",
+ input_filenames[i].c_str());
+ exit(1);
+ }
+ std::vector<uint8_t> binary_contents;
+ for (int j = 0; j < input_filesizes[i]; j++) {
+ uint8_t byte;
+ read(fd, &byte, 1);
+ binary_contents.push_back(byte);
+ }
+ close(fd);
+
+ size_t cur_payload_size = payload.size();
+ payload.resize(cur_payload_size + binary_contents.size());
+ slide_macho_binary(binary_contents, input_slides[i]);
+ memcpy(payload.data() + cur_payload_size, binary_contents.data(),
+ binary_contents.size());
+ }
+
+ struct mach_header_64 mh;
+ mh.magic = MH_MAGIC_64;
+ mh.cputype = cputype;
+
+ mh.cpusubtype = cpusubtype;
+ mh.filetype = MH_CORE;
+ mh.ncmds = load_commands.size();
+ mh.sizeofcmds = size_of_load_commands;
+ mh.flags = 0;
+ mh.reserved = 0;
+
+ FILE *f = fopen(output_corefile_name, "w");
+
+ if (f == nullptr) {
+ fprintf(stderr, "Unable to open file %s for writing\n",
+ output_corefile_name);
+ exit(1);
+ }
+
+ fwrite(&mh, sizeof(mh), 1, f);
+
+ for (const auto &lc : load_commands)
+ fwrite(lc.data(), lc.size(), 1, f);
+
+ fwrite(payload.data(), payload.size(), 1, f);
+
+ fclose(f);
+}
diff --git a/lldb/test/API/macosx/lc-note/multiple-binary-corefile/main.c b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/main.c
new file mode 100644
index 0000000000000..eaab873b53e44
--- /dev/null
+++ b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/main.c
@@ -0,0 +1,7 @@
+#include <stdio.h>
+int one();
+int two();
+int main() {
+ puts("this is the standalone binary test program");
+ return one() + two();
+}
diff --git a/lldb/test/API/macosx/lc-note/multiple-binary-corefile/one.c b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/one.c
new file mode 100644
index 0000000000000..6e8fe4ad5ff75
--- /dev/null
+++ b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/one.c
@@ -0,0 +1 @@
+int one() { return 5; }
diff --git a/lldb/test/API/macosx/lc-note/multiple-binary-corefile/two.c b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/two.c
new file mode 100644
index 0000000000000..f44baa69c293a
--- /dev/null
+++ b/lldb/test/API/macosx/lc-note/multiple-binary-corefile/two.c
@@ -0,0 +1 @@
+int two() { return 10; }
More information about the lldb-commits
mailing list