[Lldb-commits] [lldb] [LLDB] FindLibCppStdFunctionCallableInfo improvements (PR #111892)

David Mentler via lldb-commits lldb-commits at lists.llvm.org
Thu Oct 10 14:11:26 PDT 2024


https://github.com/mentlerd updated https://github.com/llvm/llvm-project/pull/111892

>From b1e6178b1130135262884d99262716fcc0ada86e Mon Sep 17 00:00:00 2001
From: David Mentler <david.mentler at shapr3d.com>
Date: Mon, 7 Oct 2024 21:46:50 +0200
Subject: [PATCH 1/5] Make existing tests break

---
 .../data-formatter-stl/libcxx/function/main.cpp            | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/lldb/test/API/functionalities/data-formatter/data-formatter-stl/libcxx/function/main.cpp b/lldb/test/API/functionalities/data-formatter/data-formatter-stl/libcxx/function/main.cpp
index ef7c97470652fc..b17aba3fbbc70e 100644
--- a/lldb/test/API/functionalities/data-formatter/data-formatter-stl/libcxx/function/main.cpp
+++ b/lldb/test/API/functionalities/data-formatter/data-formatter-stl/libcxx/function/main.cpp
@@ -1,5 +1,10 @@
 #include <functional>
 
+template<typename = bool, typename = int>
+struct Dummy {
+  // Used to make lambda host function's symbol more complex
+};
+
 int foo(int x, int y) {
   return x + y - 1;
 }
@@ -18,7 +23,7 @@ struct Bar {
    }
 } ;
 
-int foo2() {
+int foo2(Dummy<> dummy = {}) {
    auto f = [](int x) {
        return x+1;
    };

>From d976756f47781d58c0367835a56b5b8e9130191b Mon Sep 17 00:00:00 2001
From: David Mentler <david.mentler at shapr3d.com>
Date: Wed, 9 Oct 2024 20:40:03 +0200
Subject: [PATCH 2/5] Expose conversion from DeclContext to Decl

---
 lldb/include/lldb/Symbol/CompilerDeclContext.h           | 2 ++
 lldb/include/lldb/Symbol/TypeSystem.h                    | 4 ++++
 lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.cpp | 7 +++++++
 lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.h   | 2 ++
 lldb/source/Symbol/CompilerDeclContext.cpp               | 6 ++++++
 5 files changed, 21 insertions(+)

diff --git a/lldb/include/lldb/Symbol/CompilerDeclContext.h b/lldb/include/lldb/Symbol/CompilerDeclContext.h
index 89b4a9787688bc..3954ddd8e52087 100644
--- a/lldb/include/lldb/Symbol/CompilerDeclContext.h
+++ b/lldb/include/lldb/Symbol/CompilerDeclContext.h
@@ -110,6 +110,8 @@ class CompilerDeclContext {
 
   ConstString GetScopeQualifiedName() const;
 
+  CompilerDecl GetDecl() const;
+
 private:
   TypeSystem *m_type_system = nullptr;
   void *m_opaque_decl_ctx = nullptr;
diff --git a/lldb/include/lldb/Symbol/TypeSystem.h b/lldb/include/lldb/Symbol/TypeSystem.h
index 7d48f9b316138c..4b531a83dd5fbb 100644
--- a/lldb/include/lldb/Symbol/TypeSystem.h
+++ b/lldb/include/lldb/Symbol/TypeSystem.h
@@ -134,6 +134,10 @@ class TypeSystem : public PluginInterface,
 
   virtual lldb::LanguageType DeclContextGetLanguage(void *opaque_decl_ctx) = 0;
 
+  virtual CompilerDecl DeclContextGetDecl(void *opaque_decl_ctx) {
+    return CompilerDecl();
+  }
+ 
   /// Returns the direct parent context of specified type
   virtual CompilerDeclContext
   GetCompilerDeclContextForType(const CompilerType &type);
diff --git a/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.cpp b/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.cpp
index fe0c53a7e9a3ea..678ac8d65331b7 100644
--- a/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.cpp
+++ b/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.cpp
@@ -9595,6 +9595,13 @@ TypeSystemClang::DeclContextGetLanguage(void *opaque_decl_ctx) {
   return eLanguageTypeUnknown;
 }
 
+CompilerDecl TypeSystemClang::DeclContextGetDecl(void *opaque_decl_ctx) {
+  if (auto *decl_ctx = (clang::DeclContext *)opaque_decl_ctx)
+    if (auto* decl = dyn_cast_or_null<clang::Decl>(decl_ctx))
+      return CompilerDecl(this, decl);
+  return CompilerDecl();
+}
+
 static bool IsClangDeclContext(const CompilerDeclContext &dc) {
   return dc.IsValid() && isa<TypeSystemClang>(dc.GetTypeSystem());
 }
diff --git a/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.h b/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.h
index e39aedec7e3902..e7ac6e320f20b7 100644
--- a/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.h
+++ b/lldb/source/Plugins/TypeSystem/Clang/TypeSystemClang.h
@@ -595,6 +595,8 @@ class TypeSystemClang : public TypeSystem {
 
   lldb::LanguageType DeclContextGetLanguage(void *opaque_decl_ctx) override;
 
+  CompilerDecl DeclContextGetDecl(void *opaque_decl_ctx) override;
+
   std::vector<lldb_private::CompilerContext>
   DeclContextGetCompilerContext(void *opaque_decl_ctx) override;
 
diff --git a/lldb/source/Symbol/CompilerDeclContext.cpp b/lldb/source/Symbol/CompilerDeclContext.cpp
index b40a08e9b1953d..7a72c4301b0b5c 100644
--- a/lldb/source/Symbol/CompilerDeclContext.cpp
+++ b/lldb/source/Symbol/CompilerDeclContext.cpp
@@ -34,6 +34,12 @@ ConstString CompilerDeclContext::GetScopeQualifiedName() const {
   return ConstString();
 }
 
+CompilerDecl CompilerDeclContext::GetDecl() const {
+  if (IsValid())
+    return m_type_system->DeclContextGetDecl(m_opaque_decl_ctx);
+  return CompilerDecl();
+}
+
 bool CompilerDeclContext::IsClassMethod() {
   if (IsValid())
     return m_type_system->DeclContextIsClassMethod(m_opaque_decl_ctx);

>From 2e75bb0aac608d626fba5878315e9118bfcf9c8a Mon Sep 17 00:00:00 2001
From: David Mentler <david.mentler at shapr3d.com>
Date: Wed, 9 Oct 2024 20:41:04 +0200
Subject: [PATCH 3/5] IsPolymorphicClass already checks for record types and
 handles pointers to typenames

---
 .../CPlusPlus/ItaniumABI/ItaniumABILanguageRuntime.cpp    | 8 --------
 1 file changed, 8 deletions(-)

diff --git a/lldb/source/Plugins/LanguageRuntime/CPlusPlus/ItaniumABI/ItaniumABILanguageRuntime.cpp b/lldb/source/Plugins/LanguageRuntime/CPlusPlus/ItaniumABI/ItaniumABILanguageRuntime.cpp
index 4c547afe30fe81..4ac1e565cb2619 100644
--- a/lldb/source/Plugins/LanguageRuntime/CPlusPlus/ItaniumABI/ItaniumABILanguageRuntime.cpp
+++ b/lldb/source/Plugins/LanguageRuntime/CPlusPlus/ItaniumABI/ItaniumABILanguageRuntime.cpp
@@ -191,14 +191,6 @@ llvm::Error ItaniumABILanguageRuntime::TypeHasVTable(CompilerType type) {
       type = pointee_type;
   }
 
-  // Make sure this is a class or a struct first by checking the type class
-  // bitfield that gets returned.
-  if ((type.GetTypeClass() & (eTypeClassStruct | eTypeClassClass)) == 0) {
-    return llvm::createStringError(std::errc::invalid_argument,
-        "type \"%s\" is not a class or struct or a pointer to one",
-        original_type.GetTypeName().AsCString("<invalid>"));
-  }
-
   // Check if the type has virtual functions by asking it if it is polymorphic.
   if (!type.IsPolymorphicClass()) {
     return llvm::createStringError(std::errc::invalid_argument,

>From 248be8c68221edc03ee0691b3b2c83eda0789324 Mon Sep 17 00:00:00 2001
From: David Mentler <david.mentler at shapr3d.com>
Date: Wed, 9 Oct 2024 22:23:48 +0200
Subject: [PATCH 4/5] Digging for wrapped callable works

---
 .../CPlusPlus/CPPLanguageRuntime.cpp          | 132 +++++++++++++++++-
 1 file changed, 131 insertions(+), 1 deletion(-)

diff --git a/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp b/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp
index faa05e8f834ea1..7167cd4dc75f90 100644
--- a/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp
+++ b/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp
@@ -174,6 +174,137 @@ CPPLanguageRuntime::FindLibCppStdFunctionCallableInfo(
   if (!valobj_sp)
     return optional_info;
 
+  // std::function has many variants, try to disambiguate
+  ValueObjectSP func_as_base_ptr;
+  {
+    ValueObjectSP outer_f = valobj_sp->GetChildMemberWithName("__f_");
+    
+    if (!outer_f)
+      return optional_info; // Unrecognized implementation
+    
+    if (outer_f->IsPointerType()) {
+      // git: 3e519524c118651123eecf60c2bbc5d65ad9bac3
+      //
+      // class function<_Rp()> {
+      //   aligned_storage<3*sizeof(void*)>::type __buf_;
+      //   __base<_Rp>* __f_;
+      // }
+      
+      func_as_base_ptr = std::move(outer_f);
+    } else if (auto inner_f = outer_f->GetChildMemberWithName("__f_")) {
+      // git: 050b064f15ee56ee0b42c9b957a3dd0f32532394
+      //
+      // class function<_Rp(_ArgTypes...)> {
+      //   __value_func<_Rp(_ArgTypes...)> __f_;
+      // }
+      //
+      // class __value_func<_Rp(_ArgTypes...)> {
+      //   aligned_storage<3 * sizeof(void*)>::type __buf_;
+      //   __base<_Rp(_ArgTypes...)>* __f_;
+      // }
+      
+      func_as_base_ptr = std::move(inner_f);
+    } else
+      return optional_info; // Unrecognized implementation
+  }
+  
+  // __base<...> is a pure virtual class with an interface to create/copy/destroy/invoke
+  // the underlying value. This interface is implemented by partial specializations of the
+  // __func<_Fp, _Alloc, ...> template where _Fp is the wrapped functor object
+  Status status;
+  ValueObjectSP func_as_base = func_as_base_ptr->Dereference(status);
+  if (status.Fail())
+    return optional_info;
+  
+  // First we'll try to extract the __func<...> template instantiation's type by looking up
+  // the declarations of the member function pointers in it's vtable
+  CompilerType func_type;
+  {
+    ValueObjectSP vtable = func_as_base->GetVTable();
+
+    llvm::Expected<uint32_t> num_entries = vtable->GetNumChildren();
+    if (num_entries.takeError())
+      return optional_info;
+    
+    // __base is pure virtual, __func is final. All member function pointers are equally
+    // good candidates to find the enclosing class.
+    //
+    // In practice the first two vtable entries point to artificial destructors which the
+    // type system refuses to elaborate as their artificial specifications are not added
+    // to the enclosing class' declaration context. This causes various warnings, and dont
+    // get us any closer to the concrete type thus we skip them.
+    for (uint32_t idx = 2; idx < *num_entries; idx++) {
+      ValueObjectSP entry = vtable->GetChildAtIndex(idx);
+      
+      // Points to a potentially interesting member function
+      addr_t mfunc_load_addr = entry->GetValueAsUnsigned(0);
+      if (!mfunc_load_addr)
+        continue;
+      
+      Address mfunc_symbol_addr;
+      if (!valobj_sp->GetTargetSP()->ResolveLoadAddress(mfunc_load_addr, mfunc_symbol_addr))
+        continue;
+      
+      Function* func = mfunc_symbol_addr.CalculateSymbolContextFunction();
+      if (!func)
+        continue;
+      
+      CompilerDeclContext mfunc_decl_ctx = func->GetDeclContext();
+      if (!mfunc_decl_ctx.IsClassMethod())
+        continue;
+      
+      // Member functions are contained in their enclosing class' decl context
+      CompilerDeclContext mfunc_parent = mfunc_decl_ctx.GetDecl().GetDeclContext();
+      if (!mfunc_parent.IsValid())
+        continue;
+      
+      func_type = mfunc_parent.GetDecl().GetType();
+      break;
+    }
+  }
+  
+  // Regardless of what std::function wraps we are looking for the load address of a function to call
+  std::optional<addr_t> target_func_load_addr;
+
+  if (CompilerType callable_type = func_type.GetTypeTemplateArgument(0)) {
+    if (callable_type.IsFunctionPointerType() || callable_type.IsMemberFunctionPointerType()) {
+      // TODO: The previous implementation just does raw pointer arithmetic and reads
+      // 'a pointer' to a function right after the vtable.
+      //
+      // What is the preferred approach? Go digging for the compressed_pair.first in __func
+      // or assume layout citing ABI compatibility requirements?
+    } else if (callable_type.IsRecordType()) {
+      // Target is a lambda, or a generic callable. Search for a single operator() overload
+      std::optional<ConstString> mangled_func_name;
+      
+      for (uint32_t idx = 0; idx < callable_type.GetNumMemberFunctions(); idx++) {
+        TypeMemberFunctionImpl mfunc = callable_type.GetMemberFunctionAtIndex(idx);
+        
+        if (mfunc.GetKind() != eMemberFunctionKindInstanceMethod)
+          continue;
+        
+        if (mfunc.GetName() != "operator()")
+          continue;
+          
+        if (mangled_func_name)
+          return optional_info; // Cannot resolve ambiguous target
+        
+        mangled_func_name = mfunc.GetMangledName();
+      }
+      
+      // TODO: The SymbolFile did a bunch of work to reconstruct `callable_type`,
+      // including it's member functions. Surely it knows there they are loaded?
+    }
+  } else {
+    // TODO: What if we don't have debug info for callable_type? Do we fallback to
+    // treating the std::function as wrapping a function/member function pointer
+    // due to lack of options, or give up to avoid guessing wrong?
+  }
+  
+  if (!target_func_load_addr)
+    return optional_info;
+    
+  
   // Member __f_ has type __base*, the contents of which will hold:
   // 1) a vtable entry which may hold type information needed to discover the
   //    lambda being called
@@ -232,7 +363,6 @@ CPPLanguageRuntime::FindLibCppStdFunctionCallableInfo(
     return optional_info;
 
   uint32_t address_size = process->GetAddressByteSize();
-  Status status;
 
   // First item pointed to by __f_ should be the pointer to the vtable for
   // a __base object.

>From e7612f5c6417ababebfb7509d1dba697f07250db Mon Sep 17 00:00:00 2001
From: David Mentler <david.mentler at shapr3d.com>
Date: Thu, 10 Oct 2024 23:08:01 +0200
Subject: [PATCH 5/5] RecordType callable identification works, more questions

---
 .../CPlusPlus/CPPLanguageRuntime.cpp          | 113 ++++++++++++------
 1 file changed, 76 insertions(+), 37 deletions(-)

diff --git a/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp b/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp
index 7167cd4dc75f90..a3c719528e4e4b 100644
--- a/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp
+++ b/lldb/source/Plugins/LanguageRuntime/CPlusPlus/CPPLanguageRuntime.cpp
@@ -219,6 +219,7 @@ CPPLanguageRuntime::FindLibCppStdFunctionCallableInfo(
   // First we'll try to extract the __func<...> template instantiation's type by looking up
   // the declarations of the member function pointers in it's vtable
   CompilerType func_type;
+  Address func_method_addr;
   {
     ValueObjectSP vtable = func_as_base->GetVTable();
 
@@ -241,11 +242,10 @@ CPPLanguageRuntime::FindLibCppStdFunctionCallableInfo(
       if (!mfunc_load_addr)
         continue;
       
-      Address mfunc_symbol_addr;
-      if (!valobj_sp->GetTargetSP()->ResolveLoadAddress(mfunc_load_addr, mfunc_symbol_addr))
+      if (!valobj_sp->GetTargetSP()->ResolveLoadAddress(mfunc_load_addr, func_method_addr))
         continue;
       
-      Function* func = mfunc_symbol_addr.CalculateSymbolContextFunction();
+      Function* func = func_method_addr.CalculateSymbolContextFunction();
       if (!func)
         continue;
       
@@ -263,47 +263,86 @@ CPPLanguageRuntime::FindLibCppStdFunctionCallableInfo(
     }
   }
   
-  // Regardless of what std::function wraps we are looking for the load address of a function to call
-  std::optional<addr_t> target_func_load_addr;
-
-  if (CompilerType callable_type = func_type.GetTypeTemplateArgument(0)) {
-    if (callable_type.IsFunctionPointerType() || callable_type.IsMemberFunctionPointerType()) {
-      // TODO: The previous implementation just does raw pointer arithmetic and reads
-      // 'a pointer' to a function right after the vtable.
-      //
-      // What is the preferred approach? Go digging for the compressed_pair.first in __func
-      // or assume layout citing ABI compatibility requirements?
-    } else if (callable_type.IsRecordType()) {
-      // Target is a lambda, or a generic callable. Search for a single operator() overload
-      std::optional<ConstString> mangled_func_name;
+  CompilerType callable_type = func_type.GetTypeTemplateArgument(0);
+  if (!callable_type)
+    return optional_info;
+  
+  if (callable_type.IsFunctionPointerType() || callable_type.IsMemberFunctionPointerType()) {
+    // TODO: The previous implementation just does raw pointer arithmetic and reads
+    // 'a pointer' to a function right after the vtable.
+    //
+    // What is the preferred approach? Go digging for the compressed_pair.first in __func
+    // or assume layout citing ABI compatibility requirements?
+  } else if (callable_type.IsRecordType()) {
+    // Target is a lambda, or a generic callable. Search for a single operator() overload
+    std::optional<ConstString> mangled_func_name;
+    
+    // TODO: I am still not sure whether it is a good idea to reconstruct the full type
+    // here.. it seems there are handy FindFunctions that could perhaps to a good job
+    // at locating candidates. However even when limiting the search to the decl_ctx of
+    // the class the code seems to iterate over way more DIEs than I expected. What to do?
+    
+    // TODO: Because we have access to the type we know a _lot_ about callable_type, we
+    // could even extract a ValueObjectSP to it if we wanted. It would be cool to make
+    // std::function have a synt children provider showing the wrapped lambda/callable!
+    
+    for (uint32_t idx = 0; idx < callable_type.GetNumMemberFunctions(); idx++) {
+      TypeMemberFunctionImpl mfunc = callable_type.GetMemberFunctionAtIndex(idx);
       
-      for (uint32_t idx = 0; idx < callable_type.GetNumMemberFunctions(); idx++) {
-        TypeMemberFunctionImpl mfunc = callable_type.GetMemberFunctionAtIndex(idx);
-        
-        if (mfunc.GetKind() != eMemberFunctionKindInstanceMethod)
-          continue;
-        
-        if (mfunc.GetName() != "operator()")
-          continue;
-          
-        if (mangled_func_name)
-          return optional_info; // Cannot resolve ambiguous target
+      if (mfunc.GetKind() != eMemberFunctionKindInstanceMethod)
+        continue;
+      
+      if (mfunc.GetName() != "operator()")
+        continue;
         
-        mangled_func_name = mfunc.GetMangledName();
-      }
+      if (mangled_func_name)
+        return optional_info; // Cannot resolve ambiguous target
+      
+      mangled_func_name = mfunc.GetMangledName();
+    }
+    
+    // Locate the symbol context corresponding to the target function
+    SymbolContext sc;
+    {
+      // We'll assume that callable_type is in the same module as the vtable
+      ModuleSP mod = func_method_addr.CalculateSymbolContextModule();
+    
+      // Limit our lookup to callable_type
+      CompilerDeclContext decl_ctx = callable_type.GetTypeSystem()->GetCompilerDeclContextForType(callable_type);
       
-      // TODO: The SymbolFile did a bunch of work to reconstruct `callable_type`,
-      // including it's member functions. Surely it knows there they are loaded?
+      SymbolContextList list;
+      mod->FindFunctions(*mangled_func_name, decl_ctx, eFunctionNameTypeFull, {}, list);
+      
+      if (list.GetSize() != 1)
+        return optional_info;
+      
+      list.GetContextAtIndex(0, sc);
     }
-  } else {
-    // TODO: What if we don't have debug info for callable_type? Do we fallback to
-    // treating the std::function as wrapping a function/member function pointer
-    // due to lack of options, or give up to avoid guessing wrong?
+    
+    // TODO: This feels a bit clunky, I am probably misusing the API? FindFunctions returns me
+    // SymbolContexts with the .function set but not .symbol ... At first glance it seemed like
+    // if we know the function there must be a symbol too!
+    if (!sc.function)
+      return optional_info;
+    
+    Symbol* symbol = sc.function->GetAddressRange().GetBaseAddress().CalculateSymbolContextSymbol();
+    if (!symbol)
+      return optional_info;
+    
+    return LibCppStdFunctionCallableInfo {
+      .callable_symbol = *symbol,
+      .callable_address = symbol->GetAddress(),
+      .callable_line_entry = sc.GetFunctionStartLineEntry(),
+      
+      // TODO: Can't tell lambdas apart from generic callables.. do we really need to?
+      // Is it important to have the correct qualification in the summary?
+      .callable_case = LibCppStdFunctionCallableCase::Lambda
+    };
   }
   
-  if (!target_func_load_addr)
+  // Unrecognized callable type - skip the original implementation for now
+  if (!callable_type.IsVoidType())
     return optional_info;
-    
   
   // Member __f_ has type __base*, the contents of which will hold:
   // 1) a vtable entry which may hold type information needed to discover the



More information about the lldb-commits mailing list