diff options
Diffstat (limited to 'lldb/source/Core/Mangled.cpp')
| -rw-r--r-- | lldb/source/Core/Mangled.cpp | 438 | 
1 files changed, 438 insertions, 0 deletions
diff --git a/lldb/source/Core/Mangled.cpp b/lldb/source/Core/Mangled.cpp new file mode 100644 index 000000000000..b06656aa3fb7 --- /dev/null +++ b/lldb/source/Core/Mangled.cpp @@ -0,0 +1,438 @@ +//===-- Mangled.cpp ---------------------------------------------*- C++ -*-===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// + +#include "lldb/Core/Mangled.h" + +#include "lldb/Core/RichManglingContext.h" +#include "lldb/Utility/ConstString.h" +#include "lldb/Utility/Log.h" +#include "lldb/Utility/Logging.h" +#include "lldb/Utility/RegularExpression.h" +#include "lldb/Utility/Stream.h" +#include "lldb/Utility/Timer.h" +#include "lldb/lldb-enumerations.h" + +#include "Plugins/Language/CPlusPlus/CPlusPlusLanguage.h" +#include "Plugins/Language/ObjC/ObjCLanguage.h" + +#include "llvm/ADT/StringRef.h" +#include "llvm/Demangle/Demangle.h" +#include "llvm/Support/Compiler.h" + +#include <mutex> +#include <string> +#include <utility> + +#include <stdlib.h> +#include <string.h> +using namespace lldb_private; + +static inline Mangled::ManglingScheme cstring_mangling_scheme(const char *s) { +  if (s) { +    if (s[0] == '?') +      return Mangled::eManglingSchemeMSVC; +    if (s[0] == '_' && s[1] == 'Z') +      return Mangled::eManglingSchemeItanium; +  } +  return Mangled::eManglingSchemeNone; +} + +static inline bool cstring_is_mangled(const char *s) { +  return cstring_mangling_scheme(s) != Mangled::eManglingSchemeNone; +} + +static ConstString  +get_demangled_name_without_arguments(ConstString mangled, +                                     ConstString demangled) { +  // This pair is <mangled name, demangled name without function arguments> +  static std::pair<ConstString, ConstString> +      g_most_recent_mangled_to_name_sans_args; + +  // Need to have the mangled & demangled names we're currently examining as +  // statics so we can return a const ref to them at the end of the func if we +  // don't have anything better. +  static ConstString g_last_mangled; +  static ConstString g_last_demangled; + +  if (mangled && g_most_recent_mangled_to_name_sans_args.first == mangled) { +    return g_most_recent_mangled_to_name_sans_args.second; +  } + +  g_last_demangled = demangled; +  g_last_mangled = mangled; + +  const char *mangled_name_cstr = mangled.GetCString(); + +  if (demangled && mangled_name_cstr && mangled_name_cstr[0]) { +    if (mangled_name_cstr[0] == '_' && mangled_name_cstr[1] == 'Z' && +        (mangled_name_cstr[2] != 'T' && // avoid virtual table, VTT structure, +                                        // typeinfo structure, and typeinfo +                                        // mangled_name +         mangled_name_cstr[2] != 'G' && // avoid guard variables +         mangled_name_cstr[2] != 'Z')) // named local entities (if we eventually +                                       // handle eSymbolTypeData, we will want +                                       // this back) +    { +      CPlusPlusLanguage::MethodName cxx_method(demangled); +      if (!cxx_method.GetBasename().empty()) { +        std::string shortname; +        if (!cxx_method.GetContext().empty()) +          shortname = cxx_method.GetContext().str() + "::"; +        shortname += cxx_method.GetBasename().str(); +        ConstString result(shortname.c_str()); +        g_most_recent_mangled_to_name_sans_args.first = mangled; +        g_most_recent_mangled_to_name_sans_args.second = result; +        return g_most_recent_mangled_to_name_sans_args.second; +      } +    } +  } + +  if (demangled) +    return g_last_demangled; +  return g_last_mangled; +} + +#pragma mark Mangled + +Mangled::Mangled(ConstString s) : m_mangled(), m_demangled() { +  if (s) +    SetValue(s); +} + +Mangled::Mangled(llvm::StringRef name) { +  if (!name.empty()) +    SetValue(ConstString(name)); +} + +// Convert to pointer operator. This allows code to check any Mangled objects +// to see if they contain anything valid using code such as: +// +//  Mangled mangled(...); +//  if (mangled) +//  { ... +Mangled::operator void *() const { +  return (m_mangled) ? const_cast<Mangled *>(this) : nullptr; +} + +// Logical NOT operator. This allows code to check any Mangled objects to see +// if they are invalid using code such as: +// +//  Mangled mangled(...); +//  if (!file_spec) +//  { ... +bool Mangled::operator!() const { return !m_mangled; } + +// Clear the mangled and demangled values. +void Mangled::Clear() { +  m_mangled.Clear(); +  m_demangled.Clear(); +} + +// Compare the string values. +int Mangled::Compare(const Mangled &a, const Mangled &b) { +  return ConstString::Compare( +      a.GetName(lldb::eLanguageTypeUnknown, ePreferMangled), +      b.GetName(lldb::eLanguageTypeUnknown, ePreferMangled)); +} + +// Set the string value in this objects. If "mangled" is true, then the mangled +// named is set with the new value in "s", else the demangled name is set. +void Mangled::SetValue(ConstString s, bool mangled) { +  if (s) { +    if (mangled) { +      m_demangled.Clear(); +      m_mangled = s; +    } else { +      m_demangled = s; +      m_mangled.Clear(); +    } +  } else { +    m_demangled.Clear(); +    m_mangled.Clear(); +  } +} + +void Mangled::SetValue(ConstString name) { +  if (name) { +    if (cstring_is_mangled(name.GetCString())) { +      m_demangled.Clear(); +      m_mangled = name; +    } else { +      m_demangled = name; +      m_mangled.Clear(); +    } +  } else { +    m_demangled.Clear(); +    m_mangled.Clear(); +  } +} + +// Local helpers for different demangling implementations. +static char *GetMSVCDemangledStr(const char *M) { +  char *demangled_cstr = llvm::microsoftDemangle( +      M, nullptr, nullptr, nullptr, +      llvm::MSDemangleFlags(llvm::MSDF_NoAccessSpecifier | +                            llvm::MSDF_NoCallingConvention | +                            llvm::MSDF_NoMemberType)); + +  if (Log *log = lldb_private::GetLogIfAllCategoriesSet(LIBLLDB_LOG_DEMANGLE)) { +    if (demangled_cstr && demangled_cstr[0]) +      LLDB_LOGF(log, "demangled msvc: %s -> \"%s\"", M, demangled_cstr); +    else +      LLDB_LOGF(log, "demangled msvc: %s -> error", M); +  } + +  return demangled_cstr; +} + +static char *GetItaniumDemangledStr(const char *M) { +  char *demangled_cstr = nullptr; + +  llvm::ItaniumPartialDemangler ipd; +  bool err = ipd.partialDemangle(M); +  if (!err) { +    // Default buffer and size (will realloc in case it's too small). +    size_t demangled_size = 80; +    demangled_cstr = static_cast<char *>(std::malloc(demangled_size)); +    demangled_cstr = ipd.finishDemangle(demangled_cstr, &demangled_size); + +    assert(demangled_cstr && +           "finishDemangle must always succeed if partialDemangle did"); +    assert(demangled_cstr[demangled_size - 1] == '\0' && +           "Expected demangled_size to return length including trailing null"); +  } + +  if (Log *log = lldb_private::GetLogIfAllCategoriesSet(LIBLLDB_LOG_DEMANGLE)) { +    if (demangled_cstr) +      LLDB_LOGF(log, "demangled itanium: %s -> \"%s\"", M, demangled_cstr); +    else +      LLDB_LOGF(log, "demangled itanium: %s -> error: failed to demangle", M); +  } + +  return demangled_cstr; +} + +// Explicit demangling for scheduled requests during batch processing. This +// makes use of ItaniumPartialDemangler's rich demangle info +bool Mangled::DemangleWithRichManglingInfo( +    RichManglingContext &context, SkipMangledNameFn *skip_mangled_name) { +  // We need to generate and cache the demangled name. +  static Timer::Category func_cat(LLVM_PRETTY_FUNCTION); +  Timer scoped_timer(func_cat, +                     "Mangled::DemangleWithRichNameIndexInfo (m_mangled = %s)", +                     m_mangled.GetCString()); + +  // Others are not meant to arrive here. ObjC names or C's main() for example +  // have their names stored in m_demangled, while m_mangled is empty. +  assert(m_mangled); + +  // Check whether or not we are interested in this name at all. +  ManglingScheme scheme = cstring_mangling_scheme(m_mangled.GetCString()); +  if (skip_mangled_name && skip_mangled_name(m_mangled.GetStringRef(), scheme)) +    return false; + +  switch (scheme) { +  case eManglingSchemeNone: +    // The current mangled_name_filter would allow llvm_unreachable here. +    return false; + +  case eManglingSchemeItanium: +    // We want the rich mangling info here, so we don't care whether or not +    // there is a demangled string in the pool already. +    if (context.FromItaniumName(m_mangled)) { +      // If we got an info, we have a name. Copy to string pool and connect the +      // counterparts to accelerate later access in GetDemangledName(). +      context.ParseFullName(); +      m_demangled.SetStringWithMangledCounterpart(context.GetBufferRef(), +                                                  m_mangled); +      return true; +    } else { +      m_demangled.SetCString(""); +      return false; +    } + +  case eManglingSchemeMSVC: { +    // We have no rich mangling for MSVC-mangled names yet, so first try to +    // demangle it if necessary. +    if (!m_demangled && !m_mangled.GetMangledCounterpart(m_demangled)) { +      if (char *d = GetMSVCDemangledStr(m_mangled.GetCString())) { +        // If we got an info, we have a name. Copy to string pool and connect +        // the counterparts to accelerate later access in GetDemangledName(). +        m_demangled.SetStringWithMangledCounterpart(llvm::StringRef(d), +                                                    m_mangled); +        ::free(d); +      } else { +        m_demangled.SetCString(""); +      } +    } + +    if (m_demangled.IsEmpty()) { +      // Cannot demangle it, so don't try parsing. +      return false; +    } else { +      // Demangled successfully, we can try and parse it with +      // CPlusPlusLanguage::MethodName. +      return context.FromCxxMethodName(m_demangled); +    } +  } +  } +  llvm_unreachable("Fully covered switch above!"); +} + +// Generate the demangled name on demand using this accessor. Code in this +// class will need to use this accessor if it wishes to decode the demangled +// name. The result is cached and will be kept until a new string value is +// supplied to this object, or until the end of the object's lifetime. +ConstString  +Mangled::GetDemangledName(lldb::LanguageType language) const { +  // Check to make sure we have a valid mangled name and that we haven't +  // already decoded our mangled name. +  if (m_mangled && m_demangled.IsNull()) { +    // We need to generate and cache the demangled name. +    static Timer::Category func_cat(LLVM_PRETTY_FUNCTION); +    Timer scoped_timer(func_cat, "Mangled::GetDemangledName (m_mangled = %s)", +                       m_mangled.GetCString()); + +    // Don't bother running anything that isn't mangled +    const char *mangled_name = m_mangled.GetCString(); +    ManglingScheme mangling_scheme{cstring_mangling_scheme(mangled_name)}; +    if (mangling_scheme != eManglingSchemeNone && +        !m_mangled.GetMangledCounterpart(m_demangled)) { +      // We didn't already mangle this name, demangle it and if all goes well +      // add it to our map. +      char *demangled_name = nullptr; +      switch (mangling_scheme) { +      case eManglingSchemeMSVC: +        demangled_name = GetMSVCDemangledStr(mangled_name); +        break; +      case eManglingSchemeItanium: { +        demangled_name = GetItaniumDemangledStr(mangled_name); +        break; +      } +      case eManglingSchemeNone: +        llvm_unreachable("eManglingSchemeNone was handled already"); +      } +      if (demangled_name) { +        m_demangled.SetStringWithMangledCounterpart( +            llvm::StringRef(demangled_name), m_mangled); +        free(demangled_name); +      } +    } +    if (m_demangled.IsNull()) { +      // Set the demangled string to the empty string to indicate we tried to +      // parse it once and failed. +      m_demangled.SetCString(""); +    } +  } + +  return m_demangled; +} + +ConstString +Mangled::GetDisplayDemangledName(lldb::LanguageType language) const { +  return GetDemangledName(language); +} + +bool Mangled::NameMatches(const RegularExpression ®ex, +                          lldb::LanguageType language) const { +  if (m_mangled && regex.Execute(m_mangled.AsCString())) +    return true; + +  ConstString demangled = GetDemangledName(language); +  return demangled && regex.Execute(demangled.AsCString()); +} + +// Get the demangled name if there is one, else return the mangled name. +ConstString Mangled::GetName(lldb::LanguageType language, +                             Mangled::NamePreference preference) const { +  if (preference == ePreferMangled && m_mangled) +    return m_mangled; + +  ConstString demangled = GetDemangledName(language); + +  if (preference == ePreferDemangledWithoutArguments) { +    return get_demangled_name_without_arguments(m_mangled, demangled); +  } +  if (preference == ePreferDemangled) { +    // Call the accessor to make sure we get a demangled name in case it hasn't +    // been demangled yet... +    if (demangled) +      return demangled; +    return m_mangled; +  } +  return demangled; +} + +// Dump a Mangled object to stream "s". We don't force our demangled name to be +// computed currently (we don't use the accessor). +void Mangled::Dump(Stream *s) const { +  if (m_mangled) { +    *s << ", mangled = " << m_mangled; +  } +  if (m_demangled) { +    const char *demangled = m_demangled.AsCString(); +    s->Printf(", demangled = %s", demangled[0] ? demangled : "<error>"); +  } +} + +// Dumps a debug version of this string with extra object and state information +// to stream "s". +void Mangled::DumpDebug(Stream *s) const { +  s->Printf("%*p: Mangled mangled = ", static_cast<int>(sizeof(void *) * 2), +            static_cast<const void *>(this)); +  m_mangled.DumpDebug(s); +  s->Printf(", demangled = "); +  m_demangled.DumpDebug(s); +} + +// Return the size in byte that this object takes in memory. The size includes +// the size of the objects it owns, and not the strings that it references +// because they are shared strings. +size_t Mangled::MemorySize() const { +  return m_mangled.MemorySize() + m_demangled.MemorySize(); +} + +// We "guess" the language because we can't determine a symbol's language from +// it's name.  For example, a Pascal symbol can be mangled using the C++ +// Itanium scheme, and defined in a compilation unit within the same module as +// other C++ units.  In addition, different targets could have different ways +// of mangling names from a given language, likewise the compilation units +// within those targets. +lldb::LanguageType Mangled::GuessLanguage() const { +  ConstString mangled = GetMangledName(); +  if (mangled) { +    const char *mangled_name = mangled.GetCString(); +    if (CPlusPlusLanguage::IsCPPMangledName(mangled_name)) +      return lldb::eLanguageTypeC_plus_plus; +    else if (ObjCLanguage::IsPossibleObjCMethodName(mangled_name)) +      return lldb::eLanguageTypeObjC; +  } else { +    // ObjC names aren't really mangled, so they won't necessarily be in the +    // mangled name slot. +    ConstString demangled_name = GetDemangledName(lldb::eLanguageTypeUnknown); +    if (demangled_name  +        && ObjCLanguage::IsPossibleObjCMethodName(demangled_name.GetCString())) +      return lldb::eLanguageTypeObjC; +   +  } +  return lldb::eLanguageTypeUnknown; +} + +// Dump OBJ to the supplied stream S. +Stream &operator<<(Stream &s, const Mangled &obj) { +  if (obj.GetMangledName()) +    s << "mangled = '" << obj.GetMangledName() << "'"; + +  ConstString demangled = +      obj.GetDemangledName(lldb::eLanguageTypeUnknown); +  if (demangled) +    s << ", demangled = '" << demangled << '\''; +  else +    s << ", demangled = <error>"; +  return s; +}  | 
