diff options
Diffstat (limited to 'lib/ObjectYAML/MinidumpEmitter.cpp')
| -rw-r--r-- | lib/ObjectYAML/MinidumpEmitter.cpp | 247 | 
1 files changed, 247 insertions, 0 deletions
| diff --git a/lib/ObjectYAML/MinidumpEmitter.cpp b/lib/ObjectYAML/MinidumpEmitter.cpp new file mode 100644 index 000000000000..bbfd2cd8cbab --- /dev/null +++ b/lib/ObjectYAML/MinidumpEmitter.cpp @@ -0,0 +1,247 @@ +//===- yaml2minidump.cpp - Convert a YAML file to a minidump file ---------===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// + +#include "llvm/ObjectYAML/MinidumpYAML.h" +#include "llvm/ObjectYAML/yaml2obj.h" +#include "llvm/Support/ConvertUTF.h" +#include "llvm/Support/raw_ostream.h" + +using namespace llvm; +using namespace llvm::minidump; +using namespace llvm::MinidumpYAML; + +namespace { +/// A helper class to manage the placement of various structures into the final +/// minidump binary. Space for objects can be allocated via various allocate*** +/// methods, while the final minidump file is written by calling the writeTo +/// method. The plain versions of allocation functions take a reference to the +/// data which is to be written (and hence the data must be available until +/// writeTo is called), while the "New" versions allocate the data in an +/// allocator-managed buffer, which is available until the allocator object is +/// destroyed. For both kinds of functions, it is possible to modify the +/// data for which the space has been "allocated" until the final writeTo call. +/// This is useful for "linking" the allocated structures via their offsets. +class BlobAllocator { +public: +  size_t tell() const { return NextOffset; } + +  size_t allocateCallback(size_t Size, +                          std::function<void(raw_ostream &)> Callback) { +    size_t Offset = NextOffset; +    NextOffset += Size; +    Callbacks.push_back(std::move(Callback)); +    return Offset; +  } + +  size_t allocateBytes(ArrayRef<uint8_t> Data) { +    return allocateCallback( +        Data.size(), [Data](raw_ostream &OS) { OS << toStringRef(Data); }); +  } + +  size_t allocateBytes(yaml::BinaryRef Data) { +    return allocateCallback(Data.binary_size(), [Data](raw_ostream &OS) { +      Data.writeAsBinary(OS); +    }); +  } + +  template <typename T> size_t allocateArray(ArrayRef<T> Data) { +    return allocateBytes({reinterpret_cast<const uint8_t *>(Data.data()), +                          sizeof(T) * Data.size()}); +  } + +  template <typename T, typename RangeType> +  std::pair<size_t, MutableArrayRef<T>> +  allocateNewArray(const iterator_range<RangeType> &Range); + +  template <typename T> size_t allocateObject(const T &Data) { +    return allocateArray(makeArrayRef(Data)); +  } + +  template <typename T, typename... Types> +  std::pair<size_t, T *> allocateNewObject(Types &&... Args) { +    T *Object = new (Temporaries.Allocate<T>()) T(std::forward<Types>(Args)...); +    return {allocateObject(*Object), Object}; +  } + +  size_t allocateString(StringRef Str); + +  void writeTo(raw_ostream &OS) const; + +private: +  size_t NextOffset = 0; + +  BumpPtrAllocator Temporaries; +  std::vector<std::function<void(raw_ostream &)>> Callbacks; +}; +} // namespace + +template <typename T, typename RangeType> +std::pair<size_t, MutableArrayRef<T>> +BlobAllocator::allocateNewArray(const iterator_range<RangeType> &Range) { +  size_t Num = std::distance(Range.begin(), Range.end()); +  MutableArrayRef<T> Array(Temporaries.Allocate<T>(Num), Num); +  std::uninitialized_copy(Range.begin(), Range.end(), Array.begin()); +  return {allocateArray(Array), Array}; +} + +size_t BlobAllocator::allocateString(StringRef Str) { +  SmallVector<UTF16, 32> WStr; +  bool OK = convertUTF8ToUTF16String(Str, WStr); +  assert(OK && "Invalid UTF8 in Str?"); +  (void)OK; + +  // The utf16 string is null-terminated, but the terminator is not counted in +  // the string size. +  WStr.push_back(0); +  size_t Result = +      allocateNewObject<support::ulittle32_t>(2 * (WStr.size() - 1)).first; +  allocateNewArray<support::ulittle16_t>(make_range(WStr.begin(), WStr.end())); +  return Result; +} + +void BlobAllocator::writeTo(raw_ostream &OS) const { +  size_t BeginOffset = OS.tell(); +  for (const auto &Callback : Callbacks) +    Callback(OS); +  assert(OS.tell() == BeginOffset + NextOffset && +         "Callbacks wrote an unexpected number of bytes."); +  (void)BeginOffset; +} + +static LocationDescriptor layout(BlobAllocator &File, yaml::BinaryRef Data) { +  return {support::ulittle32_t(Data.binary_size()), +          support::ulittle32_t(File.allocateBytes(Data))}; +} + +static size_t layout(BlobAllocator &File, MinidumpYAML::ExceptionStream &S) { +  File.allocateObject(S.MDExceptionStream); + +  size_t DataEnd = File.tell(); + +  // Lay out the thread context data, (which is not a part of the stream). +  // TODO: This usually (always?) matches the thread context of the +  // corresponding thread, and may overlap memory regions as well.  We could +  // add a level of indirection to the MinidumpYAML format (like an array of +  // Blobs that the LocationDescriptors index into) to be able to distinguish +  // the cases where location descriptions overlap vs happen to reference +  // identical data. +  S.MDExceptionStream.ThreadContext = layout(File, S.ThreadContext); + +  return DataEnd; +} + +static void layout(BlobAllocator &File, MemoryListStream::entry_type &Range) { +  Range.Entry.Memory = layout(File, Range.Content); +} + +static void layout(BlobAllocator &File, ModuleListStream::entry_type &M) { +  M.Entry.ModuleNameRVA = File.allocateString(M.Name); + +  M.Entry.CvRecord = layout(File, M.CvRecord); +  M.Entry.MiscRecord = layout(File, M.MiscRecord); +} + +static void layout(BlobAllocator &File, ThreadListStream::entry_type &T) { +  T.Entry.Stack.Memory = layout(File, T.Stack); +  T.Entry.Context = layout(File, T.Context); +} + +template <typename EntryT> +static size_t layout(BlobAllocator &File, +                     MinidumpYAML::detail::ListStream<EntryT> &S) { + +  File.allocateNewObject<support::ulittle32_t>(S.Entries.size()); +  for (auto &E : S.Entries) +    File.allocateObject(E.Entry); + +  size_t DataEnd = File.tell(); + +  // Lay out the auxiliary data, (which is not a part of the stream). +  DataEnd = File.tell(); +  for (auto &E : S.Entries) +    layout(File, E); + +  return DataEnd; +} + +static Directory layout(BlobAllocator &File, Stream &S) { +  Directory Result; +  Result.Type = S.Type; +  Result.Location.RVA = File.tell(); +  Optional<size_t> DataEnd; +  switch (S.Kind) { +  case Stream::StreamKind::Exception: +    DataEnd = layout(File, cast<MinidumpYAML::ExceptionStream>(S)); +    break; +  case Stream::StreamKind::MemoryInfoList: { +    MemoryInfoListStream &InfoList = cast<MemoryInfoListStream>(S); +    File.allocateNewObject<minidump::MemoryInfoListHeader>( +        sizeof(minidump::MemoryInfoListHeader), sizeof(minidump::MemoryInfo), +        InfoList.Infos.size()); +    File.allocateArray(makeArrayRef(InfoList.Infos)); +    break; +  } +  case Stream::StreamKind::MemoryList: +    DataEnd = layout(File, cast<MemoryListStream>(S)); +    break; +  case Stream::StreamKind::ModuleList: +    DataEnd = layout(File, cast<ModuleListStream>(S)); +    break; +  case Stream::StreamKind::RawContent: { +    RawContentStream &Raw = cast<RawContentStream>(S); +    File.allocateCallback(Raw.Size, [&Raw](raw_ostream &OS) { +      Raw.Content.writeAsBinary(OS); +      assert(Raw.Content.binary_size() <= Raw.Size); +      OS << std::string(Raw.Size - Raw.Content.binary_size(), '\0'); +    }); +    break; +  } +  case Stream::StreamKind::SystemInfo: { +    SystemInfoStream &SystemInfo = cast<SystemInfoStream>(S); +    File.allocateObject(SystemInfo.Info); +    // The CSD string is not a part of the stream. +    DataEnd = File.tell(); +    SystemInfo.Info.CSDVersionRVA = File.allocateString(SystemInfo.CSDVersion); +    break; +  } +  case Stream::StreamKind::TextContent: +    File.allocateArray(arrayRefFromStringRef(cast<TextContentStream>(S).Text)); +    break; +  case Stream::StreamKind::ThreadList: +    DataEnd = layout(File, cast<ThreadListStream>(S)); +    break; +  } +  // If DataEnd is not set, we assume everything we generated is a part of the +  // stream. +  Result.Location.DataSize = +      DataEnd.getValueOr(File.tell()) - Result.Location.RVA; +  return Result; +} + +namespace llvm { +namespace yaml { + +bool yaml2minidump(MinidumpYAML::Object &Obj, raw_ostream &Out, +                   ErrorHandler /*EH*/) { +  BlobAllocator File; +  File.allocateObject(Obj.Header); + +  std::vector<Directory> StreamDirectory(Obj.Streams.size()); +  Obj.Header.StreamDirectoryRVA = +      File.allocateArray(makeArrayRef(StreamDirectory)); +  Obj.Header.NumberOfStreams = StreamDirectory.size(); + +  for (auto &Stream : enumerate(Obj.Streams)) +    StreamDirectory[Stream.index()] = layout(File, *Stream.value()); + +  File.writeTo(Out); +  return true; +} + +} // namespace yaml +} // namespace llvm | 
