123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247 |
- //===- yaml2minidump.cpp - Convert a YAML file to a minidump file ---------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/ObjectYAML/MinidumpYAML.h"
- #include "llvm/ObjectYAML/yaml2obj.h"
- #include "llvm/Support/ConvertUTF.h"
- #include "llvm/Support/raw_ostream.h"
- using namespace llvm;
- using namespace llvm::minidump;
- using namespace llvm::MinidumpYAML;
- namespace {
- /// A helper class to manage the placement of various structures into the final
- /// minidump binary. Space for objects can be allocated via various allocate***
- /// methods, while the final minidump file is written by calling the writeTo
- /// method. The plain versions of allocation functions take a reference to the
- /// data which is to be written (and hence the data must be available until
- /// writeTo is called), while the "New" versions allocate the data in an
- /// allocator-managed buffer, which is available until the allocator object is
- /// destroyed. For both kinds of functions, it is possible to modify the
- /// data for which the space has been "allocated" until the final writeTo call.
- /// This is useful for "linking" the allocated structures via their offsets.
- class BlobAllocator {
- public:
- size_t tell() const { return NextOffset; }
- size_t allocateCallback(size_t Size,
- std::function<void(raw_ostream &)> Callback) {
- size_t Offset = NextOffset;
- NextOffset += Size;
- Callbacks.push_back(std::move(Callback));
- return Offset;
- }
- size_t allocateBytes(ArrayRef<uint8_t> Data) {
- return allocateCallback(
- Data.size(), [Data](raw_ostream &OS) { OS << toStringRef(Data); });
- }
- size_t allocateBytes(yaml::BinaryRef Data) {
- return allocateCallback(Data.binary_size(), [Data](raw_ostream &OS) {
- Data.writeAsBinary(OS);
- });
- }
- template <typename T> size_t allocateArray(ArrayRef<T> Data) {
- return allocateBytes({reinterpret_cast<const uint8_t *>(Data.data()),
- sizeof(T) * Data.size()});
- }
- template <typename T, typename RangeType>
- std::pair<size_t, MutableArrayRef<T>>
- allocateNewArray(const iterator_range<RangeType> &Range);
- template <typename T> size_t allocateObject(const T &Data) {
- return allocateArray(makeArrayRef(Data));
- }
- template <typename T, typename... Types>
- std::pair<size_t, T *> allocateNewObject(Types &&... Args) {
- T *Object = new (Temporaries.Allocate<T>()) T(std::forward<Types>(Args)...);
- return {allocateObject(*Object), Object};
- }
- size_t allocateString(StringRef Str);
- void writeTo(raw_ostream &OS) const;
- private:
- size_t NextOffset = 0;
- BumpPtrAllocator Temporaries;
- std::vector<std::function<void(raw_ostream &)>> Callbacks;
- };
- } // namespace
- template <typename T, typename RangeType>
- std::pair<size_t, MutableArrayRef<T>>
- BlobAllocator::allocateNewArray(const iterator_range<RangeType> &Range) {
- size_t Num = std::distance(Range.begin(), Range.end());
- MutableArrayRef<T> Array(Temporaries.Allocate<T>(Num), Num);
- std::uninitialized_copy(Range.begin(), Range.end(), Array.begin());
- return {allocateArray(Array), Array};
- }
- size_t BlobAllocator::allocateString(StringRef Str) {
- SmallVector<UTF16, 32> WStr;
- bool OK = convertUTF8ToUTF16String(Str, WStr);
- assert(OK && "Invalid UTF8 in Str?");
- (void)OK;
- // The utf16 string is null-terminated, but the terminator is not counted in
- // the string size.
- WStr.push_back(0);
- size_t Result =
- allocateNewObject<support::ulittle32_t>(2 * (WStr.size() - 1)).first;
- allocateNewArray<support::ulittle16_t>(make_range(WStr.begin(), WStr.end()));
- return Result;
- }
- void BlobAllocator::writeTo(raw_ostream &OS) const {
- size_t BeginOffset = OS.tell();
- for (const auto &Callback : Callbacks)
- Callback(OS);
- assert(OS.tell() == BeginOffset + NextOffset &&
- "Callbacks wrote an unexpected number of bytes.");
- (void)BeginOffset;
- }
- static LocationDescriptor layout(BlobAllocator &File, yaml::BinaryRef Data) {
- return {support::ulittle32_t(Data.binary_size()),
- support::ulittle32_t(File.allocateBytes(Data))};
- }
- static size_t layout(BlobAllocator &File, MinidumpYAML::ExceptionStream &S) {
- File.allocateObject(S.MDExceptionStream);
- size_t DataEnd = File.tell();
- // Lay out the thread context data, (which is not a part of the stream).
- // TODO: This usually (always?) matches the thread context of the
- // corresponding thread, and may overlap memory regions as well. We could
- // add a level of indirection to the MinidumpYAML format (like an array of
- // Blobs that the LocationDescriptors index into) to be able to distinguish
- // the cases where location descriptions overlap vs happen to reference
- // identical data.
- S.MDExceptionStream.ThreadContext = layout(File, S.ThreadContext);
- return DataEnd;
- }
- static void layout(BlobAllocator &File, MemoryListStream::entry_type &Range) {
- Range.Entry.Memory = layout(File, Range.Content);
- }
- static void layout(BlobAllocator &File, ModuleListStream::entry_type &M) {
- M.Entry.ModuleNameRVA = File.allocateString(M.Name);
- M.Entry.CvRecord = layout(File, M.CvRecord);
- M.Entry.MiscRecord = layout(File, M.MiscRecord);
- }
- static void layout(BlobAllocator &File, ThreadListStream::entry_type &T) {
- T.Entry.Stack.Memory = layout(File, T.Stack);
- T.Entry.Context = layout(File, T.Context);
- }
- template <typename EntryT>
- static size_t layout(BlobAllocator &File,
- MinidumpYAML::detail::ListStream<EntryT> &S) {
- File.allocateNewObject<support::ulittle32_t>(S.Entries.size());
- for (auto &E : S.Entries)
- File.allocateObject(E.Entry);
- size_t DataEnd = File.tell();
- // Lay out the auxiliary data, (which is not a part of the stream).
- DataEnd = File.tell();
- for (auto &E : S.Entries)
- layout(File, E);
- return DataEnd;
- }
- static Directory layout(BlobAllocator &File, Stream &S) {
- Directory Result;
- Result.Type = S.Type;
- Result.Location.RVA = File.tell();
- Optional<size_t> DataEnd;
- switch (S.Kind) {
- case Stream::StreamKind::Exception:
- DataEnd = layout(File, cast<MinidumpYAML::ExceptionStream>(S));
- break;
- case Stream::StreamKind::MemoryInfoList: {
- MemoryInfoListStream &InfoList = cast<MemoryInfoListStream>(S);
- File.allocateNewObject<minidump::MemoryInfoListHeader>(
- sizeof(minidump::MemoryInfoListHeader), sizeof(minidump::MemoryInfo),
- InfoList.Infos.size());
- File.allocateArray(makeArrayRef(InfoList.Infos));
- break;
- }
- case Stream::StreamKind::MemoryList:
- DataEnd = layout(File, cast<MemoryListStream>(S));
- break;
- case Stream::StreamKind::ModuleList:
- DataEnd = layout(File, cast<ModuleListStream>(S));
- break;
- case Stream::StreamKind::RawContent: {
- RawContentStream &Raw = cast<RawContentStream>(S);
- File.allocateCallback(Raw.Size, [&Raw](raw_ostream &OS) {
- Raw.Content.writeAsBinary(OS);
- assert(Raw.Content.binary_size() <= Raw.Size);
- OS << std::string(Raw.Size - Raw.Content.binary_size(), '\0');
- });
- break;
- }
- case Stream::StreamKind::SystemInfo: {
- SystemInfoStream &SystemInfo = cast<SystemInfoStream>(S);
- File.allocateObject(SystemInfo.Info);
- // The CSD string is not a part of the stream.
- DataEnd = File.tell();
- SystemInfo.Info.CSDVersionRVA = File.allocateString(SystemInfo.CSDVersion);
- break;
- }
- case Stream::StreamKind::TextContent:
- File.allocateArray(arrayRefFromStringRef(cast<TextContentStream>(S).Text));
- break;
- case Stream::StreamKind::ThreadList:
- DataEnd = layout(File, cast<ThreadListStream>(S));
- break;
- }
- // If DataEnd is not set, we assume everything we generated is a part of the
- // stream.
- Result.Location.DataSize =
- DataEnd.getValueOr(File.tell()) - Result.Location.RVA;
- return Result;
- }
- namespace llvm {
- namespace yaml {
- bool yaml2minidump(MinidumpYAML::Object &Obj, raw_ostream &Out,
- ErrorHandler /*EH*/) {
- BlobAllocator File;
- File.allocateObject(Obj.Header);
- std::vector<Directory> StreamDirectory(Obj.Streams.size());
- Obj.Header.StreamDirectoryRVA =
- File.allocateArray(makeArrayRef(StreamDirectory));
- Obj.Header.NumberOfStreams = StreamDirectory.size();
- for (auto &Stream : enumerate(Obj.Streams))
- StreamDirectory[Stream.index()] = layout(File, *Stream.value());
- File.writeTo(Out);
- return true;
- }
- } // namespace yaml
- } // namespace llvm
|