//===- Minidump.cpp - Minidump object file implementation -----------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
8581d79a4SPavel Labath 
9581d79a4SPavel Labath #include "llvm/Object/Minidump.h"
10581d79a4SPavel Labath #include "llvm/Object/Error.h"
1151d9fa0aSPavel Labath #include "llvm/Support/ConvertUTF.h"
12581d79a4SPavel Labath 
13581d79a4SPavel Labath using namespace llvm;
14581d79a4SPavel Labath using namespace llvm::object;
15581d79a4SPavel Labath using namespace llvm::minidump;
16581d79a4SPavel Labath 
17581d79a4SPavel Labath Optional<ArrayRef<uint8_t>>
getRawStream(minidump::StreamType Type) const18581d79a4SPavel Labath MinidumpFile::getRawStream(minidump::StreamType Type) const {
19581d79a4SPavel Labath   auto It = StreamMap.find(Type);
20581d79a4SPavel Labath   if (It != StreamMap.end())
21581d79a4SPavel Labath     return getRawStream(Streams[It->second]);
22581d79a4SPavel Labath   return None;
23581d79a4SPavel Labath }
24581d79a4SPavel Labath 
getString(size_t Offset) const2551d9fa0aSPavel Labath Expected<std::string> MinidumpFile::getString(size_t Offset) const {
2651d9fa0aSPavel Labath   // Minidump strings consist of a 32-bit length field, which gives the size of
2751d9fa0aSPavel Labath   // the string in *bytes*. This is followed by the actual string encoded in
2851d9fa0aSPavel Labath   // UTF16.
2951d9fa0aSPavel Labath   auto ExpectedSize =
3051d9fa0aSPavel Labath       getDataSliceAs<support::ulittle32_t>(getData(), Offset, 1);
3151d9fa0aSPavel Labath   if (!ExpectedSize)
3251d9fa0aSPavel Labath     return ExpectedSize.takeError();
3351d9fa0aSPavel Labath   size_t Size = (*ExpectedSize)[0];
3451d9fa0aSPavel Labath   if (Size % 2 != 0)
3551d9fa0aSPavel Labath     return createError("String size not even");
3651d9fa0aSPavel Labath   Size /= 2;
3751d9fa0aSPavel Labath   if (Size == 0)
3851d9fa0aSPavel Labath     return "";
3951d9fa0aSPavel Labath 
4051d9fa0aSPavel Labath   Offset += sizeof(support::ulittle32_t);
41ebdc698dSPavel Labath   auto ExpectedData =
42ebdc698dSPavel Labath       getDataSliceAs<support::ulittle16_t>(getData(), Offset, Size);
4351d9fa0aSPavel Labath   if (!ExpectedData)
4451d9fa0aSPavel Labath     return ExpectedData.takeError();
4551d9fa0aSPavel Labath 
46ebdc698dSPavel Labath   SmallVector<UTF16, 32> WStr(Size);
47ebdc698dSPavel Labath   copy(*ExpectedData, WStr.begin());
48ebdc698dSPavel Labath 
4951d9fa0aSPavel Labath   std::string Result;
50ebdc698dSPavel Labath   if (!convertUTF16ToUTF8String(WStr, Result))
5151d9fa0aSPavel Labath     return createError("String decoding failed");
5251d9fa0aSPavel Labath 
5351d9fa0aSPavel Labath   return Result;
5451d9fa0aSPavel Labath }
5551d9fa0aSPavel Labath 
56*6e0b1ce4SPavel Labath Expected<iterator_range<MinidumpFile::MemoryInfoIterator>>
getMemoryInfoList() const57*6e0b1ce4SPavel Labath MinidumpFile::getMemoryInfoList() const {
58*6e0b1ce4SPavel Labath   Optional<ArrayRef<uint8_t>> Stream = getRawStream(StreamType::MemoryInfoList);
59*6e0b1ce4SPavel Labath   if (!Stream)
60aaff480cSPavel Labath     return createError("No such stream");
61*6e0b1ce4SPavel Labath   auto ExpectedHeader =
62*6e0b1ce4SPavel Labath       getDataSliceAs<minidump::MemoryInfoListHeader>(*Stream, 0, 1);
63*6e0b1ce4SPavel Labath   if (!ExpectedHeader)
64*6e0b1ce4SPavel Labath     return ExpectedHeader.takeError();
65*6e0b1ce4SPavel Labath   const minidump::MemoryInfoListHeader &H = ExpectedHeader.get()[0];
66*6e0b1ce4SPavel Labath   Expected<ArrayRef<uint8_t>> Data =
67*6e0b1ce4SPavel Labath       getDataSlice(*Stream, H.SizeOfHeader, H.SizeOfEntry * H.NumberOfEntries);
68*6e0b1ce4SPavel Labath   if (!Data)
69*6e0b1ce4SPavel Labath     return Data.takeError();
70*6e0b1ce4SPavel Labath   return make_range(MemoryInfoIterator(*Data, H.SizeOfEntry),
71*6e0b1ce4SPavel Labath                     MemoryInfoIterator({}, H.SizeOfEntry));
72*6e0b1ce4SPavel Labath }
73*6e0b1ce4SPavel Labath 
74*6e0b1ce4SPavel Labath template <typename T>
getListStream(StreamType Type) const75*6e0b1ce4SPavel Labath Expected<ArrayRef<T>> MinidumpFile::getListStream(StreamType Type) const {
76*6e0b1ce4SPavel Labath   Optional<ArrayRef<uint8_t>> Stream = getRawStream(Type);
77*6e0b1ce4SPavel Labath   if (!Stream)
78*6e0b1ce4SPavel Labath     return createError("No such stream");
79*6e0b1ce4SPavel Labath   auto ExpectedSize = getDataSliceAs<support::ulittle32_t>(*Stream, 0, 1);
80aaff480cSPavel Labath   if (!ExpectedSize)
81aaff480cSPavel Labath     return ExpectedSize.takeError();
82aaff480cSPavel Labath 
83aaff480cSPavel Labath   size_t ListSize = ExpectedSize.get()[0];
84aaff480cSPavel Labath 
85aaff480cSPavel Labath   size_t ListOffset = 4;
86cfc4519eSPavel Labath   // Some producers insert additional padding bytes to align the list to an
87cfc4519eSPavel Labath   // 8-byte boundary. Check for that by comparing the list size with the overall
88cfc4519eSPavel Labath   // stream size.
89*6e0b1ce4SPavel Labath   if (ListOffset + sizeof(T) * ListSize < Stream->size())
90aaff480cSPavel Labath     ListOffset = 8;
91aaff480cSPavel Labath 
92*6e0b1ce4SPavel Labath   return getDataSliceAs<T>(*Stream, ListOffset, ListSize);
93aaff480cSPavel Labath }
94cfc4519eSPavel Labath template Expected<ArrayRef<Module>>
95cfc4519eSPavel Labath     MinidumpFile::getListStream(StreamType) const;
96cfc4519eSPavel Labath template Expected<ArrayRef<Thread>>
97cfc4519eSPavel Labath     MinidumpFile::getListStream(StreamType) const;
982d29e16cSPavel Labath template Expected<ArrayRef<MemoryDescriptor>>
992d29e16cSPavel Labath     MinidumpFile::getListStream(StreamType) const;
100aaff480cSPavel Labath 
101581d79a4SPavel Labath Expected<ArrayRef<uint8_t>>
getDataSlice(ArrayRef<uint8_t> Data,size_t Offset,size_t Size)102581d79a4SPavel Labath MinidumpFile::getDataSlice(ArrayRef<uint8_t> Data, size_t Offset, size_t Size) {
103581d79a4SPavel Labath   // Check for overflow.
104581d79a4SPavel Labath   if (Offset + Size < Offset || Offset + Size < Size ||
105581d79a4SPavel Labath       Offset + Size > Data.size())
106581d79a4SPavel Labath     return createEOFError();
107581d79a4SPavel Labath   return Data.slice(Offset, Size);
108581d79a4SPavel Labath }
109581d79a4SPavel Labath 
110581d79a4SPavel Labath Expected<std::unique_ptr<MinidumpFile>>
create(MemoryBufferRef Source)111581d79a4SPavel Labath MinidumpFile::create(MemoryBufferRef Source) {
112581d79a4SPavel Labath   ArrayRef<uint8_t> Data = arrayRefFromStringRef(Source.getBuffer());
113581d79a4SPavel Labath   auto ExpectedHeader = getDataSliceAs<minidump::Header>(Data, 0, 1);
114581d79a4SPavel Labath   if (!ExpectedHeader)
115581d79a4SPavel Labath     return ExpectedHeader.takeError();
116581d79a4SPavel Labath 
117581d79a4SPavel Labath   const minidump::Header &Hdr = (*ExpectedHeader)[0];
118581d79a4SPavel Labath   if (Hdr.Signature != Header::MagicSignature)
119581d79a4SPavel Labath     return createError("Invalid signature");
120581d79a4SPavel Labath   if ((Hdr.Version & 0xffff) != Header::MagicVersion)
121581d79a4SPavel Labath     return createError("Invalid version");
122581d79a4SPavel Labath 
123581d79a4SPavel Labath   auto ExpectedStreams = getDataSliceAs<Directory>(Data, Hdr.StreamDirectoryRVA,
124581d79a4SPavel Labath                                                    Hdr.NumberOfStreams);
125581d79a4SPavel Labath   if (!ExpectedStreams)
126581d79a4SPavel Labath     return ExpectedStreams.takeError();
127581d79a4SPavel Labath 
128581d79a4SPavel Labath   DenseMap<StreamType, std::size_t> StreamMap;
129*6e0b1ce4SPavel Labath   for (const auto &StreamDescriptor : llvm::enumerate(*ExpectedStreams)) {
130*6e0b1ce4SPavel Labath     StreamType Type = StreamDescriptor.value().Type;
131*6e0b1ce4SPavel Labath     const LocationDescriptor &Loc = StreamDescriptor.value().Location;
132581d79a4SPavel Labath 
133*6e0b1ce4SPavel Labath     Expected<ArrayRef<uint8_t>> Stream =
134*6e0b1ce4SPavel Labath         getDataSlice(Data, Loc.RVA, Loc.DataSize);
135*6e0b1ce4SPavel Labath     if (!Stream)
136*6e0b1ce4SPavel Labath       return Stream.takeError();
137581d79a4SPavel Labath 
138581d79a4SPavel Labath     if (Type == StreamType::Unused && Loc.DataSize == 0) {
139581d79a4SPavel Labath       // Ignore dummy streams. This is technically ill-formed, but a number of
140581d79a4SPavel Labath       // existing minidumps seem to contain such streams.
141581d79a4SPavel Labath       continue;
142581d79a4SPavel Labath     }
143581d79a4SPavel Labath 
144581d79a4SPavel Labath     if (Type == DenseMapInfo<StreamType>::getEmptyKey() ||
145581d79a4SPavel Labath         Type == DenseMapInfo<StreamType>::getTombstoneKey())
146581d79a4SPavel Labath       return createError("Cannot handle one of the minidump streams");
147581d79a4SPavel Labath 
148581d79a4SPavel Labath     // Update the directory map, checking for duplicate stream types.
149*6e0b1ce4SPavel Labath     if (!StreamMap.try_emplace(Type, StreamDescriptor.index()).second)
150581d79a4SPavel Labath       return createError("Duplicate stream type");
151581d79a4SPavel Labath   }
152581d79a4SPavel Labath 
153581d79a4SPavel Labath   return std::unique_ptr<MinidumpFile>(
154581d79a4SPavel Labath       new MinidumpFile(Source, Hdr, *ExpectedStreams, std::move(StreamMap)));
155581d79a4SPavel Labath }
156