LLVM 22.0.0git
OnDiskTrieRawHashMap.cpp
Go to the documentation of this file.
1//===----------------------------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8///
9/// \file Implements OnDiskTrieRawHashMap.
10///
11//===----------------------------------------------------------------------===//
12
14#include "DatabaseFile.h"
18#include "llvm/Config/llvm-config.h"
22
23using namespace llvm;
24using namespace llvm::cas;
25using namespace llvm::cas::ondisk;
26
27#if LLVM_ENABLE_ONDISK_CAS
28
29//===----------------------------------------------------------------------===//
30// TrieRawHashMap data structures.
31//===----------------------------------------------------------------------===//
32
33namespace {
34
35class SubtrieHandle;
36class TrieRawHashMapHandle;
37class TrieVisitor;
38
39/// A value stored in the slots inside a SubTrie. A stored value can either be a
40/// subtrie (encoded after negation) which is the file offset to another
41/// subtrie, or it can be a fileset to a DataRecord.
42class SubtrieSlotValue {
43public:
44 explicit operator bool() const { return !isEmpty(); }
45 bool isEmpty() const { return !Offset; }
46 bool isData() const { return Offset > 0; }
47 bool isSubtrie() const { return Offset < 0; }
48 uint64_t asData() const {
49 assert(isData());
50 return Offset;
51 }
52 uint64_t asSubtrie() const {
53 assert(isSubtrie());
54 return -Offset;
55 }
56
57 FileOffset asSubtrieFileOffset() const { return FileOffset(asSubtrie()); }
58
59 FileOffset asDataFileOffset() const { return FileOffset(asData()); }
60
61 int64_t getRawOffset() const { return Offset; }
62
63 static SubtrieSlotValue getDataOffset(int64_t Offset) {
64 return SubtrieSlotValue(Offset);
65 }
66
67 static SubtrieSlotValue getSubtrieOffset(int64_t Offset) {
68 return SubtrieSlotValue(-Offset);
69 }
70
71 static SubtrieSlotValue getDataOffset(FileOffset Offset) {
72 return getDataOffset(Offset.get());
73 }
74
75 static SubtrieSlotValue getSubtrieOffset(FileOffset Offset) {
76 return getDataOffset(Offset.get());
77 }
78
79 static SubtrieSlotValue getFromSlot(std::atomic<int64_t> &Slot) {
80 return SubtrieSlotValue(Slot.load());
81 }
82
83 SubtrieSlotValue() = default;
84
85private:
86 friend class SubtrieHandle;
87 explicit SubtrieSlotValue(int64_t Offset) : Offset(Offset) {}
88 int64_t Offset = 0;
89};
90
91/// Subtrie layout:
92/// - 2-bytes: StartBit
93/// - 1-bytes: NumBits=lg(num-slots)
94/// - 5-bytes: 0-pad
95/// - <slots>
96class SubtrieHandle {
97public:
98 struct Header {
99 /// The bit this subtrie starts on.
100 uint16_t StartBit;
101
102 /// The number of bits this subtrie handles. It has 2^NumBits slots.
103 uint8_t NumBits;
104
105 /// 0-pad to 8B.
106 uint8_t ZeroPad1B;
107 uint32_t ZeroPad4B;
108 };
109
110 /// Slot storage:
111 /// - zero: Empty
112 /// - positive: RecordOffset
113 /// - negative: SubtrieOffset
114 using SlotT = std::atomic<int64_t>;
115
116 static int64_t getSlotsSize(uint32_t NumBits) {
117 return sizeof(int64_t) * (1u << NumBits);
118 }
119
120 static int64_t getSize(uint32_t NumBits) {
121 return sizeof(SubtrieHandle::Header) + getSlotsSize(NumBits);
122 }
123
124 int64_t getSize() const { return getSize(H->NumBits); }
125 size_t getNumSlots() const { return Slots.size(); }
126
127 SubtrieSlotValue load(size_t I) const {
128 return SubtrieSlotValue(Slots[I].load());
129 }
130 void store(size_t I, SubtrieSlotValue V) {
131 return Slots[I].store(V.getRawOffset());
132 }
133
134 void printHash(raw_ostream &OS, ArrayRef<uint8_t> Bytes) const;
135
136 /// Return None on success, or the existing offset on failure.
137 bool compare_exchange_strong(size_t I, SubtrieSlotValue &Expected,
138 SubtrieSlotValue New) {
139 return Slots[I].compare_exchange_strong(Expected.Offset, New.Offset);
140 }
141
142 /// Sink \p V from \p I in this subtrie down to \p NewI in a new subtrie with
143 /// \p NumSubtrieBits.
144 ///
145 /// \p UnusedSubtrie maintains a 1-item "free" list of unused subtries. If a
146 /// new subtrie is created that isn't used because of a lost race, then it If
147 /// it's already valid, it should be used instead of allocating a new one.
148 /// should be returned as an out parameter to be passed back in the future.
149 /// If it's already valid, it should be used instead of allocating a new one.
150 ///
151 /// Returns the subtrie that now lives at \p I.
152 Expected<SubtrieHandle> sink(size_t I, SubtrieSlotValue V,
153 MappedFileRegionArena &Alloc,
154 size_t NumSubtrieBits,
155 SubtrieHandle &UnusedSubtrie, size_t NewI);
156
157 /// Only safe if the subtrie is empty.
158 void reinitialize(uint32_t StartBit, uint32_t NumBits);
159
160 SubtrieSlotValue getOffset() const {
161 return SubtrieSlotValue::getSubtrieOffset(
162 reinterpret_cast<const char *>(H) - Region->data());
163 }
164
165 FileOffset getFileOffset() const { return getOffset().asSubtrieFileOffset(); }
166
167 explicit operator bool() const { return H; }
168
169 Header &getHeader() const { return *H; }
170 uint32_t getStartBit() const { return H->StartBit; }
171 uint32_t getNumBits() const { return H->NumBits; }
172
173 static Expected<SubtrieHandle> create(MappedFileRegionArena &Alloc,
174 uint32_t StartBit, uint32_t NumBits);
175
176 static SubtrieHandle getFromFileOffset(MappedFileRegion &Region,
177 FileOffset Offset) {
178 return SubtrieHandle(Region, SubtrieSlotValue::getSubtrieOffset(Offset));
179 }
180
181 SubtrieHandle() = default;
182 SubtrieHandle(MappedFileRegion &Region, Header &H)
183 : Region(&Region), H(&H), Slots(getSlots(H)) {}
184 SubtrieHandle(MappedFileRegion &Region, SubtrieSlotValue Offset)
185 : SubtrieHandle(Region, *reinterpret_cast<Header *>(
186 Region.data() + Offset.asSubtrie())) {}
187
188private:
189 MappedFileRegion *Region = nullptr;
190 Header *H = nullptr;
192
193 static MutableArrayRef<SlotT> getSlots(Header &H) {
194 return MutableArrayRef(reinterpret_cast<SlotT *>(&H + 1), 1u << H.NumBits);
195 }
196};
197
198/// Handle for a TrieRawHashMap table.
199///
200/// TrieRawHashMap table layout:
201/// - [8-bytes: Generic table header]
202/// - 1-byte: NumSubtrieBits
203/// - 1-byte: Flags (not used yet)
204/// - 2-bytes: NumHashBits
205/// - 4-bytes: RecordDataSize (in bytes)
206/// - 8-bytes: RootTrieOffset
207/// - 8-bytes: AllocatorOffset (reserved for implementing free lists)
208/// - <name> '\0'
209///
210/// Record layout:
211/// - <hash>
212/// - <data>
213class TrieRawHashMapHandle {
214public:
215 static constexpr TableHandle::TableKind Kind =
216 TableHandle::TableKind::TrieRawHashMap;
217
218 struct Header {
219 TableHandle::Header GenericHeader;
220 uint8_t NumSubtrieBits;
221 uint8_t Flags; ///< None used yet.
222 uint16_t NumHashBits;
223 uint32_t RecordDataSize;
224 std::atomic<int64_t> RootTrieOffset;
225 std::atomic<int64_t> AllocatorOffset;
226 };
227
228 operator TableHandle() const {
229 if (!H)
230 return TableHandle();
231 return TableHandle(*Region, H->GenericHeader);
232 }
233
234 struct RecordData {
235 OnDiskTrieRawHashMap::ValueProxy Proxy;
236 SubtrieSlotValue Offset;
237 FileOffset getFileOffset() const { return Offset.asDataFileOffset(); }
238 };
239
240 enum Limits : size_t {
241 /// Seems like 65528 hash bits ought to be enough.
242 MaxNumHashBytes = UINT16_MAX >> 3,
243 MaxNumHashBits = MaxNumHashBytes << 3,
244
245 /// 2^16 bits in a trie is 65536 slots. This restricts us to a 16-bit
246 /// index. This many slots is suspicously large anyway.
247 MaxNumRootBits = 16,
248
249 /// 2^10 bits in a trie is 1024 slots. This many slots seems suspiciously
250 /// large for subtries.
251 MaxNumSubtrieBits = 10,
252 };
253
254 static constexpr size_t getNumHashBytes(size_t NumHashBits) {
255 assert(NumHashBits % 8 == 0);
256 return NumHashBits / 8;
257 }
258 static constexpr size_t getRecordSize(size_t RecordDataSize,
259 size_t NumHashBits) {
260 return RecordDataSize + getNumHashBytes(NumHashBits);
261 }
262
263 RecordData getRecord(SubtrieSlotValue Offset);
264 Expected<RecordData> createRecord(MappedFileRegionArena &Alloc,
265 ArrayRef<uint8_t> Hash);
266
267 explicit operator bool() const { return H; }
268 const Header &getHeader() const { return *H; }
269 SubtrieHandle getRoot() const;
270 Expected<SubtrieHandle> getOrCreateRoot(MappedFileRegionArena &Alloc);
271 MappedFileRegion &getRegion() const { return *Region; }
272
273 size_t getFlags() const { return H->Flags; }
274 size_t getNumSubtrieBits() const { return H->NumSubtrieBits; }
275 size_t getNumHashBits() const { return H->NumHashBits; }
276 size_t getNumHashBytes() const { return getNumHashBytes(H->NumHashBits); }
277 size_t getRecordDataSize() const { return H->RecordDataSize; }
278 size_t getRecordSize() const {
279 return getRecordSize(H->RecordDataSize, H->NumHashBits);
280 }
281
282 TrieHashIndexGenerator getIndexGen(SubtrieHandle Root,
283 ArrayRef<uint8_t> Hash) {
284 assert(Root.getStartBit() == 0);
285 assert(getNumHashBytes() == Hash.size());
286 assert(getNumHashBits() == Hash.size() * 8);
287 return TrieHashIndexGenerator{Root.getNumBits(), getNumSubtrieBits(), Hash};
288 }
289
290 static Expected<TrieRawHashMapHandle>
291 create(MappedFileRegionArena &Alloc, StringRef Name,
292 std::optional<uint64_t> NumRootBits, uint64_t NumSubtrieBits,
293 uint64_t NumHashBits, uint64_t RecordDataSize);
294
295 void
296 print(raw_ostream &OS,
297 function_ref<void(ArrayRef<char>)> PrintRecordData = nullptr) const;
298
300 function_ref<Error(FileOffset, OnDiskTrieRawHashMap::ConstValueProxy)>
301 RecordVerifier) const;
302 TrieRawHashMapHandle() = default;
303 TrieRawHashMapHandle(MappedFileRegion &Region, Header &H)
304 : Region(&Region), H(&H) {}
305 TrieRawHashMapHandle(MappedFileRegion &Region, intptr_t HeaderOffset)
306 : TrieRawHashMapHandle(
307 Region, *reinterpret_cast<Header *>(Region.data() + HeaderOffset)) {
308 }
309
310private:
311 MappedFileRegion *Region = nullptr;
312 Header *H = nullptr;
313};
314
315} // end anonymous namespace
316
318 DatabaseFile File;
319 TrieRawHashMapHandle Trie;
320};
321
323 uint32_t StartBit,
324 uint32_t NumBits) {
325 assert(StartBit <= TrieRawHashMapHandle::MaxNumHashBits);
326 assert(NumBits <= UINT8_MAX);
327 assert(NumBits <= TrieRawHashMapHandle::MaxNumRootBits);
328
329 auto Mem = Alloc.allocate(getSize(NumBits));
330 if (LLVM_UNLIKELY(!Mem))
331 return Mem.takeError();
332 auto *H =
333 new (*Mem) SubtrieHandle::Header{(uint16_t)StartBit, (uint8_t)NumBits,
334 /*ZeroPad1B=*/0, /*ZeroPad4B=*/0};
335 SubtrieHandle S(Alloc.getRegion(), *H);
336 for (auto I = S.Slots.begin(), E = S.Slots.end(); I != E; ++I)
337 new (I) SlotT(0);
338 return S;
339}
340
341SubtrieHandle TrieRawHashMapHandle::getRoot() const {
342 if (int64_t Root = H->RootTrieOffset)
343 return SubtrieHandle(getRegion(), SubtrieSlotValue::getSubtrieOffset(Root));
344 return SubtrieHandle();
345}
346
348TrieRawHashMapHandle::getOrCreateRoot(MappedFileRegionArena &Alloc) {
349 assert(&Alloc.getRegion() == &getRegion());
350 if (SubtrieHandle Root = getRoot())
351 return Root;
352
353 int64_t Race = 0;
354 auto LazyRoot = SubtrieHandle::create(Alloc, 0, H->NumSubtrieBits);
355 if (LLVM_UNLIKELY(!LazyRoot))
356 return LazyRoot.takeError();
357 if (H->RootTrieOffset.compare_exchange_strong(
358 Race, LazyRoot->getOffset().asSubtrie()))
359 return *LazyRoot;
360
361 // There was a race. Return the other root.
362 //
363 // TODO: Avoid leaking the lazy root by storing it in an allocator.
364 return SubtrieHandle(getRegion(), SubtrieSlotValue::getSubtrieOffset(Race));
365}
366
368TrieRawHashMapHandle::create(MappedFileRegionArena &Alloc, StringRef Name,
369 std::optional<uint64_t> NumRootBits,
370 uint64_t NumSubtrieBits, uint64_t NumHashBits,
371 uint64_t RecordDataSize) {
372 // Allocate.
373 auto Offset = Alloc.allocateOffset(sizeof(Header) + Name.size() + 1);
374 if (LLVM_UNLIKELY(!Offset))
375 return Offset.takeError();
376
377 // Construct the header and the name.
378 assert(Name.size() <= UINT16_MAX && "Expected smaller table name");
379 assert(NumSubtrieBits <= UINT8_MAX && "Expected valid subtrie bits");
380 assert(NumHashBits <= UINT16_MAX && "Expected valid hash size");
381 assert(RecordDataSize <= UINT32_MAX && "Expected smaller table name");
382 auto *H = new (Alloc.getRegion().data() + *Offset)
384 (uint32_t)sizeof(Header)},
385 (uint8_t)NumSubtrieBits,
386 /*Flags=*/0,
387 (uint16_t)NumHashBits,
388 (uint32_t)RecordDataSize,
389 /*RootTrieOffset=*/{0},
390 /*AllocatorOffset=*/{0}};
391 char *NameStorage = reinterpret_cast<char *>(H + 1);
392 llvm::copy(Name, NameStorage);
393 NameStorage[Name.size()] = 0;
394
395 // Construct a root trie, if requested.
396 TrieRawHashMapHandle Trie(Alloc.getRegion(), *H);
397 auto Sub = SubtrieHandle::create(Alloc, 0, *NumRootBits);
398 if (LLVM_UNLIKELY(!Sub))
399 return Sub.takeError();
400 if (NumRootBits)
401 H->RootTrieOffset = Sub->getOffset().asSubtrie();
402 return Trie;
403}
404
405TrieRawHashMapHandle::RecordData
406TrieRawHashMapHandle::getRecord(SubtrieSlotValue Offset) {
407 char *Begin = Region->data() + Offset.asData();
409 Proxy.Data = MutableArrayRef(Begin, getRecordDataSize());
410 Proxy.Hash = ArrayRef(reinterpret_cast<const uint8_t *>(Proxy.Data.end()),
411 getNumHashBytes());
412 return RecordData{Proxy, Offset};
413}
414
416TrieRawHashMapHandle::createRecord(MappedFileRegionArena &Alloc,
417 ArrayRef<uint8_t> Hash) {
418 assert(&Alloc.getRegion() == Region);
419 assert(Hash.size() == getNumHashBytes());
420 auto Offset = Alloc.allocateOffset(getRecordSize());
421 if (LLVM_UNLIKELY(!Offset))
422 return Offset.takeError();
423
424 RecordData Record = getRecord(SubtrieSlotValue::getDataOffset(*Offset));
425 llvm::copy(Hash, const_cast<uint8_t *>(Record.Proxy.Hash.begin()));
426 return Record;
427}
428
431 // Check alignment.
433 return createStringError(make_error_code(std::errc::protocol_error),
434 "unaligned file offset at 0x" +
435 utohexstr(Offset.get(), /*LowerCase=*/true));
436
437 // Check bounds.
438 //
439 // Note: There's no potential overflow when using \c uint64_t because Offset
440 // is in valid offset range and the record size is in \c [0,UINT32_MAX].
441 if (!validOffset(Offset) ||
442 Offset.get() + Impl->Trie.getRecordSize() > Impl->File.getAlloc().size())
443 return createStringError(make_error_code(std::errc::protocol_error),
444 "file offset too large: 0x" +
445 utohexstr(Offset.get(), /*LowerCase=*/true));
446
447 // Looks okay...
448 TrieRawHashMapHandle::RecordData D =
449 Impl->Trie.getRecord(SubtrieSlotValue::getDataOffset(Offset));
450 return const_pointer(D.Proxy, D.getFileOffset());
451}
452
454OnDiskTrieRawHashMap::find(ArrayRef<uint8_t> Hash) const {
455 TrieRawHashMapHandle Trie = Impl->Trie;
456 assert(Hash.size() == Trie.getNumHashBytes() && "Invalid hash");
457
458 SubtrieHandle S = Trie.getRoot();
459 if (!S)
460 return const_pointer();
461
462 TrieHashIndexGenerator IndexGen = Trie.getIndexGen(S, Hash);
463 size_t Index = IndexGen.next();
464 for (;;) {
465 // Try to set the content.
466 SubtrieSlotValue V = S.load(Index);
467 if (!V)
468 return const_pointer();
469
470 // Check for an exact match.
471 if (V.isData()) {
472 TrieRawHashMapHandle::RecordData D = Trie.getRecord(V);
473 return D.Proxy.Hash == Hash ? const_pointer(D.Proxy, D.getFileOffset())
474 : const_pointer();
475 }
476
477 Index = IndexGen.next();
478 S = SubtrieHandle(Trie.getRegion(), V);
479 }
480}
481
482/// Only safe if the subtrie is empty.
483void SubtrieHandle::reinitialize(uint32_t StartBit, uint32_t NumBits) {
484 assert(StartBit > H->StartBit);
485 assert(NumBits <= H->NumBits);
486 // Ideally would also assert that all slots are empty, but that's expensive.
487
488 H->StartBit = StartBit;
489 H->NumBits = NumBits;
490}
491
/// Find the record for \p Hash, inserting a new one if none exists.
///
/// \param OnConstruct if set, called once right after a new record has been
/// allocated (before it is published into a slot).
/// \param OnLeak if set, called when a record was allocated by this call but
/// an existing record with the same hash is returned instead.
///
/// Returns a pointer to the inserted or pre-existing record, or an error if
/// allocating the root, a record, or a subtrie fails.
Expected<OnDiskTrieRawHashMap::pointer>
OnDiskTrieRawHashMap::insertLazy(ArrayRef<uint8_t> Hash,
                                 LazyInsertOnConstructCB OnConstruct,
                                 LazyInsertOnLeakCB OnLeak) {
  TrieRawHashMapHandle Trie = Impl->Trie;
  assert(Hash.size() == Trie.getNumHashBytes() && "Invalid hash");

  MappedFileRegionArena &Alloc = Impl->File.getAlloc();
  std::optional<SubtrieHandle> S;
  auto Err = Trie.getOrCreateRoot(Alloc).moveInto(S);
  if (LLVM_UNLIKELY(Err))
    return std::move(Err);

  TrieHashIndexGenerator IndexGen = Trie.getIndexGen(*S, Hash);
  size_t Index = IndexGen.next();

  // Walk through the hash bytes and insert into correct trie position.
  // NewRecord is created at most once and reused across retries;
  // UnusedSubtrie carries a subtrie left over from a lost race in sink().
  std::optional<TrieRawHashMapHandle::RecordData> NewRecord;
  SubtrieHandle UnusedSubtrie;
  for (;;) {
    SubtrieSlotValue Existing = S->load(Index);

    // Try to set it, if it's empty.
    if (!Existing) {
      if (!NewRecord) {
        auto Err = Trie.createRecord(Alloc, Hash).moveInto(NewRecord);
        if (LLVM_UNLIKELY(Err))
          return std::move(Err);
        if (OnConstruct)
          OnConstruct(NewRecord->Offset.asDataFileOffset(), NewRecord->Proxy);
      }

      // On failure the exchange overwrites Existing with the slot's current
      // value, which is what the code below inspects.
      if (S->compare_exchange_strong(Index, Existing, NewRecord->Offset))
        return pointer(NewRecord->Proxy, NewRecord->Offset.asDataFileOffset());

      // Race means that Existing is no longer empty; fall through...
    }

    // The slot holds a subtrie: descend and retry with the next index.
    if (Existing.isSubtrie()) {
      S = SubtrieHandle(Trie.getRegion(), Existing);
      Index = IndexGen.next();
      continue;
    }

    // Check for an exact match.
    TrieRawHashMapHandle::RecordData ExistingRecord = Trie.getRecord(Existing);
    if (ExistingRecord.Proxy.Hash == Hash) {
      if (NewRecord && OnLeak)
        OnLeak(NewRecord->Offset.asDataFileOffset(), NewRecord->Proxy,
               ExistingRecord.Offset.asDataFileOffset(), ExistingRecord.Proxy);
      return pointer(ExistingRecord.Proxy,
                     ExistingRecord.Offset.asDataFileOffset());
    }

    // Sink the existing content as long as the indexes match.
    for (;;) {
      size_t NextIndex = IndexGen.next();
      size_t NewIndexForExistingContent =
          IndexGen.getCollidingBits(ExistingRecord.Proxy.Hash);

      // sink() returns the subtrie now living at Index (ours, or the one a
      // concurrent writer installed); continue from there.
      auto Err = S->sink(Index, Existing, Alloc, IndexGen.getNumBits(),
                         UnusedSubtrie, NewIndexForExistingContent)
                     .moveInto(S);
      if (LLVM_UNLIKELY(Err))
        return std::move(Err);
      Index = NextIndex;

      // Found the difference.
      if (NextIndex != NewIndexForExistingContent)
        break;
    }
  }
}
565
566Expected<SubtrieHandle> SubtrieHandle::sink(size_t I, SubtrieSlotValue V,
568 size_t NumSubtrieBits,
569 SubtrieHandle &UnusedSubtrie,
570 size_t NewI) {
571 std::optional<SubtrieHandle> NewS;
572 if (UnusedSubtrie) {
573 // Steal UnusedSubtrie and initialize it.
574 NewS.emplace();
575 std::swap(*NewS, UnusedSubtrie);
576 NewS->reinitialize(getStartBit() + getNumBits(), NumSubtrieBits);
577 } else {
578 // Allocate a new, empty subtrie.
579 auto Err = SubtrieHandle::create(Alloc, getStartBit() + getNumBits(),
580 NumSubtrieBits)
581 .moveInto(NewS);
582 if (LLVM_UNLIKELY(Err))
583 return std::move(Err);
584 }
585
586 NewS->store(NewI, V);
587 if (compare_exchange_strong(I, V, NewS->getOffset()))
588 return *NewS; // Success!
589
590 // Raced.
591 assert(V.isSubtrie() && "Expected racing sink() to add a subtrie");
592
593 // Wipe out the new slot so NewS can be reused and set the out parameter.
594 NewS->store(NewI, SubtrieSlotValue());
595 UnusedSubtrie = *NewS;
596
597 // Return the subtrie added by the concurrent sink() call.
598 return SubtrieHandle(Alloc.getRegion(), V);
599}
600
602 raw_ostream &OS, function_ref<void(ArrayRef<char>)> PrintRecordData) const {
603 Impl->Trie.print(OS, PrintRecordData);
604}
605
607 function_ref<Error(FileOffset, ConstValueProxy)> RecordVerifier) const {
608 return Impl->Trie.validate(RecordVerifier);
609}
610
611// Helper function that prints hexdigit and have a sub-byte starting position.
612static void printHexDigits(raw_ostream &OS, ArrayRef<uint8_t> Bytes,
613 size_t StartBit, size_t NumBits) {
614 assert(StartBit % 4 == 0);
615 assert(NumBits % 4 == 0);
616 for (size_t I = StartBit, E = StartBit + NumBits; I != E; I += 4) {
617 uint8_t HexPair = Bytes[I / 8];
618 uint8_t HexDigit = I % 8 == 0 ? HexPair >> 4 : HexPair & 0xf;
619 OS << hexdigit(HexDigit, /*LowerCase=*/true);
620 }
621}
622
623static void printBits(raw_ostream &OS, ArrayRef<uint8_t> Bytes, size_t StartBit,
624 size_t NumBits) {
625 assert(StartBit + NumBits <= Bytes.size() * 8u);
626 for (size_t I = StartBit, E = StartBit + NumBits; I != E; ++I) {
627 uint8_t Byte = Bytes[I / 8];
628 size_t ByteOffset = I % 8;
629 if (size_t ByteShift = 8 - ByteOffset - 1)
630 Byte >>= ByteShift;
631 OS << (Byte & 0x1 ? '1' : '0');
632 }
633}
634
635void SubtrieHandle::printHash(raw_ostream &OS, ArrayRef<uint8_t> Bytes) const {
636 // afb[1c:00*01110*0]def
637 size_t EndBit = getStartBit() + getNumBits();
638 size_t HashEndBit = Bytes.size() * 8u;
639
640 size_t FirstBinaryBit = getStartBit() & ~0x3u;
641 printHexDigits(OS, Bytes, 0, FirstBinaryBit);
642
643 size_t LastBinaryBit = (EndBit + 3u) & ~0x3u;
644 OS << "[";
645 printBits(OS, Bytes, FirstBinaryBit, LastBinaryBit - FirstBinaryBit);
646 OS << "]";
647
648 printHexDigits(OS, Bytes, LastBinaryBit, HashEndBit - LastBinaryBit);
649}
650
// Append the binary representation of Index to Prefix, most significant bit
// first, using as many digits as there are doublings from 1 up to NumSlots
// (i.e. lg(NumSlots) digits for a power-of-two NumSlots; none for 1 slot).
static void appendIndexBits(std::string &Prefix, size_t Index,
                            size_t NumSlots) {
  // Count the digits first so they can be emitted directly in MSB-first order
  // without building and reversing a temporary string.
  unsigned Width = 0;
  for (size_t Span = 1u; Span < NumSlots; Span <<= 1)
    ++Width;

  for (unsigned Bit = Width; Bit-- > 0;)
    Prefix.push_back('0' + ((Index >> Bit) & 0x1));
}
661
662static void printPrefix(raw_ostream &OS, StringRef Prefix) {
663 while (Prefix.size() >= 4) {
664 uint8_t Digit;
665 bool ErrorParsingBinary = Prefix.take_front(4).getAsInteger(2, Digit);
666 assert(!ErrorParsingBinary);
667 (void)ErrorParsingBinary;
668 OS << hexdigit(Digit, /*LowerCase=*/true);
669 Prefix = Prefix.drop_front(4);
670 }
671 if (!Prefix.empty())
672 OS << "[" << Prefix << "]";
673}
674
676
677static Expected<size_t> checkParameter(StringRef Label, size_t Max,
678 std::optional<size_t> Value,
679 std::optional<size_t> Default,
680 StringRef Path, StringRef TableName) {
681 assert(Value || Default);
682 assert(!Default || *Default <= Max);
683 if (!Value)
684 return *Default;
685
686 if (*Value <= Max)
687 return *Value;
689 std::errc::argument_out_of_domain, Path, TableName,
690 "invalid " + Label + ": " + Twine(*Value) + " (max: " + Twine(Max) + ")");
691}
692
/// Returns the size reported by the underlying database file.
size_t OnDiskTrieRawHashMap::size() const { return Impl->File.size(); }
/// Returns the size of the database file's mapped region.
size_t OnDiskTrieRawHashMap::capacity() const {
  return Impl->File.getRegion().size();
}
697
698Expected<OnDiskTrieRawHashMap>
699OnDiskTrieRawHashMap::create(const Twine &PathTwine, const Twine &TrieNameTwine,
700 size_t NumHashBits, uint64_t DataSize,
701 uint64_t MaxFileSize,
702 std::optional<uint64_t> NewFileInitialSize,
703 std::optional<size_t> NewTableNumRootBits,
704 std::optional<size_t> NewTableNumSubtrieBits) {
705 SmallString<128> PathStorage;
706 StringRef Path = PathTwine.toStringRef(PathStorage);
707 SmallString<128> TrieNameStorage;
708 StringRef TrieName = TrieNameTwine.toStringRef(TrieNameStorage);
709
710 constexpr size_t DefaultNumRootBits = 10;
711 constexpr size_t DefaultNumSubtrieBits = 6;
712
713 size_t NumRootBits;
714 if (Error E = checkParameter(
715 "root bits", TrieRawHashMapHandle::MaxNumRootBits,
716 NewTableNumRootBits, DefaultNumRootBits, Path, TrieName)
717 .moveInto(NumRootBits))
718 return std::move(E);
719
720 size_t NumSubtrieBits;
721 if (Error E = checkParameter("subtrie bits",
722 TrieRawHashMapHandle::MaxNumSubtrieBits,
723 NewTableNumSubtrieBits, DefaultNumSubtrieBits,
724 Path, TrieName)
725 .moveInto(NumSubtrieBits))
726 return std::move(E);
727
728 size_t NumHashBytes = NumHashBits >> 3;
729 if (Error E =
730 checkParameter("hash size", TrieRawHashMapHandle::MaxNumHashBits,
731 NumHashBits, std::nullopt, Path, TrieName)
732 .takeError())
733 return std::move(E);
734 assert(NumHashBits == NumHashBytes << 3 &&
735 "Expected hash size to be byte-aligned");
736 if (NumHashBits != NumHashBytes << 3)
738 std::errc::argument_out_of_domain, Path, TrieName,
739 "invalid hash size: " + Twine(NumHashBits) + " (not byte-aligned)");
740
741 // Constructor for if the file doesn't exist.
742 auto NewDBConstructor = [&](DatabaseFile &DB) -> Error {
743 auto Trie =
744 TrieRawHashMapHandle::create(DB.getAlloc(), TrieName, NumRootBits,
745 NumSubtrieBits, NumHashBits, DataSize);
746 if (LLVM_UNLIKELY(!Trie))
747 return Trie.takeError();
748
749 return DB.addTable(*Trie);
750 };
751
752 // Get or create the file.
753 Expected<DatabaseFile> File =
754 DatabaseFile::create(Path, MaxFileSize, NewDBConstructor);
755 if (!File)
756 return File.takeError();
757
758 // Find the trie and validate it.
759 std::optional<TableHandle> Table = File->findTable(TrieName);
760 if (!Table)
761 return createTableConfigError(std::errc::argument_out_of_domain, Path,
762 TrieName, "table not found");
763 if (Error E = checkTable("table kind", (size_t)TrieRawHashMapHandle::Kind,
764 (size_t)Table->getHeader().Kind, Path, TrieName))
765 return std::move(E);
766 auto Trie = Table->cast<TrieRawHashMapHandle>();
767 assert(Trie && "Already checked the kind");
768
769 // Check the hash and data size.
770 if (Error E = checkTable("hash size", NumHashBits, Trie.getNumHashBits(),
771 Path, TrieName))
772 return std::move(E);
773 if (Error E = checkTable("data size", DataSize, Trie.getRecordDataSize(),
774 Path, TrieName))
775 return std::move(E);
776
777 // No flags supported right now. Either corrupt, or coming from a future
778 // writer.
779 if (size_t Flags = Trie.getFlags())
780 return createTableConfigError(std::errc::invalid_argument, Path, TrieName,
781 "unsupported flags: " + Twine(Flags));
782
783 // Success.
784 OnDiskTrieRawHashMap::ImplType Impl{DatabaseFile(std::move(*File)), Trie};
785 return OnDiskTrieRawHashMap(std::make_unique<ImplType>(std::move(Impl)));
786}
787
788static Error createInvalidTrieError(uint64_t Offset, const Twine &Msg) {
789 return createStringError(make_error_code(std::errc::protocol_error),
790 "invalid trie at 0x" +
791 utohexstr(Offset, /*LowerCase=*/true) + ": " +
792 Msg);
793}
794
795//===----------------------------------------------------------------------===//
796// TrieVisitor data structures.
797//===----------------------------------------------------------------------===//
798
799namespace {
/// A multi-threaded visitor to traverse the Trie.
///
/// TODO: add more sanity checks that go beyond plain data corruption. For
/// example, some ill-formed data can be constructed to form a cycle using
/// Sub-Tries, and that can lead to an infinite loop when visiting (or
/// inserting data).
806class TrieVisitor {
807public:
808 TrieVisitor(TrieRawHashMapHandle Trie, unsigned ThreadCount = 0,
809 unsigned ErrorLimit = 50)
810 : Trie(Trie), ErrorLimit(ErrorLimit),
812 virtual ~TrieVisitor() = default;
813 Error visit();
814
815private:
816 // Virtual method to implement the action when visiting a sub-trie.
817 virtual Error visitSubTrie(StringRef Prefix, SubtrieHandle SubTrie) {
818 return Error::success();
819 }
820
821 // Virtual method to implement the action when visiting a slot in a trie node.
822 virtual Error visitSlot(unsigned I, SubtrieHandle Subtrie, StringRef Prefix,
823 SubtrieSlotValue Slot) {
824 return Error::success();
825 }
826
827protected:
828 TrieRawHashMapHandle Trie;
829
830private:
831 Error traverseTrieNode(SubtrieHandle Node, StringRef Prefix);
832
833 Error validateSubTrie(SubtrieHandle Node, bool IsRoot);
834
835 // Helper function to capture errors when visiting the trie nodes.
836 void addError(Error NewError) {
837 assert(NewError && "not an error");
838 std::lock_guard<std::mutex> ErrorLock(Lock);
839 if (NumError >= ErrorLimit) {
840 // Too many errors.
841 consumeError(std::move(NewError));
842 return;
843 }
844
845 if (Err)
846 Err = joinErrors(std::move(*Err), std::move(NewError));
847 else
848 Err = std::move(NewError);
849 NumError++;
850 }
851
852 bool tooManyErrors() {
853 std::lock_guard<std::mutex> ErrorLock(Lock);
854 return (bool)Err && NumError >= ErrorLimit;
855 }
856
857 const unsigned ErrorLimit;
858 std::optional<Error> Err;
859 unsigned NumError = 0;
860 std::mutex Lock;
861 DefaultThreadPool Threads;
862};
863
864/// A visitor that traverse and print the Trie.
865class TriePrinter : public TrieVisitor {
866public:
867 TriePrinter(TrieRawHashMapHandle Trie, raw_ostream &OS,
868 function_ref<void(ArrayRef<char>)> PrintRecordData)
869 : TrieVisitor(Trie, /*ThreadCount=*/1), OS(OS),
870 PrintRecordData(PrintRecordData) {}
871
872 Error printRecords() {
873 if (Records.empty())
874 return Error::success();
875
876 OS << "records\n";
877 llvm::sort(Records);
878 for (int64_t Offset : Records) {
879 TrieRawHashMapHandle::RecordData Record =
880 Trie.getRecord(SubtrieSlotValue::getDataOffset(Offset));
881 if (auto Err = printRecord(Record))
882 return Err;
883 }
884 return Error::success();
885 }
886
887 Error printRecord(TrieRawHashMapHandle::RecordData &Record) {
888 OS << "- addr=" << (void *)Record.getFileOffset().get() << " ";
889 if (PrintRecordData) {
890 PrintRecordData(Record.Proxy.Data);
891 } else {
892 OS << "bytes=";
893 ArrayRef<uint8_t> Data(
894 reinterpret_cast<const uint8_t *>(Record.Proxy.Data.data()),
895 Record.Proxy.Data.size());
896 printHexDigits(OS, Data, 0, Data.size() * 8);
897 }
898 OS << "\n";
899 return Error::success();
900 }
901
902 Error visitSubTrie(StringRef Prefix, SubtrieHandle SubTrie) override {
903 if (Prefix.empty()) {
904 OS << "root";
905 } else {
906 OS << "subtrie=";
907 printPrefix(OS, Prefix);
908 }
909
910 OS << " addr="
911 << (void *)(reinterpret_cast<const char *>(&SubTrie.getHeader()) -
912 Trie.getRegion().data());
913 OS << " num-slots=" << SubTrie.getNumSlots() << "\n";
914 return Error::success();
915 }
916
917 Error visitSlot(unsigned I, SubtrieHandle Subtrie, StringRef Prefix,
918 SubtrieSlotValue Slot) override {
919 OS << "- index=";
920 for (size_t Pad : {10, 100, 1000})
921 if (I < Pad && Subtrie.getNumSlots() >= Pad)
922 OS << "0";
923 OS << I << " ";
924 if (Slot.isSubtrie()) {
925 OS << "addr=" << (void *)Slot.asSubtrie();
926 OS << " subtrie=";
927 printPrefix(OS, Prefix);
928 OS << "\n";
929 return Error::success();
930 }
931 TrieRawHashMapHandle::RecordData Record = Trie.getRecord(Slot);
932 OS << "addr=" << (void *)Record.getFileOffset().get();
933 OS << " content=";
934 Subtrie.printHash(OS, Record.Proxy.Hash);
935 OS << "\n";
936 Records.push_back(Slot.asData());
937 return Error::success();
938 }
939
940private:
941 raw_ostream &OS;
942 function_ref<void(ArrayRef<char>)> PrintRecordData;
944};
945
946/// TrieVerifier that adds additional verification on top of the basic visitor.
947class TrieVerifier : public TrieVisitor {
948public:
949 TrieVerifier(
950 TrieRawHashMapHandle Trie,
951 function_ref<Error(FileOffset, OnDiskTrieRawHashMap::ConstValueProxy)>
952 RecordVerifier)
953 : TrieVisitor(Trie), RecordVerifier(RecordVerifier) {}
954
955private:
956 Error visitSubTrie(StringRef Prefix, SubtrieHandle SubTrie) final {
957 return Error::success();
958 }
959
960 Error visitSlot(unsigned I, SubtrieHandle Subtrie, StringRef Prefix,
961 SubtrieSlotValue Slot) final {
962 if (RecordVerifier && Slot.isData()) {
964 return createInvalidTrieError(Slot.asData(), "mis-aligned data entry");
965
966 TrieRawHashMapHandle::RecordData Record =
967 Trie.getRecord(SubtrieSlotValue::getDataOffset(Slot.asData()));
968 return RecordVerifier(Slot.asDataFileOffset(),
969 OnDiskTrieRawHashMap::ConstValueProxy{
970 Record.Proxy.Hash, Record.Proxy.Data});
971 }
972 return Error::success();
973 }
974
975 function_ref<Error(FileOffset, OnDiskTrieRawHashMap::ConstValueProxy)>
976 RecordVerifier;
977};
978} // namespace
979
980Error TrieVisitor::visit() {
981 auto Root = Trie.getRoot();
982 if (!Root)
983 return Error::success();
984
985 if (auto Err = validateSubTrie(Root, /*IsRoot=*/true))
986 return Err;
987
988 if (auto Err = visitSubTrie("", Root))
989 return Err;
990
992 SmallVector<std::string> Prefixes;
993 const size_t NumSlots = Root.getNumSlots();
994 for (size_t I = 0, E = NumSlots; I != E; ++I) {
995 SubtrieSlotValue Slot = Root.load(I);
996 if (!Slot)
997 continue;
998 uint64_t Offset = Slot.isSubtrie() ? Slot.asSubtrie() : Slot.asData();
999 if (Offset >= (uint64_t)Trie.getRegion().size())
1000 return createInvalidTrieError(Offset, "slot points out of bound");
1001 std::string SubtriePrefix;
1002 appendIndexBits(SubtriePrefix, I, NumSlots);
1003 if (Slot.isSubtrie()) {
1004 SubtrieHandle S(Trie.getRegion(), Slot);
1005 Subs.push_back(S);
1006 Prefixes.push_back(SubtriePrefix);
1007 }
1008 if (auto Err = visitSlot(I, Root, SubtriePrefix, Slot))
1009 return Err;
1010 }
1011
1012 for (size_t I = 0, E = Subs.size(); I != E; ++I) {
1013 Threads.async(
1014 [&](unsigned Idx) {
1015 // Don't run if there is an error already.
1016 if (tooManyErrors())
1017 return;
1018 if (auto Err = traverseTrieNode(Subs[Idx], Prefixes[Idx]))
1019 addError(std::move(Err));
1020 },
1021 I);
1022 }
1023
1024 Threads.wait();
1025 if (Err)
1026 return std::move(*Err);
1027 return Error::success();
1028}
1029
1030Error TrieVisitor::validateSubTrie(SubtrieHandle Node, bool IsRoot) {
1031 char *Addr = reinterpret_cast<char *>(&Node.getHeader());
1032 const int64_t Offset = Node.getFileOffset().get();
1033 if (Addr + Node.getSize() >=
1034 Trie.getRegion().data() + Trie.getRegion().size())
1035 return createInvalidTrieError(Offset, "subtrie node spans out of bound");
1036
1037 if (!IsRoot &&
1038 Node.getStartBit() + Node.getNumBits() > Trie.getNumHashBits()) {
1039 return createInvalidTrieError(Offset,
1040 "subtrie represents too many hash bits");
1041 }
1042
1043 if (IsRoot) {
1044 if (Node.getStartBit() != 0)
1045 return createInvalidTrieError(Offset,
1046 "root node doesn't start at 0 index");
1047
1048 return Error::success();
1049 }
1050
1051 if (Node.getNumBits() > Trie.getNumSubtrieBits())
1052 return createInvalidTrieError(Offset, "subtrie has wrong number of slots");
1053
1054 return Error::success();
1055}
1056
1057Error TrieVisitor::traverseTrieNode(SubtrieHandle Node, StringRef Prefix) {
1058 if (auto Err = validateSubTrie(Node, /*IsRoot=*/false))
1059 return Err;
1060
1061 if (auto Err = visitSubTrie(Prefix, Node))
1062 return Err;
1063
1065 SmallVector<std::string> Prefixes;
1066 const size_t NumSlots = Node.getNumSlots();
1067 for (size_t I = 0, E = NumSlots; I != E; ++I) {
1068 SubtrieSlotValue Slot = Node.load(I);
1069 if (!Slot)
1070 continue;
1071 uint64_t Offset = Slot.isSubtrie() ? Slot.asSubtrie() : Slot.asData();
1072 if (Offset >= (uint64_t)Trie.getRegion().size())
1073 return createInvalidTrieError(Offset, "slot points out of bound");
1074 std::string SubtriePrefix = Prefix.str();
1075 appendIndexBits(SubtriePrefix, I, NumSlots);
1076 if (Slot.isSubtrie()) {
1077 SubtrieHandle S(Trie.getRegion(), Slot);
1078 Subs.push_back(S);
1079 Prefixes.push_back(SubtriePrefix);
1080 }
1081 if (auto Err = visitSlot(I, Node, SubtriePrefix, Slot))
1082 return Err;
1083 }
1084 for (size_t I = 0, E = Subs.size(); I != E; ++I)
1085 if (auto Err = traverseTrieNode(Subs[I], Prefixes[I]))
1086 return Err;
1087
1088 return Error::success();
1089}
1090
1091void TrieRawHashMapHandle::print(
1092 raw_ostream &OS, function_ref<void(ArrayRef<char>)> PrintRecordData) const {
1093 OS << "hash-num-bits=" << getNumHashBits()
1094 << " hash-size=" << getNumHashBytes()
1095 << " record-data-size=" << getRecordDataSize() << "\n";
1096
1097 TriePrinter Printer(*this, OS, PrintRecordData);
1098 if (auto Err = Printer.visit())
1099 OS << "error: " << toString(std::move(Err)) << "\n";
1100
1101 if (auto Err = Printer.printRecords())
1102 OS << "error: " << toString(std::move(Err)) << "\n";
1103
1104 return;
1105}
1106
1107Error TrieRawHashMapHandle::validate(
1109 RecordVerifier) const {
1110 // Use the base TrieVisitor to identify the errors inside trie first.
1111 TrieVisitor BasicVerifier(*this);
1112 if (auto Err = BasicVerifier.visit())
1113 return Err;
1114
1115 // If the trie data structure is sound, do a second pass to verify data and
1116 // verifier function can assume the index is correct. However, there can be
1117 // newly added bad entries that can still produce error.
1118 TrieVerifier Verifier(*this, RecordVerifier);
1119 return Verifier.visit();
1120}
1121
1122#else // !LLVM_ENABLE_ONDISK_CAS
1123
1125
1127OnDiskTrieRawHashMap::create(const Twine &PathTwine, const Twine &TrieNameTwine,
1128 size_t NumHashBits, uint64_t DataSize,
1129 uint64_t MaxFileSize,
1130 std::optional<uint64_t> NewFileInitialSize,
1131 std::optional<size_t> NewTableNumRootBits,
1132 std::optional<size_t> NewTableNumSubtrieBits) {
1133 return createStringError(make_error_code(std::errc::not_supported),
1134 "OnDiskTrieRawHashMap is not supported");
1135}
1136
1139 LazyInsertOnConstructCB OnConstruct,
1140 LazyInsertOnLeakCB OnLeak) {
1141 return createStringError(make_error_code(std::errc::not_supported),
1142 "OnDiskTrieRawHashMap is not supported");
1143}
1144
1147 return createStringError(make_error_code(std::errc::not_supported),
1148 "OnDiskTrieRawHashMap is not supported");
1149}
1150
1155
1157 raw_ostream &OS, function_ref<void(ArrayRef<char>)> PrintRecordData) const {
1158}
1159
1162 RecordVerifier) const {
1163 return createStringError(make_error_code(std::errc::not_supported),
1164 "OnDiskTrieRawHashMap is not supported");
1165}
1166
1167size_t OnDiskTrieRawHashMap::size() const { return 0; }
1168size_t OnDiskTrieRawHashMap::capacity() const { return 0; }
1169
1170#endif // LLVM_ENABLE_ONDISK_CAS
1171
1172OnDiskTrieRawHashMap::OnDiskTrieRawHashMap(std::unique_ptr<ImplType> Impl)
1173 : Impl(std::move(Impl)) {}
1175 default;
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Mark last scratch load
AMDGPU Prepare AGPR Alloc
static void print(raw_ostream &Out, object::Archive::Kind Kind, T Val)
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
#define LLVM_UNLIKELY(EXPR)
Definition Compiler.h:336
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
Definition Compiler.h:638
dxil pretty DXIL Metadata Pretty Printer
This file declares the common interface for a DatabaseFile that is used to implement OnDiskCAS.
static DeltaTreeNode * getRoot(void *Root)
static bool sink(Instruction &I, LoopInfo *LI, DominatorTree *DT, const Loop *CurLoop, ICFLoopSafetyInfo *SafetyInfo, MemorySSAUpdater &MSSAU, OptimizationRemarkEmitter *ORE)
When an instruction is found to only be used outside of the loop, this function moves it to the exit ...
Definition LICM.cpp:1577
#define I(x, y, z)
Definition MD5.cpp:58
#define H(x, y, z)
Definition MD5.cpp:57
This file declares interface for MappedFileRegionArena, a bump pointer allocator, backed by a memory-...
This file declares interface for OnDiskTrieRawHashMap, a thread-safe and (mostly) lock-free hash map ...
void visit(MachineFunction &MF, MachineBasicBlock &Start, std::function< void(MachineBasicBlock *)> op)
verify safepoint Safepoint IR Verifier
static Split data
This file contains some functions that are useful when dealing with strings.
static RecordT createRecord(const CVSymbol &sym)
static uint32_t getFlags(const Symbol *Sym)
Definition TapiFile.cpp:26
static cl::opt< int > ThreadCount("threads", cl::init(0))
static unsigned getSize(unsigned Kind)
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41
size_t size() const
size - Get the array size.
Definition ArrayRef.h:147
Lightweight error class with error context and mandatory checking.
Definition Error.h:159
static ErrorSuccess success()
Create a success value.
Definition Error.h:336
Tagged union holding either a T or a Error.
Definition Error.h:485
iterator end() const
Definition ArrayRef.h:348
void push_back(const T &Elt)
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
StringRef toStringRef(SmallVectorImpl< char > &Out) const
This returns the twine as a single StringRef if it can be represented as such.
Definition Twine.h:461
FileOffset is a wrapper around uint64_t to represent the offset of data from the beginning of the fil...
Definition FileOffset.h:24
Allocator for an owned mapped file region that supports thread-safe and process-safe bump pointer all...
static constexpr Align getAlign()
Minimum alignment for allocations, currently hardcoded to 8B.
OnDiskTrieRawHashMap is a persistent trie data structure used as hash maps.
const_pointer find(ArrayRef< uint8_t > Hash) const
Find the value from hash.
OnDiskTrieRawHashMap(OnDiskTrieRawHashMap &&RHS)
Expected< pointer > insertLazy(ArrayRef< uint8_t > Hash, LazyInsertOnConstructCB OnConstruct=nullptr, LazyInsertOnLeakCB OnLeak=nullptr)
Insert lazily.
function_ref< void(FileOffset TentativeOffset, ValueProxy TentativeValue)> LazyInsertOnConstructCB
Error validate(function_ref< Error(FileOffset, ConstValueProxy)> RecordVerifier) const
Validate the trie data structure.
static Expected< OnDiskTrieRawHashMap > create(const Twine &Path, const Twine &TrieName, size_t NumHashBits, uint64_t DataSize, uint64_t MaxFileSize, std::optional< uint64_t > NewFileInitialSize, std::optional< size_t > NewTableNumRootBits=std::nullopt, std::optional< size_t > NewTableNumSubtrieBits=std::nullopt)
Gets or creates a file at Path with a hash-mapped trie named TrieName.
LLVM_DUMP_METHOD void dump() const
Expected< const_pointer > recoverFromFileOffset(FileOffset Offset) const
Helper function to recover a pointer into the trie from file offset.
static bool validOffset(FileOffset Offset)
Check the valid range of file offset for OnDiskTrieRawHashMap.
OnDiskTrieRawHashMap & operator=(OnDiskTrieRawHashMap &&RHS)
void print(raw_ostream &OS, function_ref< void(ArrayRef< char >)> PrintRecordData=nullptr) const
function_ref< void(FileOffset TentativeOffset, ValueProxy TentativeValue, FileOffset FinalOffset, ValueProxy FinalValue)> LazyInsertOnLeakCB
static Expected< DatabaseFile > create(const Twine &Path, uint64_t Capacity, function_ref< Error(DatabaseFile &)> NewDBConstructor)
Create the DatabaseFile at Path with Capacity.
An efficient, type-erasing, non-owning reference to a callable.
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53
llvm::SmallVector< std::shared_ptr< RecordsSlice >, 4 > Records
void validate(const Triple &TT, const FeatureBitset &FeatureBits)
Error createTableConfigError(std::errc ErrC, StringRef Path, StringRef TableName, const Twine &Msg)
MappedFileRegionArena::RegionT MappedFileRegion
Error checkTable(StringRef Label, size_t Expected, size_t Observed, StringRef Path, StringRef TrieName)
NodeAddr< NodeBase * > Node
Definition RDFGraph.h:381
This is an optimization pass for GlobalISel generic memory operations.
ThreadPoolStrategy hardware_concurrency(unsigned ThreadCount=0)
Returns a default thread strategy where all available hardware resources are to be used,...
Definition Threading.h:185
@ Offset
Definition DWP.cpp:477
FunctionAddr VTableAddr Value
Definition InstrProf.h:137
std::error_code make_error_code(BitcodeError E)
bool isAligned(Align Lhs, uint64_t SizeInBytes)
Checks that SizeInBytes is a multiple of the alignment.
Definition Alignment.h:134
FunctionAddr VTableAddr uintptr_t uintptr_t DataSize
Definition InstrProf.h:267
std::string utohexstr(uint64_t X, bool LowerCase=false, unsigned Width=0)
Error createStringError(std::error_code EC, char const *Fmt, const Ts &... Vals)
Create formatted StringError object.
Definition Error.h:1305
static Error getOffset(const SymbolRef &Sym, SectionRef Sec, uint64_t &Result)
auto reverse(ContainerTy &&C)
Definition STLExtras.h:408
Error joinErrors(Error E1, Error E2)
Concatenate errors.
Definition Error.h:442
void sort(IteratorTy Start, IteratorTy End)
Definition STLExtras.h:1624
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207
char hexdigit(unsigned X, bool LowerCase=false)
hexdigit - Return the hexadecimal character for the given number X (which should be less than 16).
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189
@ Sub
Subtraction of integers.
SingleThreadExecutor DefaultThreadPool
Definition ThreadPool.h:250
ArrayRef(const T &OneElt) -> ArrayRef< T >
std::string toString(const APInt &I, unsigned Radix, bool Signed, bool formatAsCLiteral=false, bool UpperCase=true, bool InsertSeparators=false)
OutputIt copy(R &&Range, OutputIt Out)
Definition STLExtras.h:1815
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1847
@ Default
The result values are uniform if and only if all operands are uniform.
Definition Uniformity.h:20
void consumeError(Error Err)
Consume a Error without doing anything.
Definition Error.h:1083
Implement std::hash so that hash_code can be used in STL containers.
Definition BitVector.h:870
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:872
size_t getCollidingBits(ArrayRef< uint8_t > CollidingBits) const
Const value proxy to access the records stored in TrieRawHashMap.
Value proxy to access the records stored in TrieRawHashMap.