19#include "llvm/Config/llvm-config.h"
28#if LLVM_ENABLE_ONDISK_CAS
37class TrieRawHashMapHandle;
43class SubtrieSlotValue {
45 explicit operator bool()
const {
return !isEmpty(); }
46 bool isEmpty()
const {
return !
Offset; }
47 bool isData()
const {
return Offset > 0; }
48 bool isSubtrie()
const {
return Offset < 0; }
49 uint64_t asData()
const {
53 uint64_t asSubtrie()
const {
58 FileOffset asSubtrieFileOffset()
const {
return FileOffset(asSubtrie()); }
60 FileOffset asDataFileOffset()
const {
return FileOffset(asData()); }
62 int64_t getRawOffset()
const {
return Offset; }
64 static SubtrieSlotValue getDataOffset(int64_t
Offset) {
65 return SubtrieSlotValue(
Offset);
68 static SubtrieSlotValue getSubtrieOffset(int64_t
Offset) {
69 return SubtrieSlotValue(-
Offset);
72 static SubtrieSlotValue getDataOffset(FileOffset
Offset) {
73 return getDataOffset(
Offset.get());
76 static SubtrieSlotValue getSubtrieOffset(FileOffset
Offset) {
77 return getDataOffset(
Offset.get());
80 static SubtrieSlotValue getFromSlot(std::atomic<int64_t> &Slot) {
81 return SubtrieSlotValue(
Slot.load());
84 SubtrieSlotValue() =
default;
87 friend class SubtrieHandle;
115 using SlotT = std::atomic<int64_t>;
117 static int64_t getSlotsSize(uint32_t NumBits) {
118 return sizeof(int64_t) * (1ull << NumBits);
121 static int64_t
getSize(uint32_t NumBits) {
122 return sizeof(SubtrieHandle::Header) + getSlotsSize(NumBits);
126 size_t getNumSlots()
const {
return Slots.size(); }
128 SubtrieSlotValue
load(
size_t I)
const {
129 return SubtrieSlotValue(Slots[
I].
load());
131 void store(
size_t I, SubtrieSlotValue V) {
132 return Slots[
I].store(
V.getRawOffset());
135 void printHash(raw_ostream &OS, ArrayRef<uint8_t> Bytes)
const;
138 bool compare_exchange_strong(
size_t I, SubtrieSlotValue &Expected,
139 SubtrieSlotValue New) {
140 SubtrieSlotValue SaveExpected(Expected);
141 bool Result = Slots[
I].compare_exchange_strong(Expected.Offset,
New.Offset);
144 SaveExpected.Offset,
New.Offset,
159 Expected<SubtrieHandle>
sink(
size_t I, SubtrieSlotValue V,
160 MappedFileRegionArena &
Alloc,
161 size_t NumSubtrieBits,
162 SubtrieHandle &UnusedSubtrie,
size_t NewI);
165 void reinitialize(uint32_t StartBit, uint32_t NumBits);
168 return SubtrieSlotValue::getSubtrieOffset(
169 reinterpret_cast<const char *
>(
H) -
Region->data());
172 FileOffset getFileOffset()
const {
return getOffset().asSubtrieFileOffset(); }
174 explicit operator bool()
const {
return H; }
176 Header &getHeader()
const {
return *
H; }
177 uint32_t getStartBit()
const {
return H->StartBit; }
178 uint32_t getNumBits()
const {
return H->NumBits; }
180 static Expected<SubtrieHandle> create(MappedFileRegionArena &
Alloc,
181 uint32_t StartBit, uint32_t NumBits,
182 OnDiskCASLogger *Logger);
186 OnDiskCASLogger *Logger) {
187 return SubtrieHandle(Region, SubtrieSlotValue::getSubtrieOffset(
Offset),
191 SubtrieHandle() =
default;
195 OnDiskCASLogger *Logger)
205 OnDiskCASLogger *Logger =
nullptr;
228class TrieRawHashMapHandle {
231 TableHandle::TableKind::TrieRawHashMap;
234 TableHandle::Header GenericHeader;
235 uint8_t NumSubtrieBits;
237 uint16_t NumHashBits;
238 uint32_t RecordDataSize;
239 std::atomic<int64_t> RootTrieOffset;
240 std::atomic<int64_t> AllocatorOffset;
243 operator TableHandle()
const {
245 return TableHandle();
246 return TableHandle(*Region,
H->GenericHeader);
250 OnDiskTrieRawHashMap::ValueProxy Proxy;
252 FileOffset getFileOffset()
const {
return Offset.asDataFileOffset(); }
255 enum Limits :
size_t {
257 MaxNumHashBytes = UINT16_MAX >> 3,
258 MaxNumHashBits = MaxNumHashBytes << 3,
266 MaxNumSubtrieBits = 10,
269 static constexpr size_t getNumHashBytes(
size_t NumHashBits) {
270 assert(NumHashBits % 8 == 0);
271 return NumHashBits / 8;
273 static constexpr size_t getRecordSize(
size_t RecordDataSize,
274 size_t NumHashBits) {
275 return RecordDataSize + getNumHashBytes(NumHashBits);
278 RecordData getRecord(SubtrieSlotValue
Offset);
280 ArrayRef<uint8_t> Hash);
282 explicit operator bool()
const {
return H; }
283 const Header &getHeader()
const {
return *
H; }
285 Expected<SubtrieHandle> getOrCreateRoot(MappedFileRegionArena &
Alloc);
288 size_t getFlags()
const {
return H->Flags; }
289 size_t getNumSubtrieBits()
const {
return H->NumSubtrieBits; }
290 size_t getNumHashBits()
const {
return H->NumHashBits; }
291 size_t getNumHashBytes()
const {
return getNumHashBytes(
H->NumHashBits); }
292 size_t getRecordDataSize()
const {
return H->RecordDataSize; }
293 size_t getRecordSize()
const {
294 return getRecordSize(
H->RecordDataSize,
H->NumHashBits);
297 TrieHashIndexGenerator getIndexGen(SubtrieHandle Root,
298 ArrayRef<uint8_t> Hash) {
299 assert(Root.getStartBit() == 0);
302 return TrieHashIndexGenerator{Root.getNumBits(), getNumSubtrieBits(), Hash};
305 static Expected<TrieRawHashMapHandle>
306 create(MappedFileRegionArena &
Alloc, StringRef Name,
307 std::optional<uint64_t> NumRootBits, uint64_t NumSubtrieBits,
308 uint64_t NumHashBits, uint64_t RecordDataSize,
309 std::shared_ptr<OnDiskCASLogger> Logger);
312 print(raw_ostream &OS,
313 function_ref<
void(ArrayRef<char>)> PrintRecordData =
nullptr)
const;
316 function_ref<
Error(FileOffset, OnDiskTrieRawHashMap::ConstValueProxy)>
317 RecordVerifier)
const;
318 TrieRawHashMapHandle() =
default;
320 std::shared_ptr<OnDiskCASLogger> Logger =
nullptr)
323 std::shared_ptr<OnDiskCASLogger> Logger =
nullptr)
324 : TrieRawHashMapHandle(
326 std::
move(Logger)) {}
328 OnDiskCASLogger *getLogger()
const {
return Logger.get(); }
329 void setLogger(std::shared_ptr<OnDiskCASLogger> Logger) {
330 this->Logger = std::move(Logger);
336 std::shared_ptr<OnDiskCASLogger> Logger;
343 TrieRawHashMapHandle Trie;
350 assert(StartBit <= TrieRawHashMapHandle::MaxNumHashBits);
351 assert(NumBits <= UINT8_MAX);
352 assert(NumBits <= TrieRawHashMapHandle::MaxNumRootBits);
356 return Mem.takeError();
361 for (
auto I = S.Slots.begin(),
E = S.Slots.end();
I !=
E; ++
I)
365 Logger->logSubtrieHandleCreate(
Alloc.data(), S.getOffset().Offset, StartBit,
370SubtrieHandle TrieRawHashMapHandle::getRoot()
const {
371 if (int64_t Root =
H->RootTrieOffset)
372 return SubtrieHandle(getRegion(), SubtrieSlotValue::getSubtrieOffset(Root),
374 return SubtrieHandle();
380 if (SubtrieHandle Root =
getRoot())
385 SubtrieHandle::create(
Alloc, 0,
H->NumSubtrieBits,
Logger.get());
387 return LazyRoot.takeError();
389 if (
H->RootTrieOffset.compare_exchange_strong(
390 Race, LazyRoot->getOffset().asSubtrie()),
397 return SubtrieHandle(getRegion(), SubtrieSlotValue::getSubtrieOffset(Race),
403 std::optional<uint64_t> NumRootBits,
406 std::shared_ptr<OnDiskCASLogger>
Logger) {
410 return Offset.takeError();
413 assert(
Name.size() <= UINT16_MAX &&
"Expected smaller table name");
414 assert(NumSubtrieBits <= UINT8_MAX &&
"Expected valid subtrie bits");
415 assert(NumHashBits <= UINT16_MAX &&
"Expected valid hash size");
416 assert(RecordDataSize <= UINT32_MAX &&
"Expected smaller table name");
426 char *NameStorage =
reinterpret_cast<char *
>(
H + 1);
428 NameStorage[
Name.size()] = 0;
431 TrieRawHashMapHandle Trie(
Alloc.getRegion(), *
H,
Logger);
432 auto Sub = SubtrieHandle::create(
Alloc, 0, *NumRootBits,
Logger.get());
434 return Sub.takeError();
436 H->RootTrieOffset =
Sub->getOffset().asSubtrie();
440TrieRawHashMapHandle::RecordData
441TrieRawHashMapHandle::getRecord(SubtrieSlotValue
Offset) {
447 return RecordData{Proxy,
Offset};
455 auto Offset =
Alloc.allocateOffset(getRecordSize());
457 return Offset.takeError();
459 RecordData
Record = getRecord(SubtrieSlotValue::getDataOffset(*
Offset));
463 Logger->logHashMappedTrieHandleCreateRecord(
474 "unaligned file offset at 0x" +
482 Offset.get() + Impl->Trie.getRecordSize() > Impl->File.getAlloc().size())
484 "file offset too large: 0x" +
488 TrieRawHashMapHandle::RecordData
D =
489 Impl->Trie.getRecord(SubtrieSlotValue::getDataOffset(
Offset));
495 TrieRawHashMapHandle Trie = Impl->Trie;
496 assert(Hash.
size() == Trie.getNumHashBytes() &&
"Invalid hash");
498 SubtrieHandle S = Trie.getRoot();
502 TrieHashIndexGenerator IndexGen = Trie.getIndexGen(S, Hash);
506 SubtrieSlotValue
V = S.load(Index);
512 TrieRawHashMapHandle::RecordData
D = Trie.getRecord(V);
518 S = SubtrieHandle(Trie.getRegion(), V, Trie.getLogger());
523void SubtrieHandle::reinitialize(uint32_t StartBit, uint32_t NumBits) {
524 assert(StartBit >
H->StartBit);
525 assert(NumBits <= H->NumBits);
528 H->StartBit = StartBit;
529 H->NumBits = NumBits;
532Expected<OnDiskTrieRawHashMap::OnDiskPtr>
534 LazyInsertOnConstructCB OnConstruct,
535 LazyInsertOnLeakCB OnLeak) {
536 TrieRawHashMapHandle Trie = Impl->Trie;
537 assert(Hash.
size() == Trie.getNumHashBytes() &&
"Invalid hash");
539 MappedFileRegionArena &
Alloc = Impl->File.getAlloc();
540 std::optional<SubtrieHandle> S;
541 auto Err = Trie.getOrCreateRoot(
Alloc).moveInto(S);
543 return std::move(Err);
545 TrieHashIndexGenerator IndexGen = Trie.getIndexGen(*S, Hash);
549 std::optional<TrieRawHashMapHandle::RecordData> NewRecord;
550 SubtrieHandle UnusedSubtrie;
552 SubtrieSlotValue Existing = S->load(Index);
557 auto Err = Trie.createRecord(
Alloc, Hash).moveInto(NewRecord);
559 return std::move(Err);
561 OnConstruct(NewRecord->Offset.asDataFileOffset(), NewRecord->Proxy);
564 if (S->compare_exchange_strong(Index, Existing, NewRecord->Offset))
566 NewRecord->Offset.asDataFileOffset());
571 if (Existing.isSubtrie()) {
572 S = SubtrieHandle(Trie.getRegion(), Existing, Trie.getLogger());
578 TrieRawHashMapHandle::RecordData ExistingRecord = Trie.getRecord(Existing);
579 if (ExistingRecord.Proxy.Hash == Hash) {
580 if (NewRecord && OnLeak)
581 OnLeak(NewRecord->Offset.asDataFileOffset(), NewRecord->Proxy,
582 ExistingRecord.Offset.asDataFileOffset(), ExistingRecord.Proxy);
584 ExistingRecord.Offset.asDataFileOffset());
589 size_t NextIndex = IndexGen.
next();
590 size_t NewIndexForExistingContent =
594 UnusedSubtrie, NewIndexForExistingContent)
597 return std::move(Err);
601 if (NextIndex != NewIndexForExistingContent)
607Expected<SubtrieHandle> SubtrieHandle::sink(
size_t I, SubtrieSlotValue V,
609 size_t NumSubtrieBits,
610 SubtrieHandle &UnusedSubtrie,
612 std::optional<SubtrieHandle> NewS;
617 NewS->reinitialize(getStartBit() + getNumBits(), NumSubtrieBits);
620 auto Err = SubtrieHandle::create(
Alloc, getStartBit() + getNumBits(),
621 NumSubtrieBits, Logger)
624 return std::move(Err);
627 NewS->store(NewI, V);
628 if (compare_exchange_strong(
I, V, NewS->getOffset()))
632 assert(
V.isSubtrie() &&
"Expected racing sink() to add a subtrie");
635 NewS->store(NewI, SubtrieSlotValue());
636 UnusedSubtrie = *NewS;
639 return SubtrieHandle(
Alloc.getRegion(), V, Logger);
643 raw_ostream &OS, function_ref<
void(ArrayRef<char>)> PrintRecordData)
const {
644 Impl->Trie.print(OS, PrintRecordData);
648 function_ref<
Error(
FileOffset, ConstValueProxy)> RecordVerifier)
const {
649 return Impl->Trie.validate(RecordVerifier);
653static void printHexDigits(raw_ostream &OS, ArrayRef<uint8_t> Bytes,
654 size_t StartBit,
size_t NumBits) {
655 assert(StartBit % 4 == 0);
657 for (
size_t I = StartBit,
E = StartBit + NumBits;
I !=
E;
I += 4) {
658 uint8_t HexPair = Bytes[
I / 8];
659 uint8_t HexDigit =
I % 8 == 0 ? HexPair >> 4 : HexPair & 0xf;
664static void printBits(raw_ostream &OS, ArrayRef<uint8_t> Bytes,
size_t StartBit,
666 assert(StartBit + NumBits <= Bytes.
size() * 8u);
667 for (
size_t I = StartBit,
E = StartBit + NumBits;
I !=
E; ++
I) {
668 uint8_t
Byte = Bytes[
I / 8];
669 size_t ByteOffset =
I % 8;
670 if (
size_t ByteShift = 8 - ByteOffset - 1)
672 OS << (
Byte & 0x1 ?
'1' :
'0');
676void SubtrieHandle::printHash(raw_ostream &OS, ArrayRef<uint8_t> Bytes)
const {
678 size_t EndBit = getStartBit() + getNumBits();
679 size_t HashEndBit = Bytes.
size() * 8u;
681 size_t FirstBinaryBit = getStartBit() & ~0x3u;
682 printHexDigits(OS, Bytes, 0, FirstBinaryBit);
684 size_t LastBinaryBit = (EndBit + 3u) & ~0x3u;
686 printBits(OS, Bytes, FirstBinaryBit, LastBinaryBit - FirstBinaryBit);
689 printHexDigits(OS, Bytes, LastBinaryBit, HashEndBit - LastBinaryBit);
692static void appendIndexBits(std::string &Prefix,
size_t Index,
695 for (
size_t NumBits = 1u; NumBits < NumSlots; NumBits <<= 1) {
696 Bits.push_back(
'0' + (Index & 0x1));
703static void printPrefix(raw_ostream &OS, StringRef Prefix) {
704 while (
Prefix.size() >= 4) {
706 bool ErrorParsingBinary =
Prefix.take_front(4).getAsInteger(2, Digit);
707 assert(!ErrorParsingBinary);
708 (void)ErrorParsingBinary;
713 OS <<
"[" <<
Prefix <<
"]";
718static Expected<size_t> checkParameter(StringRef Label,
size_t Max,
719 std::optional<size_t>
Value,
721 StringRef Path, StringRef TableName) {
730 std::errc::argument_out_of_domain, Path, TableName,
731 "invalid " + Label +
": " + Twine(*
Value) +
" (max: " + Twine(Max) +
")");
736 return Impl->File.getRegion().size();
739Expected<OnDiskTrieRawHashMap>
741 size_t NumHashBits, uint64_t
DataSize,
742 uint64_t MaxFileSize,
743 std::optional<uint64_t> NewFileInitialSize,
744 std::shared_ptr<OnDiskCASLogger> Logger,
745 std::optional<size_t> NewTableNumRootBits,
746 std::optional<size_t> NewTableNumSubtrieBits) {
747 SmallString<128> PathStorage;
749 SmallString<128> TrieNameStorage;
750 StringRef TrieName = TrieNameTwine.
toStringRef(TrieNameStorage);
752 constexpr size_t DefaultNumRootBits = 10;
753 constexpr size_t DefaultNumSubtrieBits = 6;
756 if (
Error E = checkParameter(
757 "root bits", TrieRawHashMapHandle::MaxNumRootBits,
758 NewTableNumRootBits, DefaultNumRootBits, Path, TrieName)
759 .moveInto(NumRootBits))
762 size_t NumSubtrieBits;
763 if (
Error E = checkParameter(
"subtrie bits",
764 TrieRawHashMapHandle::MaxNumSubtrieBits,
765 NewTableNumSubtrieBits, DefaultNumSubtrieBits,
767 .moveInto(NumSubtrieBits))
770 size_t NumHashBytes = NumHashBits >> 3;
772 checkParameter(
"hash size", TrieRawHashMapHandle::MaxNumHashBits,
773 NumHashBits, std::nullopt, Path, TrieName)
776 assert(NumHashBits == NumHashBytes << 3 &&
777 "Expected hash size to be byte-aligned");
778 if (NumHashBits != NumHashBytes << 3)
780 std::errc::argument_out_of_domain, Path, TrieName,
781 "invalid hash size: " + Twine(NumHashBits) +
" (not byte-aligned)");
784 auto NewDBConstructor = [&](DatabaseFile &
DB) ->
Error {
785 auto Trie = TrieRawHashMapHandle::create(
DB.getAlloc(), TrieName,
786 NumRootBits, NumSubtrieBits,
789 return Trie.takeError();
791 return DB.addTable(*Trie);
795 Expected<DatabaseFile>
File =
798 return File.takeError();
801 std::optional<TableHandle> Table =
File->findTable(TrieName);
804 TrieName,
"table not found");
806 (
size_t)Table->getHeader().Kind, Path, TrieName))
808 auto Trie = Table->cast<TrieRawHashMapHandle>();
809 Trie.setLogger(Logger);
810 assert(Trie &&
"Already checked the kind");
822 if (
size_t Flags = Trie.getFlags())
824 "unsupported flags: " + Twine(Flags));
827 OnDiskTrieRawHashMap::ImplType Impl{DatabaseFile(std::move(*File)), Trie};
831static Error createInvalidTrieError(uint64_t
Offset,
const Twine &Msg) {
833 "invalid trie at 0x" +
851 TrieVisitor(TrieRawHashMapHandle Trie,
unsigned ThreadCount = 0,
852 unsigned ErrorLimit = 50)
853 : Trie(Trie), ErrorLimit(ErrorLimit),
855 virtual ~TrieVisitor() =
default;
860 virtual Error visitSubTrie(StringRef Prefix, SubtrieHandle SubTrie) {
865 virtual Error visitSlot(
unsigned I, SubtrieHandle Subtrie, StringRef Prefix,
866 SubtrieSlotValue Slot) {
871 TrieRawHashMapHandle Trie;
874 Error traverseTrieNode(SubtrieHandle Node, StringRef Prefix);
876 Error validateSubTrie(SubtrieHandle Node,
bool IsRoot);
879 void addError(
Error NewError) {
880 assert(NewError &&
"not an error");
881 std::lock_guard<std::mutex> ErrorLock(Lock);
882 if (NumError >= ErrorLimit) {
889 Err =
joinErrors(std::move(*Err), std::move(NewError));
891 Err = std::move(NewError);
895 bool tooManyErrors() {
896 std::lock_guard<std::mutex> ErrorLock(Lock);
897 return (
bool)Err && NumError >= ErrorLimit;
900 const unsigned ErrorLimit;
901 std::optional<Error> Err;
902 unsigned NumError = 0;
908class TriePrinter :
public TrieVisitor {
910 TriePrinter(TrieRawHashMapHandle Trie, raw_ostream &OS,
911 function_ref<
void(ArrayRef<char>)> PrintRecordData)
912 : TrieVisitor(Trie, 1), OS(OS),
913 PrintRecordData(PrintRecordData) {}
915 Error printRecords() {
921 for (int64_t
Offset : Records) {
922 TrieRawHashMapHandle::RecordData
Record =
923 Trie.getRecord(SubtrieSlotValue::getDataOffset(
Offset));
924 if (
auto Err = printRecord(Record))
930 Error printRecord(TrieRawHashMapHandle::RecordData &Record) {
931 OS <<
"- addr=" << (
void *)
Record.getFileOffset().get() <<
" ";
932 if (PrintRecordData) {
933 PrintRecordData(
Record.Proxy.Data);
936 ArrayRef<uint8_t>
Data(
937 reinterpret_cast<const uint8_t *
>(
Record.Proxy.Data.data()),
938 Record.Proxy.Data.size());
939 printHexDigits(OS,
Data, 0,
Data.size() * 8);
945 Error visitSubTrie(StringRef Prefix, SubtrieHandle SubTrie)
override {
950 printPrefix(OS, Prefix);
954 << (
void *)(
reinterpret_cast<const char *
>(&SubTrie.getHeader()) -
955 Trie.getRegion().data());
956 OS <<
" num-slots=" << SubTrie.getNumSlots() <<
"\n";
960 Error visitSlot(
unsigned I, SubtrieHandle Subtrie, StringRef Prefix,
961 SubtrieSlotValue Slot)
override {
963 for (
size_t Pad : {10, 100, 1000})
964 if (
I < Pad && Subtrie.getNumSlots() >= Pad)
967 if (
Slot.isSubtrie()) {
968 OS <<
"addr=" << (
void *)
Slot.asSubtrie();
970 printPrefix(OS, Prefix);
974 TrieRawHashMapHandle::RecordData
Record = Trie.getRecord(Slot);
975 OS <<
"addr=" << (
void *)
Record.getFileOffset().get();
977 Subtrie.printHash(OS,
Record.Proxy.Hash);
985 function_ref<void(ArrayRef<char>)> PrintRecordData;
990class TrieVerifier :
public TrieVisitor {
993 TrieRawHashMapHandle Trie,
994 function_ref<
Error(FileOffset, OnDiskTrieRawHashMap::ConstValueProxy)>
996 : TrieVisitor(Trie), RecordVerifier(RecordVerifier) {}
999 Error visitSubTrie(StringRef Prefix, SubtrieHandle SubTrie)
final {
1003 Error visitSlot(
unsigned I, SubtrieHandle Subtrie, StringRef Prefix,
1004 SubtrieSlotValue Slot)
final {
1005 if (RecordVerifier &&
Slot.isData()) {
1007 return createInvalidTrieError(
Slot.asData(),
"mis-aligned data entry");
1009 TrieRawHashMapHandle::RecordData
Record =
1010 Trie.getRecord(SubtrieSlotValue::getDataOffset(
Slot.asData()));
1011 return RecordVerifier(
Slot.asDataFileOffset(),
1012 OnDiskTrieRawHashMap::ConstValueProxy{
1013 Record.Proxy.Hash, Record.Proxy.Data});
1018 function_ref<
Error(FileOffset, OnDiskTrieRawHashMap::ConstValueProxy)>
1023Error TrieVisitor::visit() {
1024 auto Root = Trie.getRoot();
1028 if (
auto Err = validateSubTrie(Root,
true))
1031 if (
auto Err = visitSubTrie(
"", Root))
1035 SmallVector<std::string> Prefixes;
1036 const size_t NumSlots = Root.getNumSlots();
1037 for (
size_t I = 0,
E = NumSlots;
I !=
E; ++
I) {
1038 SubtrieSlotValue
Slot = Root.load(
I);
1042 if (
Offset >= (uint64_t)Trie.getRegion().size())
1043 return createInvalidTrieError(
Offset,
"slot points out of bound");
1044 std::string SubtriePrefix;
1045 appendIndexBits(SubtriePrefix,
I, NumSlots);
1046 if (
Slot.isSubtrie()) {
1047 SubtrieHandle S(Trie.getRegion(), Slot, Trie.getLogger());
1051 if (
auto Err = visitSlot(
I, Root, SubtriePrefix, Slot))
1055 for (
size_t I = 0,
E = Subs.
size();
I !=
E; ++
I) {
1059 if (tooManyErrors())
1061 if (
auto Err = traverseTrieNode(Subs[Idx], Prefixes[Idx]))
1062 addError(std::move(Err));
1069 return std::move(*Err);
1073Error TrieVisitor::validateSubTrie(SubtrieHandle Node,
bool IsRoot) {
1074 char *Addr =
reinterpret_cast<char *
>(&
Node.getHeader());
1075 const int64_t
Offset =
Node.getFileOffset().get();
1076 if (Addr +
Node.getSize() >=
1077 Trie.getRegion().data() + Trie.getRegion().size())
1078 return createInvalidTrieError(
Offset,
"subtrie node spans out of bound");
1081 Node.getStartBit() +
Node.getNumBits() > Trie.getNumHashBits()) {
1082 return createInvalidTrieError(
Offset,
1083 "subtrie represents too many hash bits");
1087 if (
Node.getStartBit() != 0)
1088 return createInvalidTrieError(
Offset,
1089 "root node doesn't start at 0 index");
1094 if (
Node.getNumBits() > Trie.getNumSubtrieBits())
1095 return createInvalidTrieError(
Offset,
"subtrie has wrong number of slots");
1100Error TrieVisitor::traverseTrieNode(SubtrieHandle Node, StringRef Prefix) {
1101 if (
auto Err = validateSubTrie(Node,
false))
1104 if (
auto Err = visitSubTrie(Prefix, Node))
1108 SmallVector<std::string> Prefixes;
1109 const size_t NumSlots =
Node.getNumSlots();
1110 for (
size_t I = 0,
E = NumSlots;
I !=
E; ++
I) {
1115 if (
Offset >= (uint64_t)Trie.getRegion().size())
1116 return createInvalidTrieError(
Offset,
"slot points out of bound");
1117 std::string SubtriePrefix =
Prefix.str();
1118 appendIndexBits(SubtriePrefix,
I, NumSlots);
1119 if (
Slot.isSubtrie()) {
1120 SubtrieHandle S(Trie.getRegion(), Slot, Trie.getLogger());
1124 if (
auto Err = visitSlot(
I, Node, SubtriePrefix, Slot))
1127 for (
size_t I = 0,
E = Subs.
size();
I !=
E; ++
I)
1128 if (
auto Err = traverseTrieNode(Subs[
I], Prefixes[
I]))
1134void TrieRawHashMapHandle::print(
1135 raw_ostream &OS, function_ref<
void(ArrayRef<char>)> PrintRecordData)
const {
1136 OS <<
"hash-num-bits=" << getNumHashBits()
1137 <<
" hash-size=" << getNumHashBytes()
1138 <<
" record-data-size=" << getRecordDataSize() <<
"\n";
1140 TriePrinter
Printer(*
this, OS, PrintRecordData);
1141 if (
auto Err =
Printer.visit())
1142 OS <<
"error: " <<
toString(std::move(Err)) <<
"\n";
1144 if (
auto Err =
Printer.printRecords())
1145 OS <<
"error: " <<
toString(std::move(Err)) <<
"\n";
1148Error TrieRawHashMapHandle::validate(
1150 RecordVerifier)
const {
1152 TrieVisitor BasicVerifier(*
this);
1153 if (
auto Err = BasicVerifier.visit())
1159 TrieVerifier
Verifier(*
this, RecordVerifier);
1171 std::optional<uint64_t> NewFileInitialSize,
1172 std::shared_ptr<OnDiskCASLogger>
Logger,
1173 std::optional<size_t> NewTableNumRootBits,
1174 std::optional<size_t> NewTableNumSubtrieBits) {
1176 "OnDiskTrieRawHashMap is not supported");
1184 "OnDiskTrieRawHashMap is not supported");
1190 "OnDiskTrieRawHashMap is not supported");
1204 RecordVerifier)
const {
1206 "OnDiskTrieRawHashMap is not supported");
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Mark last scratch load
AMDGPU Prepare AGPR Alloc
static void print(raw_ostream &Out, object::Archive::Kind Kind, T Val)
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
#define LLVM_UNLIKELY(EXPR)
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
dxil pretty DXIL Metadata Pretty Printer
This file declares the common interface for a DatabaseFile that is used to implement OnDiskCAS.
static DeltaTreeNode * getRoot(void *Root)
static bool sink(Instruction &I, LoopInfo *LI, DominatorTree *DT, const Loop *CurLoop, ICFLoopSafetyInfo *SafetyInfo, MemorySSAUpdater &MSSAU, OptimizationRemarkEmitter *ORE)
When an instruction is found to only be used outside of the loop, this function moves it to the exit ...
This file declares interface for MappedFileRegionArena, a bump pointer allocator, backed by a memory-...
This file declares interface for OnDiskCASLogger, an interface that can be used to log CAS events to ...
This file declares interface for OnDiskTrieRawHashMap, a thread-safe and (mostly) lock-free hash map ...
void visit(MachineFunction &MF, MachineBasicBlock &Start, std::function< void(MachineBasicBlock *)> op)
verify safepoint Safepoint IR Verifier
static RecordT createRecord(const CVSymbol &sym)
static uint32_t getFlags(const Symbol *Sym)
static cl::opt< int > ThreadCount("threads", cl::init(0))
static unsigned getSize(unsigned Kind)
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
size_t size() const
size - Get the array size.
Lightweight error class with error context and mandatory checking.
static ErrorSuccess success()
Create a success value.
Tagged union holding either a T or a Error.
Logging utility - given an ordered specification of features, and assuming a scalar reward,...
void push_back(const T &Elt)
StringRef - Represent a constant reference to a string, i.e.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
StringRef toStringRef(SmallVectorImpl< char > &Out) const
This returns the twine as a single StringRef if it can be represented as such.
FileOffset is a wrapper around uint64_t to represent the offset of data from the beginning of the fil...
Allocator for an owned mapped file region that supports thread-safe and process-safe bump pointer all...
static constexpr Align getAlign()
Minimum alignment for allocations, currently hardcoded to 8B.
OnDiskTrieRawHashMap is a persistent trie data structure used as hash maps.
LLVM_ABI_FOR_TEST OnDiskTrieRawHashMap(OnDiskTrieRawHashMap &&RHS)
function_ref< void(FileOffset TentativeOffset, ValueProxy TentativeValue)> LazyInsertOnConstructCB
LLVM_ABI_FOR_TEST Error validate(function_ref< Error(FileOffset, ConstValueProxy)> RecordVerifier) const
Validate the trie data structure.
LLVM_ABI_FOR_TEST ConstOnDiskPtr find(ArrayRef< uint8_t > Hash) const
Find the value from hash.
LLVM_DUMP_METHOD void dump() const
static LLVM_ABI_FOR_TEST Expected< OnDiskTrieRawHashMap > create(const Twine &Path, const Twine &TrieName, size_t NumHashBits, uint64_t DataSize, uint64_t MaxFileSize, std::optional< uint64_t > NewFileInitialSize, std::shared_ptr< ondisk::OnDiskCASLogger > Logger=nullptr, std::optional< size_t > NewTableNumRootBits=std::nullopt, std::optional< size_t > NewTableNumSubtrieBits=std::nullopt)
Gets or creates a file at Path with a hash-mapped trie named TrieName.
LLVM_ABI_FOR_TEST size_t size() const
static bool validOffset(FileOffset Offset)
Check the valid range of file offset for OnDiskTrieRawHashMap.
LLVM_ABI_FOR_TEST Expected< OnDiskPtr > insertLazy(ArrayRef< uint8_t > Hash, LazyInsertOnConstructCB OnConstruct=nullptr, LazyInsertOnLeakCB OnLeak=nullptr)
Insert lazily.
LLVM_ABI_FOR_TEST size_t capacity() const
LLVM_ABI_FOR_TEST Expected< ConstOnDiskPtr > recoverFromFileOffset(FileOffset Offset) const
Helper function to recover a pointer into the trie from file offset.
LLVM_ABI_FOR_TEST OnDiskTrieRawHashMap & operator=(OnDiskTrieRawHashMap &&RHS)
void print(raw_ostream &OS, function_ref< void(ArrayRef< char >)> PrintRecordData=nullptr) const
function_ref< void(FileOffset TentativeOffset, ValueProxy TentativeValue, FileOffset FinalOffset, ValueProxy FinalValue)> LazyInsertOnLeakCB
LLVM_ABI_FOR_TEST ~OnDiskTrieRawHashMap()
static Expected< DatabaseFile > create(const Twine &Path, uint64_t Capacity, std::shared_ptr< OnDiskCASLogger > Logger, function_ref< Error(DatabaseFile &)> NewDBConstructor)
Create the DatabaseFile at Path with Capacity.
Interface for logging low-level on-disk cas operations.
An efficient, type-erasing, non-owning reference to a callable.
This class implements an extremely fast bulk output stream that can only output to a stream.
llvm::SmallVector< std::shared_ptr< RecordsSlice >, 4 > Records
void validate(const Triple &TT, const FeatureBitset &FeatureBits)
Error createTableConfigError(std::errc ErrC, StringRef Path, StringRef TableName, const Twine &Msg)
MappedFileRegionArena::RegionT MappedFileRegion
Error checkTable(StringRef Label, size_t Expected, size_t Observed, StringRef Path, StringRef TrieName)
NodeAddr< NodeBase * > Node
This is an optimization pass for GlobalISel generic memory operations.
ThreadPoolStrategy hardware_concurrency(unsigned ThreadCount=0)
Returns a default thread strategy where all available hardware resources are to be used,...
FunctionAddr VTableAddr Value
std::error_code make_error_code(BitcodeError E)
bool isAligned(Align Lhs, uint64_t SizeInBytes)
Checks that SizeInBytes is a multiple of the alignment.
FunctionAddr VTableAddr uintptr_t uintptr_t DataSize
std::string utohexstr(uint64_t X, bool LowerCase=false, unsigned Width=0)
Error createStringError(std::error_code EC, char const *Fmt, const Ts &... Vals)
Create formatted StringError object.
static Error getOffset(const SymbolRef &Sym, SectionRef Sec, uint64_t &Result)
auto reverse(ContainerTy &&C)
Error joinErrors(Error E1, Error E2)
Concatenate errors.
void sort(IteratorTy Start, IteratorTy End)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
char hexdigit(unsigned X, bool LowerCase=false)
hexdigit - Return the hexadecimal character for the given number X (which should be less than 16).
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
FunctionAddr VTableAddr uintptr_t uintptr_t Data
@ Sub
Subtraction of integers.
SingleThreadExecutor DefaultThreadPool
ArrayRef(const T &OneElt) -> ArrayRef< T >
std::string toString(const APInt &I, unsigned Radix, bool Signed, bool formatAsCLiteral=false, bool UpperCase=true, bool InsertSeparators=false)
OutputIt copy(R &&Range, OutputIt Out)
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
@ Default
The result values are uniform if and only if all operands are uniform.
void consumeError(Error Err)
Consume a Error without doing anything.
Implement std::hash so that hash_code can be used in STL containers.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
size_t getNumBits() const
size_t getCollidingBits(ArrayRef< uint8_t > CollidingBits) const
Const value proxy to access the records stored in TrieRawHashMap.
Value proxy to access the records stored in TrieRawHashMap.
MutableArrayRef< char > Data