1 //===- DataLayout.cpp - Data size & alignment routines ---------------------==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file defines layout properties related to datatype size/offset/alignment
10 // information.
11 //
12 // This structure should be created once, filled in if the defaults are not
13 // correct and then passed around by const&.  None of the members functions
14 // require modification to the object.
15 //
16 //===----------------------------------------------------------------------===//
17 
18 #include "llvm/IR/DataLayout.h"
19 #include "llvm/ADT/DenseMap.h"
20 #include "llvm/ADT/StringRef.h"
21 #include "llvm/IR/Constants.h"
22 #include "llvm/IR/DerivedTypes.h"
23 #include "llvm/IR/GetElementPtrTypeIterator.h"
24 #include "llvm/IR/GlobalVariable.h"
25 #include "llvm/IR/Module.h"
26 #include "llvm/IR/Type.h"
27 #include "llvm/IR/Value.h"
28 #include "llvm/Support/Casting.h"
29 #include "llvm/Support/Error.h"
30 #include "llvm/Support/ErrorHandling.h"
31 #include "llvm/Support/MathExtras.h"
32 #include "llvm/Support/MemAlloc.h"
33 #include "llvm/Support/TypeSize.h"
34 #include "llvm/TargetParser/Triple.h"
35 #include <algorithm>
36 #include <cassert>
37 #include <cstdint>
38 #include <cstdlib>
39 #include <new>
40 #include <utility>
41 
42 using namespace llvm;
43 
44 //===----------------------------------------------------------------------===//
45 // Support for StructLayout
46 //===----------------------------------------------------------------------===//
47 
48 StructLayout::StructLayout(StructType *ST, const DataLayout &DL)
49     : StructSize(TypeSize::getFixed(0)) {
50   assert(!ST->isOpaque() && "Cannot get layout of opaque structs");
51   IsPadded = false;
52   NumElements = ST->getNumElements();
53 
54   // Loop over each of the elements, placing them in memory.
55   for (unsigned i = 0, e = NumElements; i != e; ++i) {
56     Type *Ty = ST->getElementType(i);
57     if (i == 0 && Ty->isScalableTy())
58       StructSize = TypeSize::getScalable(0);
59 
60     const Align TyAlign = ST->isPacked() ? Align(1) : DL.getABITypeAlign(Ty);
61 
62     // Add padding if necessary to align the data element properly.
63     // Currently the only structure with scalable size will be the homogeneous
64     // scalable vector types. Homogeneous scalable vector types have members of
65     // the same data type so no alignment issue will happen. The condition here
66     // assumes so and needs to be adjusted if this assumption changes (e.g. we
67     // support structures with arbitrary scalable data type, or structure that
68     // contains both fixed size and scalable size data type members).
69     if (!StructSize.isScalable() && !isAligned(TyAlign, StructSize)) {
70       IsPadded = true;
71       StructSize = TypeSize::getFixed(alignTo(StructSize, TyAlign));
72     }
73 
74     // Keep track of maximum alignment constraint.
75     StructAlignment = std::max(TyAlign, StructAlignment);
76 
77     getMemberOffsets()[i] = StructSize;
78     // Consume space for this data item
79     StructSize += DL.getTypeAllocSize(Ty);
80   }
81 
82   // Add padding to the end of the struct so that it could be put in an array
83   // and all array elements would be aligned correctly.
84   if (!StructSize.isScalable() && !isAligned(StructAlignment, StructSize)) {
85     IsPadded = true;
86     StructSize = TypeSize::getFixed(alignTo(StructSize, StructAlignment));
87   }
88 }
89 
90 /// getElementContainingOffset - Given a valid offset into the structure,
91 /// return the structure index that contains it.
92 unsigned StructLayout::getElementContainingOffset(uint64_t FixedOffset) const {
93   assert(!StructSize.isScalable() &&
94          "Cannot get element at offset for structure containing scalable "
95          "vector types");
96   TypeSize Offset = TypeSize::getFixed(FixedOffset);
97   ArrayRef<TypeSize> MemberOffsets = getMemberOffsets();
98 
99   const auto *SI =
100       std::upper_bound(MemberOffsets.begin(), MemberOffsets.end(), Offset,
101                        [](TypeSize LHS, TypeSize RHS) -> bool {
102                          return TypeSize::isKnownLT(LHS, RHS);
103                        });
104   assert(SI != MemberOffsets.begin() && "Offset not in structure type!");
105   --SI;
106   assert(TypeSize::isKnownLE(*SI, Offset) && "upper_bound didn't work");
107   assert(
108       (SI == MemberOffsets.begin() || TypeSize::isKnownLE(*(SI - 1), Offset)) &&
109       (SI + 1 == MemberOffsets.end() ||
110        TypeSize::isKnownGT(*(SI + 1), Offset)) &&
111       "Upper bound didn't work!");
112 
113   // Multiple fields can have the same offset if any of them are zero sized.
114   // For example, in { i32, [0 x i32], i32 }, searching for offset 4 will stop
115   // at the i32 element, because it is the last element at that offset.  This is
116   // the right one to return, because anything after it will have a higher
117   // offset, implying that this element is non-empty.
118   return SI - MemberOffsets.begin();
119 }
120 
121 //===----------------------------------------------------------------------===//
122 // LayoutAlignElem, LayoutAlign support
123 //===----------------------------------------------------------------------===//
124 
125 LayoutAlignElem LayoutAlignElem::get(Align ABIAlign, Align PrefAlign,
126                                      uint32_t BitWidth) {
127   assert(ABIAlign <= PrefAlign && "Preferred alignment worse than ABI!");
128   LayoutAlignElem retval;
129   retval.ABIAlign = ABIAlign;
130   retval.PrefAlign = PrefAlign;
131   retval.TypeBitWidth = BitWidth;
132   return retval;
133 }
134 
135 bool LayoutAlignElem::operator==(const LayoutAlignElem &rhs) const {
136   return ABIAlign == rhs.ABIAlign && PrefAlign == rhs.PrefAlign &&
137          TypeBitWidth == rhs.TypeBitWidth;
138 }
139 
140 //===----------------------------------------------------------------------===//
141 // PointerAlignElem, PointerAlign support
142 //===----------------------------------------------------------------------===//
143 
144 PointerAlignElem PointerAlignElem::getInBits(uint32_t AddressSpace,
145                                              Align ABIAlign, Align PrefAlign,
146                                              uint32_t TypeBitWidth,
147                                              uint32_t IndexBitWidth) {
148   assert(ABIAlign <= PrefAlign && "Preferred alignment worse than ABI!");
149   PointerAlignElem retval;
150   retval.AddressSpace = AddressSpace;
151   retval.ABIAlign = ABIAlign;
152   retval.PrefAlign = PrefAlign;
153   retval.TypeBitWidth = TypeBitWidth;
154   retval.IndexBitWidth = IndexBitWidth;
155   return retval;
156 }
157 
158 bool
159 PointerAlignElem::operator==(const PointerAlignElem &rhs) const {
160   return (ABIAlign == rhs.ABIAlign && AddressSpace == rhs.AddressSpace &&
161           PrefAlign == rhs.PrefAlign && TypeBitWidth == rhs.TypeBitWidth &&
162           IndexBitWidth == rhs.IndexBitWidth);
163 }
164 
165 //===----------------------------------------------------------------------===//
166 //                       DataLayout Class Implementation
167 //===----------------------------------------------------------------------===//
168 
169 const char *DataLayout::getManglingComponent(const Triple &T) {
170   if (T.isOSBinFormatGOFF())
171     return "-m:l";
172   if (T.isOSBinFormatMachO())
173     return "-m:o";
174   if ((T.isOSWindows() || T.isUEFI()) && T.isOSBinFormatCOFF())
175     return T.getArch() == Triple::x86 ? "-m:x" : "-m:w";
176   if (T.isOSBinFormatXCOFF())
177     return "-m:a";
178   return "-m:e";
179 }
180 
181 static const std::pair<AlignTypeEnum, LayoutAlignElem> DefaultAlignments[] = {
182     {INTEGER_ALIGN, {1, Align(1), Align(1)}},    // i1
183     {INTEGER_ALIGN, {8, Align(1), Align(1)}},    // i8
184     {INTEGER_ALIGN, {16, Align(2), Align(2)}},   // i16
185     {INTEGER_ALIGN, {32, Align(4), Align(4)}},   // i32
186     {INTEGER_ALIGN, {64, Align(4), Align(8)}},   // i64
187     {FLOAT_ALIGN, {16, Align(2), Align(2)}},     // half, bfloat
188     {FLOAT_ALIGN, {32, Align(4), Align(4)}},     // float
189     {FLOAT_ALIGN, {64, Align(8), Align(8)}},     // double
190     {FLOAT_ALIGN, {128, Align(16), Align(16)}},  // ppcf128, quad, ...
191     {VECTOR_ALIGN, {64, Align(8), Align(8)}},    // v2i32, v1i64, ...
192     {VECTOR_ALIGN, {128, Align(16), Align(16)}}, // v16i8, v8i16, v4i32, ...
193 };
194 
195 void DataLayout::reset(StringRef Desc) {
196   clear();
197 
198   LayoutMap = nullptr;
199   BigEndian = false;
200   AllocaAddrSpace = 0;
201   StackNaturalAlign.reset();
202   ProgramAddrSpace = 0;
203   DefaultGlobalsAddrSpace = 0;
204   FunctionPtrAlign.reset();
205   TheFunctionPtrAlignType = FunctionPtrAlignType::Independent;
206   ManglingMode = MM_None;
207   NonIntegralAddressSpaces.clear();
208   StructAlignment = LayoutAlignElem::get(Align(1), Align(8), 0);
209 
210   // Default alignments
211   for (const auto &[Kind, Layout] : DefaultAlignments) {
212     if (Error Err = setAlignment(Kind, Layout.ABIAlign, Layout.PrefAlign,
213                                  Layout.TypeBitWidth))
214       return report_fatal_error(std::move(Err));
215   }
216   if (Error Err = setPointerAlignmentInBits(0, Align(8), Align(8), 64, 64))
217     return report_fatal_error(std::move(Err));
218 
219   if (Error Err = parseSpecifier(Desc))
220     return report_fatal_error(std::move(Err));
221 }
222 
223 Expected<DataLayout> DataLayout::parse(StringRef LayoutDescription) {
224   DataLayout Layout("");
225   if (Error Err = Layout.parseSpecifier(LayoutDescription))
226     return std::move(Err);
227   return Layout;
228 }
229 
230 static Error reportError(const Twine &Message) {
231   return createStringError(inconvertibleErrorCode(), Message);
232 }
233 
234 /// Checked version of split, to ensure mandatory subparts.
235 static Error split(StringRef Str, char Separator,
236                    std::pair<StringRef, StringRef> &Split) {
237   assert(!Str.empty() && "parse error, string can't be empty here");
238   Split = Str.split(Separator);
239   if (Split.second.empty() && Split.first != Str)
240     return reportError("Trailing separator in datalayout string");
241   if (!Split.second.empty() && Split.first.empty())
242     return reportError("Expected token before separator in datalayout string");
243   return Error::success();
244 }
245 
246 /// Get an unsigned integer, including error checks.
247 template <typename IntTy> static Error getInt(StringRef R, IntTy &Result) {
248   bool error = R.getAsInteger(10, Result); (void)error;
249   if (error)
250     return reportError("not a number, or does not fit in an unsigned int");
251   return Error::success();
252 }
253 
254 /// Get an unsigned integer representing the number of bits and convert it into
255 /// bytes. Error out of not a byte width multiple.
256 template <typename IntTy>
257 static Error getIntInBytes(StringRef R, IntTy &Result) {
258   if (Error Err = getInt<IntTy>(R, Result))
259     return Err;
260   if (Result % 8)
261     return reportError("number of bits must be a byte width multiple");
262   Result /= 8;
263   return Error::success();
264 }
265 
266 static Error getAddrSpace(StringRef R, unsigned &AddrSpace) {
267   if (Error Err = getInt(R, AddrSpace))
268     return Err;
269   if (!isUInt<24>(AddrSpace))
270     return reportError("Invalid address space, must be a 24-bit integer");
271   return Error::success();
272 }
273 
274 Error DataLayout::parseSpecifier(StringRef Desc) {
275   StringRepresentation = std::string(Desc);
276   while (!Desc.empty()) {
277     // Split at '-'.
278     std::pair<StringRef, StringRef> Split;
279     if (Error Err = ::split(Desc, '-', Split))
280       return Err;
281     Desc = Split.second;
282 
283     // Split at ':'.
284     if (Error Err = ::split(Split.first, ':', Split))
285       return Err;
286 
287     // Aliases used below.
288     StringRef &Tok  = Split.first;  // Current token.
289     StringRef &Rest = Split.second; // The rest of the string.
290 
291     if (Tok == "ni") {
292       do {
293         if (Error Err = ::split(Rest, ':', Split))
294           return Err;
295         Rest = Split.second;
296         unsigned AS;
297         if (Error Err = getInt(Split.first, AS))
298           return Err;
299         if (AS == 0)
300           return reportError("Address space 0 can never be non-integral");
301         NonIntegralAddressSpaces.push_back(AS);
302       } while (!Rest.empty());
303 
304       continue;
305     }
306 
307     char Specifier = Tok.front();
308     Tok = Tok.substr(1);
309 
310     switch (Specifier) {
311     case 's':
312       // Deprecated, but ignoring here to preserve loading older textual llvm
313       // ASM file
314       break;
315     case 'E':
316       BigEndian = true;
317       break;
318     case 'e':
319       BigEndian = false;
320       break;
321     case 'p': {
322       // Address space.
323       unsigned AddrSpace = 0;
324       if (!Tok.empty())
325         if (Error Err = getInt(Tok, AddrSpace))
326           return Err;
327       if (!isUInt<24>(AddrSpace))
328         return reportError("Invalid address space, must be a 24-bit integer");
329 
330       // Size.
331       if (Rest.empty())
332         return reportError(
333             "Missing size specification for pointer in datalayout string");
334       if (Error Err = ::split(Rest, ':', Split))
335         return Err;
336       unsigned PointerMemSize;
337       if (Error Err = getInt(Tok, PointerMemSize))
338         return Err;
339       if (!PointerMemSize)
340         return reportError("Invalid pointer size of 0 bytes");
341 
342       // ABI alignment.
343       if (Rest.empty())
344         return reportError(
345             "Missing alignment specification for pointer in datalayout string");
346       if (Error Err = ::split(Rest, ':', Split))
347         return Err;
348       unsigned PointerABIAlign;
349       if (Error Err = getIntInBytes(Tok, PointerABIAlign))
350         return Err;
351       if (!isPowerOf2_64(PointerABIAlign))
352         return reportError("Pointer ABI alignment must be a power of 2");
353 
354       // Size of index used in GEP for address calculation.
355       // The parameter is optional. By default it is equal to size of pointer.
356       unsigned IndexSize = PointerMemSize;
357 
358       // Preferred alignment.
359       unsigned PointerPrefAlign = PointerABIAlign;
360       if (!Rest.empty()) {
361         if (Error Err = ::split(Rest, ':', Split))
362           return Err;
363         if (Error Err = getIntInBytes(Tok, PointerPrefAlign))
364           return Err;
365         if (!isPowerOf2_64(PointerPrefAlign))
366           return reportError(
367               "Pointer preferred alignment must be a power of 2");
368 
369         // Now read the index. It is the second optional parameter here.
370         if (!Rest.empty()) {
371           if (Error Err = ::split(Rest, ':', Split))
372             return Err;
373           if (Error Err = getInt(Tok, IndexSize))
374             return Err;
375           if (!IndexSize)
376             return reportError("Invalid index size of 0 bytes");
377         }
378       }
379       if (Error Err = setPointerAlignmentInBits(
380               AddrSpace, assumeAligned(PointerABIAlign),
381               assumeAligned(PointerPrefAlign), PointerMemSize, IndexSize))
382         return Err;
383       break;
384     }
385     case 'i':
386     case 'v':
387     case 'f':
388     case 'a': {
389       AlignTypeEnum AlignType;
390       switch (Specifier) {
391       default: llvm_unreachable("Unexpected specifier!");
392       case 'i': AlignType = INTEGER_ALIGN; break;
393       case 'v': AlignType = VECTOR_ALIGN; break;
394       case 'f': AlignType = FLOAT_ALIGN; break;
395       case 'a': AlignType = AGGREGATE_ALIGN; break;
396       }
397 
398       // Bit size.
399       unsigned Size = 0;
400       if (!Tok.empty())
401         if (Error Err = getInt(Tok, Size))
402           return Err;
403 
404       if (AlignType == AGGREGATE_ALIGN && Size != 0)
405         return reportError(
406             "Sized aggregate specification in datalayout string");
407 
408       // ABI alignment.
409       if (Rest.empty())
410         return reportError(
411             "Missing alignment specification in datalayout string");
412       if (Error Err = ::split(Rest, ':', Split))
413         return Err;
414       unsigned ABIAlign;
415       if (Error Err = getIntInBytes(Tok, ABIAlign))
416         return Err;
417       if (AlignType != AGGREGATE_ALIGN && !ABIAlign)
418         return reportError(
419             "ABI alignment specification must be >0 for non-aggregate types");
420 
421       if (!isUInt<16>(ABIAlign))
422         return reportError("Invalid ABI alignment, must be a 16bit integer");
423       if (ABIAlign != 0 && !isPowerOf2_64(ABIAlign))
424         return reportError("Invalid ABI alignment, must be a power of 2");
425       if (AlignType == INTEGER_ALIGN && Size == 8 && ABIAlign != 1)
426         return reportError(
427             "Invalid ABI alignment, i8 must be naturally aligned");
428 
429       // Preferred alignment.
430       unsigned PrefAlign = ABIAlign;
431       if (!Rest.empty()) {
432         if (Error Err = ::split(Rest, ':', Split))
433           return Err;
434         if (Error Err = getIntInBytes(Tok, PrefAlign))
435           return Err;
436       }
437 
438       if (!isUInt<16>(PrefAlign))
439         return reportError(
440             "Invalid preferred alignment, must be a 16bit integer");
441       if (PrefAlign != 0 && !isPowerOf2_64(PrefAlign))
442         return reportError("Invalid preferred alignment, must be a power of 2");
443 
444       if (Error Err = setAlignment(AlignType, assumeAligned(ABIAlign),
445                                    assumeAligned(PrefAlign), Size))
446         return Err;
447 
448       break;
449     }
450     case 'n':  // Native integer types.
451       while (true) {
452         unsigned Width;
453         if (Error Err = getInt(Tok, Width))
454           return Err;
455         if (Width == 0)
456           return reportError(
457               "Zero width native integer type in datalayout string");
458         LegalIntWidths.push_back(Width);
459         if (Rest.empty())
460           break;
461         if (Error Err = ::split(Rest, ':', Split))
462           return Err;
463       }
464       break;
465     case 'S': { // Stack natural alignment.
466       uint64_t Alignment;
467       if (Error Err = getIntInBytes(Tok, Alignment))
468         return Err;
469       if (Alignment != 0 && !llvm::isPowerOf2_64(Alignment))
470         return reportError("Alignment is neither 0 nor a power of 2");
471       StackNaturalAlign = MaybeAlign(Alignment);
472       break;
473     }
474     case 'F': {
475       switch (Tok.front()) {
476       case 'i':
477         TheFunctionPtrAlignType = FunctionPtrAlignType::Independent;
478         break;
479       case 'n':
480         TheFunctionPtrAlignType = FunctionPtrAlignType::MultipleOfFunctionAlign;
481         break;
482       default:
483         return reportError("Unknown function pointer alignment type in "
484                            "datalayout string");
485       }
486       Tok = Tok.substr(1);
487       uint64_t Alignment;
488       if (Error Err = getIntInBytes(Tok, Alignment))
489         return Err;
490       if (Alignment != 0 && !llvm::isPowerOf2_64(Alignment))
491         return reportError("Alignment is neither 0 nor a power of 2");
492       FunctionPtrAlign = MaybeAlign(Alignment);
493       break;
494     }
495     case 'P': { // Function address space.
496       if (Error Err = getAddrSpace(Tok, ProgramAddrSpace))
497         return Err;
498       break;
499     }
500     case 'A': { // Default stack/alloca address space.
501       if (Error Err = getAddrSpace(Tok, AllocaAddrSpace))
502         return Err;
503       break;
504     }
505     case 'G': { // Default address space for global variables.
506       if (Error Err = getAddrSpace(Tok, DefaultGlobalsAddrSpace))
507         return Err;
508       break;
509     }
510     case 'm':
511       if (!Tok.empty())
512         return reportError("Unexpected trailing characters after mangling "
513                            "specifier in datalayout string");
514       if (Rest.empty())
515         return reportError("Expected mangling specifier in datalayout string");
516       if (Rest.size() > 1)
517         return reportError("Unknown mangling specifier in datalayout string");
518       switch(Rest[0]) {
519       default:
520         return reportError("Unknown mangling in datalayout string");
521       case 'e':
522         ManglingMode = MM_ELF;
523         break;
524       case 'l':
525         ManglingMode = MM_GOFF;
526         break;
527       case 'o':
528         ManglingMode = MM_MachO;
529         break;
530       case 'm':
531         ManglingMode = MM_Mips;
532         break;
533       case 'w':
534         ManglingMode = MM_WinCOFF;
535         break;
536       case 'x':
537         ManglingMode = MM_WinCOFFX86;
538         break;
539       case 'a':
540         ManglingMode = MM_XCOFF;
541         break;
542       }
543       break;
544     default:
545       return reportError("Unknown specifier in datalayout string");
546       break;
547     }
548   }
549 
550   return Error::success();
551 }
552 
553 DataLayout::DataLayout(const Module *M) {
554   init(M);
555 }
556 
557 void DataLayout::init(const Module *M) { *this = M->getDataLayout(); }
558 
559 bool DataLayout::operator==(const DataLayout &Other) const {
560   bool Ret = BigEndian == Other.BigEndian &&
561              AllocaAddrSpace == Other.AllocaAddrSpace &&
562              StackNaturalAlign == Other.StackNaturalAlign &&
563              ProgramAddrSpace == Other.ProgramAddrSpace &&
564              DefaultGlobalsAddrSpace == Other.DefaultGlobalsAddrSpace &&
565              FunctionPtrAlign == Other.FunctionPtrAlign &&
566              TheFunctionPtrAlignType == Other.TheFunctionPtrAlignType &&
567              ManglingMode == Other.ManglingMode &&
568              LegalIntWidths == Other.LegalIntWidths &&
569              IntAlignments == Other.IntAlignments &&
570              FloatAlignments == Other.FloatAlignments &&
571              VectorAlignments == Other.VectorAlignments &&
572              StructAlignment == Other.StructAlignment &&
573              Pointers == Other.Pointers;
574   // Note: getStringRepresentation() might differs, it is not canonicalized
575   return Ret;
576 }
577 
578 static SmallVectorImpl<LayoutAlignElem>::const_iterator
579 findAlignmentLowerBound(const SmallVectorImpl<LayoutAlignElem> &Alignments,
580                         uint32_t BitWidth) {
581   return partition_point(Alignments, [BitWidth](const LayoutAlignElem &E) {
582     return E.TypeBitWidth < BitWidth;
583   });
584 }
585 
586 Error DataLayout::setAlignment(AlignTypeEnum AlignType, Align ABIAlign,
587                                Align PrefAlign, uint32_t BitWidth) {
588   // AlignmentsTy::ABIAlign and AlignmentsTy::PrefAlign were once stored as
589   // uint16_t, it is unclear if there are requirements for alignment to be less
590   // than 2^16 other than storage. In the meantime we leave the restriction as
591   // an assert. See D67400 for context.
592   assert(Log2(ABIAlign) < 16 && Log2(PrefAlign) < 16 && "Alignment too big");
593   if (!isUInt<24>(BitWidth))
594     return reportError("Invalid bit width, must be a 24-bit integer");
595   if (PrefAlign < ABIAlign)
596     return reportError(
597         "Preferred alignment cannot be less than the ABI alignment");
598 
599   SmallVectorImpl<LayoutAlignElem> *Alignments;
600   switch (AlignType) {
601   case AGGREGATE_ALIGN:
602     StructAlignment.ABIAlign = ABIAlign;
603     StructAlignment.PrefAlign = PrefAlign;
604     return Error::success();
605   case INTEGER_ALIGN:
606     Alignments = &IntAlignments;
607     break;
608   case FLOAT_ALIGN:
609     Alignments = &FloatAlignments;
610     break;
611   case VECTOR_ALIGN:
612     Alignments = &VectorAlignments;
613     break;
614   }
615 
616   auto I = partition_point(*Alignments, [BitWidth](const LayoutAlignElem &E) {
617     return E.TypeBitWidth < BitWidth;
618   });
619   if (I != Alignments->end() && I->TypeBitWidth == BitWidth) {
620     // Update the abi, preferred alignments.
621     I->ABIAlign = ABIAlign;
622     I->PrefAlign = PrefAlign;
623   } else {
624     // Insert before I to keep the vector sorted.
625     Alignments->insert(I, LayoutAlignElem::get(ABIAlign, PrefAlign, BitWidth));
626   }
627   return Error::success();
628 }
629 
630 const PointerAlignElem &
631 DataLayout::getPointerAlignElem(uint32_t AddressSpace) const {
632   if (AddressSpace != 0) {
633     auto I = lower_bound(Pointers, AddressSpace,
634                          [](const PointerAlignElem &A, uint32_t AddressSpace) {
635       return A.AddressSpace < AddressSpace;
636     });
637     if (I != Pointers.end() && I->AddressSpace == AddressSpace)
638       return *I;
639   }
640 
641   assert(Pointers[0].AddressSpace == 0);
642   return Pointers[0];
643 }
644 
645 Error DataLayout::setPointerAlignmentInBits(uint32_t AddrSpace, Align ABIAlign,
646                                             Align PrefAlign,
647                                             uint32_t TypeBitWidth,
648                                             uint32_t IndexBitWidth) {
649   if (PrefAlign < ABIAlign)
650     return reportError(
651         "Preferred alignment cannot be less than the ABI alignment");
652   if (IndexBitWidth > TypeBitWidth)
653     return reportError("Index width cannot be larger than pointer width");
654 
655   auto I = lower_bound(Pointers, AddrSpace,
656                        [](const PointerAlignElem &A, uint32_t AddressSpace) {
657     return A.AddressSpace < AddressSpace;
658   });
659   if (I == Pointers.end() || I->AddressSpace != AddrSpace) {
660     Pointers.insert(I,
661                     PointerAlignElem::getInBits(AddrSpace, ABIAlign, PrefAlign,
662                                                 TypeBitWidth, IndexBitWidth));
663   } else {
664     I->ABIAlign = ABIAlign;
665     I->PrefAlign = PrefAlign;
666     I->TypeBitWidth = TypeBitWidth;
667     I->IndexBitWidth = IndexBitWidth;
668   }
669   return Error::success();
670 }
671 
672 Align DataLayout::getIntegerAlignment(uint32_t BitWidth,
673                                       bool abi_or_pref) const {
674   auto I = findAlignmentLowerBound(IntAlignments, BitWidth);
675   // If we don't have an exact match, use alignment of next larger integer
676   // type. If there is none, use alignment of largest integer type by going
677   // back one element.
678   if (I == IntAlignments.end())
679     --I;
680   return abi_or_pref ? I->ABIAlign : I->PrefAlign;
681 }
682 
683 namespace {
684 
685 class StructLayoutMap {
686   using LayoutInfoTy = DenseMap<StructType*, StructLayout*>;
687   LayoutInfoTy LayoutInfo;
688 
689 public:
690   ~StructLayoutMap() {
691     // Remove any layouts.
692     for (const auto &I : LayoutInfo) {
693       StructLayout *Value = I.second;
694       Value->~StructLayout();
695       free(Value);
696     }
697   }
698 
699   StructLayout *&operator[](StructType *STy) {
700     return LayoutInfo[STy];
701   }
702 };
703 
704 } // end anonymous namespace
705 
706 void DataLayout::clear() {
707   LegalIntWidths.clear();
708   IntAlignments.clear();
709   FloatAlignments.clear();
710   VectorAlignments.clear();
711   Pointers.clear();
712   delete static_cast<StructLayoutMap *>(LayoutMap);
713   LayoutMap = nullptr;
714 }
715 
716 DataLayout::~DataLayout() {
717   clear();
718 }
719 
720 const StructLayout *DataLayout::getStructLayout(StructType *Ty) const {
721   if (!LayoutMap)
722     LayoutMap = new StructLayoutMap();
723 
724   StructLayoutMap *STM = static_cast<StructLayoutMap*>(LayoutMap);
725   StructLayout *&SL = (*STM)[Ty];
726   if (SL) return SL;
727 
728   // Otherwise, create the struct layout.  Because it is variable length, we
729   // malloc it, then use placement new.
730   StructLayout *L = (StructLayout *)safe_malloc(
731       StructLayout::totalSizeToAlloc<TypeSize>(Ty->getNumElements()));
732 
733   // Set SL before calling StructLayout's ctor.  The ctor could cause other
734   // entries to be added to TheMap, invalidating our reference.
735   SL = L;
736 
737   new (L) StructLayout(Ty, *this);
738 
739   return L;
740 }
741 
742 Align DataLayout::getPointerABIAlignment(unsigned AS) const {
743   return getPointerAlignElem(AS).ABIAlign;
744 }
745 
746 Align DataLayout::getPointerPrefAlignment(unsigned AS) const {
747   return getPointerAlignElem(AS).PrefAlign;
748 }
749 
750 unsigned DataLayout::getPointerSize(unsigned AS) const {
751   return divideCeil(getPointerAlignElem(AS).TypeBitWidth, 8);
752 }
753 
754 unsigned DataLayout::getMaxIndexSize() const {
755   unsigned MaxIndexSize = 0;
756   for (auto &P : Pointers)
757     MaxIndexSize =
758         std::max(MaxIndexSize, (unsigned)divideCeil(P.TypeBitWidth, 8));
759 
760   return MaxIndexSize;
761 }
762 
763 unsigned DataLayout::getPointerTypeSizeInBits(Type *Ty) const {
764   assert(Ty->isPtrOrPtrVectorTy() &&
765          "This should only be called with a pointer or pointer vector type");
766   Ty = Ty->getScalarType();
767   return getPointerSizeInBits(cast<PointerType>(Ty)->getAddressSpace());
768 }
769 
770 unsigned DataLayout::getIndexSize(unsigned AS) const {
771   return divideCeil(getPointerAlignElem(AS).IndexBitWidth, 8);
772 }
773 
774 unsigned DataLayout::getIndexTypeSizeInBits(Type *Ty) const {
775   assert(Ty->isPtrOrPtrVectorTy() &&
776          "This should only be called with a pointer or pointer vector type");
777   Ty = Ty->getScalarType();
778   return getIndexSizeInBits(cast<PointerType>(Ty)->getAddressSpace());
779 }
780 
781 /*!
782   \param abi_or_pref Flag that determines which alignment is returned. true
783   returns the ABI alignment, false returns the preferred alignment.
784   \param Ty The underlying type for which alignment is determined.
785 
786   Get the ABI (\a abi_or_pref == true) or preferred alignment (\a abi_or_pref
787   == false) for the requested type \a Ty.
788  */
789 Align DataLayout::getAlignment(Type *Ty, bool abi_or_pref) const {
790   assert(Ty->isSized() && "Cannot getTypeInfo() on a type that is unsized!");
791   switch (Ty->getTypeID()) {
792   // Early escape for the non-numeric types.
793   case Type::LabelTyID:
794     return abi_or_pref ? getPointerABIAlignment(0) : getPointerPrefAlignment(0);
795   case Type::PointerTyID: {
796     unsigned AS = cast<PointerType>(Ty)->getAddressSpace();
797     return abi_or_pref ? getPointerABIAlignment(AS)
798                        : getPointerPrefAlignment(AS);
799     }
800   case Type::ArrayTyID:
801     return getAlignment(cast<ArrayType>(Ty)->getElementType(), abi_or_pref);
802 
803   case Type::StructTyID: {
804     // Packed structure types always have an ABI alignment of one.
805     if (cast<StructType>(Ty)->isPacked() && abi_or_pref)
806       return Align(1);
807 
808     // Get the layout annotation... which is lazily created on demand.
809     const StructLayout *Layout = getStructLayout(cast<StructType>(Ty));
810     const Align Align =
811         abi_or_pref ? StructAlignment.ABIAlign : StructAlignment.PrefAlign;
812     return std::max(Align, Layout->getAlignment());
813   }
814   case Type::IntegerTyID:
815     return getIntegerAlignment(Ty->getIntegerBitWidth(), abi_or_pref);
816   case Type::HalfTyID:
817   case Type::BFloatTyID:
818   case Type::FloatTyID:
819   case Type::DoubleTyID:
820   // PPC_FP128TyID and FP128TyID have different data contents, but the
821   // same size and alignment, so they look the same here.
822   case Type::PPC_FP128TyID:
823   case Type::FP128TyID:
824   case Type::X86_FP80TyID: {
825     unsigned BitWidth = getTypeSizeInBits(Ty).getFixedValue();
826     auto I = findAlignmentLowerBound(FloatAlignments, BitWidth);
827     if (I != FloatAlignments.end() && I->TypeBitWidth == BitWidth)
828       return abi_or_pref ? I->ABIAlign : I->PrefAlign;
829 
830     // If we still couldn't find a reasonable default alignment, fall back
831     // to a simple heuristic that the alignment is the first power of two
832     // greater-or-equal to the store size of the type.  This is a reasonable
833     // approximation of reality, and if the user wanted something less
834     // less conservative, they should have specified it explicitly in the data
835     // layout.
836     return Align(PowerOf2Ceil(BitWidth / 8));
837   }
838   case Type::X86_MMXTyID:
839   case Type::FixedVectorTyID:
840   case Type::ScalableVectorTyID: {
841     unsigned BitWidth = getTypeSizeInBits(Ty).getKnownMinValue();
842     auto I = findAlignmentLowerBound(VectorAlignments, BitWidth);
843     if (I != VectorAlignments.end() && I->TypeBitWidth == BitWidth)
844       return abi_or_pref ? I->ABIAlign : I->PrefAlign;
845 
846     // By default, use natural alignment for vector types. This is consistent
847     // with what clang and llvm-gcc do.
848     //
849     // We're only calculating a natural alignment, so it doesn't have to be
850     // based on the full size for scalable vectors. Using the minimum element
851     // count should be enough here.
852     return Align(PowerOf2Ceil(getTypeStoreSize(Ty).getKnownMinValue()));
853   }
854   case Type::X86_AMXTyID:
855     return Align(64);
856   case Type::TargetExtTyID: {
857     Type *LayoutTy = cast<TargetExtType>(Ty)->getLayoutType();
858     return getAlignment(LayoutTy, abi_or_pref);
859   }
860   default:
861     llvm_unreachable("Bad type for getAlignment!!!");
862   }
863 }
864 
865 Align DataLayout::getABITypeAlign(Type *Ty) const {
866   return getAlignment(Ty, true);
867 }
868 
869 /// TODO: Remove this function once the transition to Align is over.
870 uint64_t DataLayout::getPrefTypeAlignment(Type *Ty) const {
871   return getPrefTypeAlign(Ty).value();
872 }
873 
874 Align DataLayout::getPrefTypeAlign(Type *Ty) const {
875   return getAlignment(Ty, false);
876 }
877 
878 IntegerType *DataLayout::getIntPtrType(LLVMContext &C,
879                                        unsigned AddressSpace) const {
880   return IntegerType::get(C, getPointerSizeInBits(AddressSpace));
881 }
882 
883 Type *DataLayout::getIntPtrType(Type *Ty) const {
884   assert(Ty->isPtrOrPtrVectorTy() &&
885          "Expected a pointer or pointer vector type.");
886   unsigned NumBits = getPointerTypeSizeInBits(Ty);
887   IntegerType *IntTy = IntegerType::get(Ty->getContext(), NumBits);
888   if (VectorType *VecTy = dyn_cast<VectorType>(Ty))
889     return VectorType::get(IntTy, VecTy);
890   return IntTy;
891 }
892 
893 Type *DataLayout::getSmallestLegalIntType(LLVMContext &C, unsigned Width) const {
894   for (unsigned LegalIntWidth : LegalIntWidths)
895     if (Width <= LegalIntWidth)
896       return Type::getIntNTy(C, LegalIntWidth);
897   return nullptr;
898 }
899 
900 unsigned DataLayout::getLargestLegalIntTypeSizeInBits() const {
901   auto Max = std::max_element(LegalIntWidths.begin(), LegalIntWidths.end());
902   return Max != LegalIntWidths.end() ? *Max : 0;
903 }
904 
905 IntegerType *DataLayout::getIndexType(LLVMContext &C,
906                                       unsigned AddressSpace) const {
907   return IntegerType::get(C, getIndexSizeInBits(AddressSpace));
908 }
909 
910 Type *DataLayout::getIndexType(Type *Ty) const {
911   assert(Ty->isPtrOrPtrVectorTy() &&
912          "Expected a pointer or pointer vector type.");
913   unsigned NumBits = getIndexTypeSizeInBits(Ty);
914   IntegerType *IntTy = IntegerType::get(Ty->getContext(), NumBits);
915   if (VectorType *VecTy = dyn_cast<VectorType>(Ty))
916     return VectorType::get(IntTy, VecTy);
917   return IntTy;
918 }
919 
920 int64_t DataLayout::getIndexedOffsetInType(Type *ElemTy,
921                                            ArrayRef<Value *> Indices) const {
922   int64_t Result = 0;
923 
924   generic_gep_type_iterator<Value* const*>
925     GTI = gep_type_begin(ElemTy, Indices),
926     GTE = gep_type_end(ElemTy, Indices);
927   for (; GTI != GTE; ++GTI) {
928     Value *Idx = GTI.getOperand();
929     if (StructType *STy = GTI.getStructTypeOrNull()) {
930       assert(Idx->getType()->isIntegerTy(32) && "Illegal struct idx");
931       unsigned FieldNo = cast<ConstantInt>(Idx)->getZExtValue();
932 
933       // Get structure layout information...
934       const StructLayout *Layout = getStructLayout(STy);
935 
936       // Add in the offset, as calculated by the structure layout info...
937       Result += Layout->getElementOffset(FieldNo);
938     } else {
939       if (int64_t ArrayIdx = cast<ConstantInt>(Idx)->getSExtValue())
940         Result += ArrayIdx * GTI.getSequentialElementStride(*this);
941     }
942   }
943 
944   return Result;
945 }
946 
947 static APInt getElementIndex(TypeSize ElemSize, APInt &Offset) {
948   // Skip over scalable or zero size elements. Also skip element sizes larger
949   // than the positive index space, because the arithmetic below may not be
950   // correct in that case.
951   unsigned BitWidth = Offset.getBitWidth();
952   if (ElemSize.isScalable() || ElemSize == 0 ||
953       !isUIntN(BitWidth - 1, ElemSize)) {
954     return APInt::getZero(BitWidth);
955   }
956 
957   APInt Index = Offset.sdiv(ElemSize);
958   Offset -= Index * ElemSize;
959   if (Offset.isNegative()) {
960     // Prefer a positive remaining offset to allow struct indexing.
961     --Index;
962     Offset += ElemSize;
963     assert(Offset.isNonNegative() && "Remaining offset shouldn't be negative");
964   }
965   return Index;
966 }
967 
968 std::optional<APInt> DataLayout::getGEPIndexForOffset(Type *&ElemTy,
969                                                       APInt &Offset) const {
970   if (auto *ArrTy = dyn_cast<ArrayType>(ElemTy)) {
971     ElemTy = ArrTy->getElementType();
972     return getElementIndex(getTypeAllocSize(ElemTy), Offset);
973   }
974 
975   if (isa<VectorType>(ElemTy)) {
976     // Vector GEPs are partially broken (e.g. for overaligned element types),
977     // and may be forbidden in the future, so avoid generating GEPs into
978     // vectors. See https://discourse.llvm.org/t/67497
979     return std::nullopt;
980   }
981 
982   if (auto *STy = dyn_cast<StructType>(ElemTy)) {
983     const StructLayout *SL = getStructLayout(STy);
984     uint64_t IntOffset = Offset.getZExtValue();
985     if (IntOffset >= SL->getSizeInBytes())
986       return std::nullopt;
987 
988     unsigned Index = SL->getElementContainingOffset(IntOffset);
989     Offset -= SL->getElementOffset(Index);
990     ElemTy = STy->getElementType(Index);
991     return APInt(32, Index);
992   }
993 
994   // Non-aggregate type.
995   return std::nullopt;
996 }
997 
998 SmallVector<APInt> DataLayout::getGEPIndicesForOffset(Type *&ElemTy,
999                                                       APInt &Offset) const {
1000   assert(ElemTy->isSized() && "Element type must be sized");
1001   SmallVector<APInt> Indices;
1002   Indices.push_back(getElementIndex(getTypeAllocSize(ElemTy), Offset));
1003   while (Offset != 0) {
1004     std::optional<APInt> Index = getGEPIndexForOffset(ElemTy, Offset);
1005     if (!Index)
1006       break;
1007     Indices.push_back(*Index);
1008   }
1009 
1010   return Indices;
1011 }
1012 
1013 /// getPreferredAlign - Return the preferred alignment of the specified global.
1014 /// This includes an explicitly requested alignment (if the global has one).
1015 Align DataLayout::getPreferredAlign(const GlobalVariable *GV) const {
1016   MaybeAlign GVAlignment = GV->getAlign();
1017   // If a section is specified, always precisely honor explicit alignment,
1018   // so we don't insert padding into a section we don't control.
1019   if (GVAlignment && GV->hasSection())
1020     return *GVAlignment;
1021 
1022   // If no explicit alignment is specified, compute the alignment based on
1023   // the IR type. If an alignment is specified, increase it to match the ABI
1024   // alignment of the IR type.
1025   //
1026   // FIXME: Not sure it makes sense to use the alignment of the type if
1027   // there's already an explicit alignment specification.
1028   Type *ElemType = GV->getValueType();
1029   Align Alignment = getPrefTypeAlign(ElemType);
1030   if (GVAlignment) {
1031     if (*GVAlignment >= Alignment)
1032       Alignment = *GVAlignment;
1033     else
1034       Alignment = std::max(*GVAlignment, getABITypeAlign(ElemType));
1035   }
1036 
1037   // If no explicit alignment is specified, and the global is large, increase
1038   // the alignment to 16.
1039   // FIXME: Why 16, specifically?
1040   if (GV->hasInitializer() && !GVAlignment) {
1041     if (Alignment < Align(16)) {
1042       // If the global is not external, see if it is large.  If so, give it a
1043       // larger alignment.
1044       if (getTypeSizeInBits(ElemType) > 128)
1045         Alignment = Align(16); // 16-byte alignment.
1046     }
1047   }
1048   return Alignment;
1049 }
1050