lib/CodeGen/PatternInit.cpp

//===--- PatternInit.cpp - Pattern Initialization -------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
22989816SDimitry Andric
22989816SDimitry Andric#include "PatternInit.h"
22989816SDimitry Andric#include "CodeGenModule.h"
cfca06d7SDimitry Andric#include "clang/Basic/TargetInfo.h"
22989816SDimitry Andric#include "llvm/IR/Constant.h"
22989816SDimitry Andric#include "llvm/IR/Type.h"
22989816SDimitry Andric
22989816SDimitry Andricllvm::Constant *clang::CodeGen::initializationPatternFor(CodeGenModule &CGM,
22989816SDimitry Andric                                                         llvm::Type *Ty) {
22989816SDimitry Andric  // The following value is a guaranteed unmappable pointer value and has a
22989816SDimitry Andric  // repeated byte-pattern which makes it easier to synthesize. We use it for
22989816SDimitry Andric  // pointers as well as integers so that aggregates are likely to be
22989816SDimitry Andric  // initialized with this repeated value.
22989816SDimitry Andric  // For 32-bit platforms it's a bit trickier because, across systems, only the
22989816SDimitry Andric  // zero page can reasonably be expected to be unmapped. We use max 0xFFFFFFFF
22989816SDimitry Andric  // assuming that memory access will overlap into zero page.
22989816SDimitry Andric  const uint64_t IntValue =
22989816SDimitry Andric      CGM.getContext().getTargetInfo().getMaxPointerWidth() < 64
22989816SDimitry Andric          ? 0xFFFFFFFFFFFFFFFFull
22989816SDimitry Andric          : 0xAAAAAAAAAAAAAAAAull;
22989816SDimitry Andric  // Floating-point values are initialized as NaNs because they propagate. Using
22989816SDimitry Andric  // a repeated byte pattern means that it will be easier to initialize
22989816SDimitry Andric  // all-floating-point aggregates and arrays with memset. Further, aggregates
22989816SDimitry Andric  // which mix integral and a few floats might also initialize with memset
22989816SDimitry Andric  // followed by a handful of stores for the floats. Using fairly unique NaNs
22989816SDimitry Andric  // also means they'll be easier to distinguish in a crash.
22989816SDimitry Andric  constexpr bool NegativeNaN = true;
22989816SDimitry Andric  constexpr uint64_t NaNPayload = 0xFFFFFFFFFFFFFFFFull;
22989816SDimitry Andric  if (Ty->isIntOrIntVectorTy()) {
cfca06d7SDimitry Andric    unsigned BitWidth =
cfca06d7SDimitry Andric        cast<llvm::IntegerType>(Ty->getScalarType())->getBitWidth();
22989816SDimitry Andric    if (BitWidth <= 64)
22989816SDimitry Andric      return llvm::ConstantInt::get(Ty, IntValue);
22989816SDimitry Andric    return llvm::ConstantInt::get(
22989816SDimitry Andric        Ty, llvm::APInt::getSplat(BitWidth, llvm::APInt(64, IntValue)));
22989816SDimitry Andric  }
22989816SDimitry Andric  if (Ty->isPtrOrPtrVectorTy()) {
cfca06d7SDimitry Andric    auto *PtrTy = cast<llvm::PointerType>(Ty->getScalarType());
e3b55780SDimitry Andric    unsigned PtrWidth =
e3b55780SDimitry Andric        CGM.getDataLayout().getPointerSizeInBits(PtrTy->getAddressSpace());
22989816SDimitry Andric    if (PtrWidth > 64)
22989816SDimitry Andric      llvm_unreachable("pattern initialization of unsupported pointer width");
22989816SDimitry Andric    llvm::Type *IntTy = llvm::IntegerType::get(CGM.getLLVMContext(), PtrWidth);
22989816SDimitry Andric    auto *Int = llvm::ConstantInt::get(IntTy, IntValue);
22989816SDimitry Andric    return llvm::ConstantExpr::getIntToPtr(Int, PtrTy);
22989816SDimitry Andric  }
22989816SDimitry Andric  if (Ty->isFPOrFPVectorTy()) {
22989816SDimitry Andric    unsigned BitWidth = llvm::APFloat::semanticsSizeInBits(
cfca06d7SDimitry Andric        Ty->getScalarType()->getFltSemantics());
22989816SDimitry Andric    llvm::APInt Payload(64, NaNPayload);
22989816SDimitry Andric    if (BitWidth >= 64)
22989816SDimitry Andric      Payload = llvm::APInt::getSplat(BitWidth, Payload);
22989816SDimitry Andric    return llvm::ConstantFP::getQNaN(Ty, NegativeNaN, &Payload);
22989816SDimitry Andric  }
22989816SDimitry Andric  if (Ty->isArrayTy()) {
22989816SDimitry Andric    // Note: this doesn't touch tail padding (at the end of an object, before
22989816SDimitry Andric    // the next array object). It is instead handled by replaceUndef.
22989816SDimitry Andric    auto *ArrTy = cast<llvm::ArrayType>(Ty);
22989816SDimitry Andric    llvm::SmallVector<llvm::Constant *, 8> Element(
22989816SDimitry Andric        ArrTy->getNumElements(),
22989816SDimitry Andric        initializationPatternFor(CGM, ArrTy->getElementType()));
22989816SDimitry Andric    return llvm::ConstantArray::get(ArrTy, Element);
22989816SDimitry Andric  }
22989816SDimitry Andric
22989816SDimitry Andric  // Note: this doesn't touch struct padding. It will initialize as much union
22989816SDimitry Andric  // padding as is required for the largest type in the union. Padding is
22989816SDimitry Andric  // instead handled by replaceUndef. Stores to structs with volatile members
22989816SDimitry Andric  // don't have a volatile qualifier when initialized according to C++. This is
22989816SDimitry Andric  // fine because stack-based volatiles don't really have volatile semantics
22989816SDimitry Andric  // anyways, and the initialization shouldn't be observable.
22989816SDimitry Andric  auto *StructTy = cast<llvm::StructType>(Ty);
22989816SDimitry Andric  llvm::SmallVector<llvm::Constant *, 8> Struct(StructTy->getNumElements());
22989816SDimitry Andric  for (unsigned El = 0; El != Struct.size(); ++El)
22989816SDimitry Andric    Struct[El] = initializationPatternFor(CGM, StructTy->getElementType(El));
22989816SDimitry Andric  return llvm::ConstantStruct::get(StructTy, Struct);
22989816SDimitry Andric}