blob: 45c2406e5b2199dda020e3144076c87464acd086 [file] [log] [blame]
//===-- go-llvm-cabi-oracle.cpp - implementation of CABIOracle ------------===//
//
// Copyright 2018 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
//
//===----------------------------------------------------------------------===//
//
// Methods for CABIOracle class.
//
//===----------------------------------------------------------------------===//
#include "go-llvm-cabi-oracle.h"
#include "go-llvm-typemanager.h"
#include "llvm/IR/DataLayout.h"
#include "llvm/Support/raw_ostream.h"
//......................................................................
// Given an LLVM type, classify it according to whether it would
// need to be passed in an integer or SSE register (or if it is
// some combination of entirely empty structs/arrays).
enum TypDisp { FlavSSE, FlavSIMDFP, FlavInt, FlavEmpty };
// Arm64 ABI AAPCS64 defines HFA as follows:
// An Homogeneous Floating-point Aggregate (HFA) is an Homogeneous Aggregate with
// a Fundamental Data Type that is a Floating-Point type and at most four uniquely
// addressable members.
struct HFAInfo {
unsigned number;
llvm::Type *type;
};
// Here "meet" is in the dataflow anlysis sense (meet operator on lattice
// values).
static TypDisp dispMeet(TypDisp d1, TypDisp d2) {
if (d1 == d2)
return d1;
if (d1 == FlavEmpty)
return d2;
if (d2 == FlavEmpty)
return d1;
if (d1 == FlavSSE && d2 == FlavSSE)
return FlavSSE;
return FlavInt;
}
static TypDisp getTypDisp(llvm::Type *typ) {
if (typ->isFloatTy() || typ->isDoubleTy())
return FlavSSE;
return FlavInt;
}
//......................................................................
// Q: split off this class into a separate file, so as to unit test it?
// The AMD64 ABI classification scheme for aggregates (section 3.2.3
// third page) talks about dividing up the contents of an array or
// struct info 8-byte chunks or regions; this container class holds
// info on a region. A given 8-byte region may contain something
// simple like a field of type "double", a pair of floats, or there
// may be a mix of floating point and integer fields within a struct.
// The "types" and "offsets" hold the LLVM types and offsets of
// elements relative to the start of the object; "abiDirectType" holds
// the type used to pass the elements if we're passing the entire
// object directly (in registers) as opposed in on the stack.
//
// Implementation of Arm64 ABI AAPCS64 reused this struct.
struct EightByteRegion {
EightByteRegion() : abiDirectType(nullptr), attr(AttrNone) { }
TypDisp getRegionTypDisp() const;
std::vector<llvm::Type*> types;
std::vector<uint64_t> offsets;
llvm::Type *abiDirectType;
CABIParamAttr attr;
void dump();
void osdump(llvm::raw_ostream &os);
};
TypDisp EightByteRegion::getRegionTypDisp() const {
TypDisp disp = FlavEmpty;
for (auto &t : types)
disp = dispMeet(getTypDisp(t), disp);
return disp;
}
void EightByteRegion::dump()
{
std::string s;
llvm::raw_string_ostream os(s);
osdump(os);
std::cerr << os.str();
}
void EightByteRegion::osdump(llvm::raw_ostream &os)
{
os << "types:\n";
for (auto &t : types) {
os << " ";
t->print(os);
os << "\n";
}
os << "offsets:\n";
for (auto &o : offsets) {
os << " " << o << "\n";
}
}
// This class is a container for zero or more EightByteRegion objects
// that correspond to the contents of an object of some type that
// we're going to be passing to or returning from a function.
class EightByteInfo {
public:
EightByteInfo(Btype *bt, TypeManager *tm);
std::vector<EightByteRegion> &regions() { return ebrs_; }
HFAInfo &getHFA() { return hfa_; }
void getRegisterRequirements(unsigned *numInt, unsigned *numSSE);
private:
std::vector<EightByteRegion> ebrs_;
HFAInfo hfa_;
TypeManager *typeManager_;
typedef std::pair<Btype *, unsigned> typAndOffset;
void addLeafTypes(Btype *bt, unsigned off, std::vector<typAndOffset> *leaves);
void explode(Btype *bt);
void setHFA();
void explodeStruct(Btype *bst);
void explodeArray(BArrayType *bat);
void incorporateScalar(Btype *bt);
void determineABITypesForARM_AAPCS();
void determineABITypesForX86_64_SysV();
TypeManager *tm() const { return typeManager_; }
};
EightByteInfo::EightByteInfo(Btype *bt, TypeManager *tmgr)
: typeManager_(tmgr)
{
explode(bt);
llvm::CallingConv::ID cconv = tmgr->callingConv();
switch (cconv) {
case llvm::CallingConv::X86_64_SysV:
determineABITypesForX86_64_SysV();
break;
case llvm::CallingConv::ARM_AAPCS:
setHFA();
if (getHFA().number == 0 && tmgr->typeSize(bt) <= 16) {
// For HFA and indirect cases, we don't need do this.
determineABITypesForARM_AAPCS();
}
break;
default:
llvm::errs() << "unsupported llvm::CallingConv::ID " << cconv << "\n";
break;
}
}
// Perform a pre-order walk of a type, collecting the various leaf
// elements within the type. The general idea is to flatten out any
// nested structs/arrays and expose each of the underlying scalar
// elements of the type along with their offsets. Return value is a
// list of type/offset pairs, where the offset represents the location
// of the scalar type within the larger aggregate type. Example:
//
// struct {
// f1 int8
// f2 [0]uint64
// struct {
// f1 int8
// }
// }
//
// The return for the struct above in "preserve" mode would be:
//
// { int8, 0 }, { int8, 8 }
//
void EightByteInfo::addLeafTypes(Btype *bt,
unsigned offset,
std::vector<typAndOffset> *leaves)
{
assert(bt && leaves);
BStructType *bst = bt->castToBStructType();
if (bst) {
unsigned numFields = bst->fields().size();
for (unsigned fidx = 0; fidx < numFields; ++fidx) {
unsigned foff = tm()->typeFieldOffset(bst, fidx);
addLeafTypes(bst->fieldType(fidx), offset + foff, leaves);
}
return;
}
BArrayType *bat = bt->castToBArrayType();
if (bat) {
Btype *et = bat->elemType();
for (unsigned elidx = 0; elidx < bat->nelSize(); ++elidx) {
unsigned eloff = elidx * tm()->typeSize(et);
addLeafTypes(et, offset + eloff, leaves);
}
return;
}
BComplexType *bct = bt->castToBComplexType();
if (bct) {
unsigned bits = bct->bits() / 2;
for (unsigned fidx = 0; fidx < 2; ++fidx) {
Btype *leaf = tm()->floatType(bits);
unsigned foff = tm()->typeFieldOffset(bct, fidx);
leaves->push_back(std::make_pair(leaf, foff));
}
return;
}
assert(bt->flavor() != Btype::AuxT && bt->flavor() != Btype::FunctionT);
leaves->push_back(std::make_pair(bt, offset));
}
// Given a struct type, explode it into zero, one or multiple EightByteRegion
// descriptors. Examples of the contents of EightByteInfo structs
// for various Go types follow. The first type (empty struct) results
// in a single EightByteRegion struct with empty vectors. The second
// type results in a single EightByteRegion, and the third yields two
// EightByteRegion.
//
// Go struct type: Computed EightByteRegions:
// C types: offsets:
//
// type empty struct { } [0] <no types> <no offsets>
//
// type foo struct {
// f1 uint8; [0] unsigned char 0
// f2 uint16; unsigned short 16
// f4 float32; float 32
// }
//
// type bar struct {
// f1 double; [0] double 0
// f2 uint8; [1] unsigned char 64
// f3 int16; short 80
// }
//
void EightByteInfo::explodeStruct(Btype *bst)
{
std::vector<typAndOffset> leafTypes;
addLeafTypes(bst, 0, &leafTypes);
// collect offsets and field types
EightByteRegion *cur8 = nullptr;
unsigned curOffset = 0;
for (auto &pair : leafTypes) {
Btype *lt = pair.first;
unsigned offset = pair.second;
if (cur8 == nullptr || (offset - curOffset >= 8)) {
ebrs_.push_back(EightByteRegion());
cur8 = &ebrs_.back();
curOffset = offset;
}
cur8->types.push_back(lt->type());
cur8->offsets.push_back(offset);
}
}
// Given an array type, explode it into zero, one or multiple EightByteInfo
// descriptors. Examples appear below; the first array type results
// in a single EightByteInfo with empty type/offset vectors, then the second
// array type results in a single EightByteInfo, and the thrd array
// type results in two EightByteInfo structs:
//
// Go type: Computed EightByteInfo:
// C types: offsets:
//
// [0]float32 [0] <no types> <no offsets>
//
// [3]uint8 [0] unsigned char 0
// unsigned char 8
// unsigned char 16
//
// [6]uint16 [0] unsigned short 0
// unsigned short 16
// unsigned short 32
// unsigned short 48
// [1] unsigned short 64
// unsigned short 80
void EightByteInfo::explodeArray(BArrayType *bat)
{
EightByteRegion *cur8 = nullptr;
unsigned curOffset = 0;
unsigned elSize = tm()->typeSize(bat->elemType());
for (unsigned elidx = 0; elidx < bat->nelSize(); ++elidx) {
unsigned offset = elidx * elSize;
if (cur8 == nullptr || (offset - curOffset >= 8)) {
ebrs_.push_back(EightByteRegion());
cur8 = &ebrs_.back();
curOffset = offset;
}
// note that elem type here may be composite
cur8->types.push_back(bat->elemType()->type());
cur8->offsets.push_back(offset);
}
}
void EightByteInfo::incorporateScalar(Btype *bt)
{
assert(tm()->typeSize(bt) <= 8);
EightByteRegion ebr;
ebr.types.push_back(bt->type());
ebr.offsets.push_back(0u);
ebr.abiDirectType = bt->type();
BIntegerType *bit = bt->castToBIntegerType();
if (bit && tm()->typeSize(bit) < 4)
ebr.attr = (bit->isUnsigned() ? AttrZext : AttrSext);
ebrs_.push_back(ebr);
}
// Convert a Btype into EightByteRegions.
void EightByteInfo::explode(Btype *bt)
{
BStructType *bst = bt->castToBStructType();
BComplexType *bct = bt->castToBComplexType();
BArrayType *bat = bt->castToBArrayType();
if (bst || bct || bat) {
// Flatten all composite types.
explodeStruct(bt);
} else {
incorporateScalar(bt);
}
}
void EightByteInfo::getRegisterRequirements(unsigned *numInt, unsigned *numSSE)
{
*numInt = 0;
*numSSE = 0;
for (auto &ebr : ebrs_)
if (ebr.getRegionTypDisp() == FlavSSE)
*numSSE += 1;
else
*numInt += 1;
}
// Check if the parameter is an Homogeneous Floating-point Aggregates (HFA),
// and set hfa_ according to the result.
void EightByteInfo::setHFA() {
if (ebrs_.empty()) {
hfa_ = HFAInfo{0, nullptr};
return;
}
unsigned num = 0;
llvm::Type *typ = ebrs_[0].types[0];
if (typ != tm()->llvmDoubleType() && typ != tm()->llvmFloatType()) {
hfa_ = HFAInfo{0, nullptr};
return;
}
for (auto &ebr : ebrs_) {
for (auto &t : ebr.types) {
if (t != typ || num > 3) {
hfa_ = HFAInfo{0, nullptr};
return;
}
++num;
}
}
hfa_ = HFAInfo{num, typ};
}
// Select the appropriate abi type for each eight-byte region within
// an EightByteInfo. HFA and arguments larger than 16 bytes have been
// processed, so the arguments processed here can only be integer types,
// pointer types or a mix of integer and non-integer, mapped it onto
// the pointer type or the appropriately sized integer type.
//
// Problems arise in the code below when dealing with structures with
// constructs that inject additional padding. For example, consider
// the following struct passed by value:
//
// struct {
// f1 int8
// f2 [0]uint64
// f3 int8
// }
//
// Without taking into account the over-alignment of field f3, we would
// wind up with two regions, each with type int8. This in itself is not so
// bad, but creating a struct from these two types (via ::computeABIStructType)
// would give us { int8, int8 }, in which the second field doesn't have
// the correct alignment. Work around this by checking for such situations
// and promoting the type of the first EBR to 64 bits.
//
void EightByteInfo::determineABITypesForARM_AAPCS() {
assert(ebrs_.size() <= 2);
for (auto &ebr : ebrs_) {
if (ebr.abiDirectType != nullptr)
continue;
// Preserve pointerness for the use of GC.
// TODO: this assumes pointer is 8 byte, so we never pack pointer
// and other stuff together.
if (ebr.types[0]->isPointerTy()) {
ebr.abiDirectType = tm()->llvmPtrType();
continue;
}
unsigned nel = ebr.offsets.size();
unsigned bytes = ebr.offsets[nel - 1] - ebr.offsets[0] +
tm()->llvmTypeSize(ebr.types[nel - 1]);
assert(bytes && bytes <= 8);
ebr.abiDirectType = tm()->llvmArbitraryIntegerType(bytes);
}
// See the example above for more on why this is needed.
if (ebrs_.size() == 2 && ebrs_[0].abiDirectType->isIntegerTy()) {
ebrs_[0].abiDirectType = tm()->llvmArbitraryIntegerType(8);
}
}
// Select the appropriate abi type for each eight-byte region within
// an EightByteInfo. Pure floating point types are mapped onto float,
// double, or <2 x float> (a vector type), integer types (or something
// that is a mix of integer and non-integer) are mapped onto the
// appropriately sized integer type.
//
// Problems arise in the code below when dealing with structures with
// constructs that inject additional padding. For example, consider
// the following struct passed by value:
//
// struct {
// f1 int8
// f2 [0]uint64
// f3 int8
// }
//
// Without taking into account the over-alignment of field f3, we would
// wind up with two regions, each with type int8. This in itself is not so
// bad, but creating a struct from these two types (via ::computeABIStructType)
// would give us { int8, int8 }, in which the second field doesn't have
// the correct alignment. Work around this by checking for such situations
// and promoting the type of the first EBR to 64 bits.
//
void EightByteInfo::determineABITypesForX86_64_SysV()
{
// In the direct case, ebrs_.size() cannot be greater than 2 because parameters
// larger than 16 bytes are passed indirectly.
assert(ebrs_.size() <= 2);
unsigned intRegions = 0;
unsigned floatRegions = 0;
for (auto &ebr : ebrs_) {
if (ebr.abiDirectType != nullptr)
continue;
TypDisp regionDisp = ebr.getRegionTypDisp();
if (regionDisp == FlavSSE) {
// Case 1: two floats -> vector
if (ebr.types.size() == 2)
ebr.abiDirectType = tm()->llvmTwoFloatVecType();
else if (ebr.types.size() == 1) {
assert(ebr.types[0] == tm()->llvmDoubleType() ||
ebr.types[0] == tm()->llvmFloatType());
ebr.abiDirectType = ebr.types[0];
} else {
assert(false && "this should never happen");
}
floatRegions += 1;
} else {
unsigned nel = ebr.offsets.size();
unsigned bytes = ebr.offsets[nel-1] - ebr.offsets[0] +
tm()->llvmTypeSize(ebr.types[nel-1]);
assert(bytes && bytes <= 8);
// Preserve pointerness for the use of GC.
// TODO: this assumes pointer is 8 byte, so we never pack pointer
// and other stuff together.
if (ebr.types[0]->isPointerTy())
ebr.abiDirectType = tm()->llvmPtrType();
else
ebr.abiDirectType = tm()->llvmArbitraryIntegerType(bytes);
intRegions += 1;
}
}
// See the example above for more on why this is needed.
if (intRegions == 2 &&
ebrs_[0].abiDirectType->isIntegerTy())
ebrs_[0].abiDirectType = tm()->llvmArbitraryIntegerType(8);
else if (floatRegions == 2 &&
ebrs_[0].abiDirectType == tm()->llvmFloatType())
ebrs_[0].abiDirectType = tm()->llvmDoubleType();
}
//......................................................................
llvm::Type *CABIParamInfo::computeABIStructType(TypeManager *tm) const
{
assert(tm);
if (abiTypes_.size() == 1) {
assert(abiTypes_[0]->isStructTy());
return abiTypes_[0];
}
assert(abiTypes_.size() <= CABIParamInfo::ABI_TYPES_MAX_SIZE);
llvm::Type *llst = tm->makeLLVMStructType(abiTypes_);
return llst;
}
void CABIParamInfo::dump()
{
std::string s;
llvm::raw_string_ostream os(s);
osdump(os);
std::cerr << os.str();
}
void CABIParamInfo::osdump(llvm::raw_ostream &os)
{
os << (disp() == ParmDirect ? "Direct" :
(disp() == ParmIgnore ? "Ignore" :
(disp() == ParmIndirect ? "Indirect" : "<unknown>")));
if (attr() != AttrNone)
os << (attr() == AttrStructReturn ? " AttrStructReturn" :
(attr() == AttrByVal ? " AttrByVal" :
(attr() == AttrNest ? " AttrNest" :
(attr() == AttrZext ? " AttrZext" :
(attr() == AttrSext ? " AttrSext" :
(attr() == AttrDoCopy ? " AttrDoCopy" : " <unknown>"))))));
os << " { ";
unsigned idx = 0;
for (auto &abit : abiTypes_) {
os << (idx++ != 0 ? ", " : "");
abit->print(os);
}
os << " }";
os << " sigOffset: " << sigOffset() << "\n";
}
//......................................................................
// Helper struct to track state information during ABI param
// classification. Keeps track of arg count (args in final ABI-cooked
// signature) along with available int/sse regs.
class ABIState {
public:
ABIState(TypeManager *typm) : argCount_(0) {
assert(typm != nullptr);
llvm::CallingConv::ID cconv = typm->callingConv();
switch (cconv) {
case llvm::CallingConv::X86_64_SysV:
availIntRegs_ = 6;
availSSERegs_ = 8;
break;
case llvm::CallingConv::ARM_AAPCS:
availIntRegs_ = 8;
availSIMDFPRegs_ = 8;
break;
default:
llvm::errs() << "unsupported llvm::CallingConv::ID " << cconv << "\n";
break;
}
}
void addDirectIntArg() {
if (availIntRegs_)
availIntRegs_ -= 1;
argCount_ += 1;
}
void addDirectSSEArg() {
if (availSSERegs_)
availSSERegs_ -= 1;
argCount_ += 1;
}
// For ARM_AAPCS HFA, one argument may takes multiple registers.
void addDirectSIMDFPArg(unsigned sr = 1) {
unsigned t = availSIMDFPRegs_ - sr;
if (availSIMDFPRegs_ > t)
availSIMDFPRegs_ = t;
argCount_ += 1;
}
void addIndirectArg() { argCount_ += 1; }
void addIndirectReturn() {
if (availIntRegs_)
availIntRegs_ -= 1;
argCount_ += 1;
}
// ARM_AAPCS uses separate x8 to store return address.
void addIndirectReturnForARM_AAPCS() { argCount_ += 1; }
void addChainArg() { argCount_ += 1; }
unsigned argCount() const { return argCount_; }
unsigned availIntRegs() const { return availIntRegs_; }
unsigned availSSERegs() const { return availSSERegs_; }
unsigned availSIMDFPRegs() const { return availSIMDFPRegs_; }
void clearAvailIntRegs() { availIntRegs_ = 0; }
void clearAvailSIMDFPRegs() { availSIMDFPRegs_ = 0; }
private:
unsigned availIntRegs_;
unsigned availSSERegs_;
unsigned availSIMDFPRegs_;
unsigned argCount_;
};
//......................................................................
CABIOracle::CABIOracle(const std::vector<Btype *> &fcnParamTypes,
Btype *fcnResultType,
bool followsCabi,
TypeManager *typeManager)
: fcnParamTypes_(fcnParamTypes)
, fcnResultType_(fcnResultType)
, fcnTypeForABI_(nullptr)
, typeManager_(typeManager)
, followsCabi_(followsCabi)
, ccID_(llvm::CallingConv::MaxID)
, cc_(nullptr)
{
setCC();
analyze();
}
CABIOracle::CABIOracle(BFunctionType *ft,
TypeManager *typeManager)
: fcnParamTypes_(ft->paramTypes())
, fcnResultType_(ft->resultType())
, fcnTypeForABI_(nullptr)
, typeManager_(typeManager)
, followsCabi_(ft->followsCabi())
, ccID_(llvm::CallingConv::MaxID)
, cc_(nullptr)
{
setCC();
analyze();
}
void CABIOracle::setCC()
{
assert(typeManager_ != nullptr);
ccID_ = typeManager_->callingConv();
// Supported architectures at present.
assert(ccID_ == llvm::CallingConv::X86_64_SysV ||
ccID_ == llvm::CallingConv::ARM_AAPCS);
if (cc_ != nullptr) {
return;
}
switch (ccID_) {
case llvm::CallingConv::X86_64_SysV:
cc_ = std::unique_ptr<CABIOracleArgumentAnalyzer>(new CABIOracleX86_64_SysV(typeManager_));
break;
case llvm::CallingConv::ARM_AAPCS:
cc_ = std::unique_ptr<CABIOracleArgumentAnalyzer>(new CABIOracleARM_AAPCS(typeManager_));
break;
default:
llvm::errs() << "unsupported llvm::CallingConv::ID " << ccID_ << "\n";
break;
}
}
TypeManager *CABIOracle::tm() const
{
return typeManager_;
}
llvm::FunctionType *CABIOracle::getFunctionTypeForABI()
{
assert(cc_ != nullptr);
return fcnTypeForABI_;
}
const CABIParamInfo &CABIOracle::paramInfo(unsigned idx)
{
assert(cc_ != nullptr);
// Slot 0: return info
// Slot 1: static chain param
// Slot 2: first argument / parameter
unsigned pidx = idx + 2;
assert(pidx < infov_.size());
return infov_[pidx];
}
const CABIParamInfo &CABIOracle::returnInfo()
{
assert(cc_ != nullptr);
unsigned ridx = 0;
assert(ridx < infov_.size());
return infov_[ridx];
}
const CABIParamInfo &CABIOracle::chainInfo()
{
assert(cc_ != nullptr);
unsigned ridx = 1;
assert(ridx < infov_.size());
return infov_[ridx];
}
void CABIOracle::dump()
{
std::cerr << toString();
}
std::string CABIOracle::toString()
{
std::string s;
llvm::raw_string_ostream os(s);
osdump(os);
return os.str();
}
void CABIOracle::osdump(llvm::raw_ostream &os)
{
os << "Return: ";
infov_[0].osdump(os);
for (unsigned pidx = 1; pidx < infov_.size(); pidx++) {
os << "Param " << pidx << ": ";
infov_[pidx].osdump(os);
}
}
// Fill in parameter / return / type information for a builtin function,
// e.g. all values passed + returned directly, no static chain param.
void CABIOracle::analyzeRaw()
{
//if (fcnTypeForABI_)
//return;
// First slot in the info vector will be for the return.
llvm::Type *rtyp = fcnResultType_->type();
CABIParamInfo rinfo(rtyp, ParmDirect, AttrNone, -1);
infov_.push_back(rinfo);
// No static chain, but we'll create an entry for the chain marked
// as ignored.
CABIParamInfo cinfo(tm()->llvmPtrType(), ParmIgnore, AttrNest, -1);
infov_.push_back(cinfo);
// Now process the params.
llvm::SmallVector<llvm::Type *, 8> elems(0);
for (unsigned idx = 0; idx < fcnParamTypes_.size(); ++idx) {
Btype *pType = fcnParamTypes_[idx];
CABIParamInfo pinfo(pType->type(), ParmDirect, AttrNone, idx);
infov_.push_back(pinfo);
elems.push_back(pType->type());
}
// Build the proper LLVM function type
const bool isVarargs = false;
fcnTypeForABI_ = llvm::FunctionType::get(rtyp, elems, isVarargs);
}
void CABIOracle::analyze()
{
if (fcnTypeForABI_)
return;
if (! followsCabi_) {
analyzeRaw();
return;
}
ABIState state(tm());
assert(cc_ != nullptr);
// First slot in the info vector will be for the return.
infov_.push_back(cc_->analyzeABIReturn(fcnResultType_, state));
// Static chain parameter
int sigOff = state.argCount();
state.addChainArg();
CABIParamInfo cparm(tm()->llvmPtrType(), ParmDirect, AttrNest, sigOff);
infov_.push_back(cparm);
// Now process the params.
for (unsigned idx = 0; idx < fcnParamTypes_.size(); ++idx) {
Btype *pType = fcnParamTypes_[idx];
auto d = cc_->analyzeABIParam(pType, state);
infov_.push_back(d);
}
llvm::SmallVector<llvm::Type *, 8> elems(0);
llvm::Type *rtyp = nullptr;
if (infov_[0].disp() == ParmIndirect) {
rtyp = tm()->llvmVoidType();
elems.push_back(infov_[0].abiType());
} else {
rtyp = infov_[0].abiType();
}
for (unsigned pidx = 1; pidx < infov_.size(); pidx++) {
if (infov_[pidx].disp() == ParmIgnore)
continue;
for (auto &abit : infov_[pidx].abiTypes())
elems.push_back(abit);
}
const bool isVarargs = false;
fcnTypeForABI_ = llvm::FunctionType::get(rtyp, elems, isVarargs);
}
//......................................................................
CABIOracleX86_64_SysV::CABIOracleX86_64_SysV(TypeManager *typeManager)
: CABIOracleArgumentAnalyzer(typeManager) {}
// For full C++ (with long double, unions, vector types) the
// rules here are a good deal more complicated, but for Go
// it all boils down to the size of the type.
CABIParamDisp CABIOracleX86_64_SysV::classifyArgType(Btype *btype)
{
int64_t sz = tm_->typeSize(btype);
return (sz == 0 ? ParmIgnore : ((sz <= 16) ? ParmDirect : ParmIndirect));
}
// Given the number of registers that we think a param is going to consume, and
// a state object storing the registers used so far, canPassDirectly() makes a
// decision as to whether a given param can be passed directly in registers vs
// in memory.
//
// Note the first clause, "if (regsInt + regsSSE == 1) return true". This may
// seem counter-intuitive (why no check against the state object?), but this way
// of doing things is the convention used by other front ends (e.g. clang). What
// is happening here is that for larger aggregate/array params (things that
// don't fit into a single register), we'll make the pass-through-memory
// semantics explicit in the function signature and generate the explict code to
// copy things into memory. For params that do fit into a single register,
// however, we just leave them all as by-value parameters and then assume that
// the back end will do the right thing (e.g. pass the first few in registers
// and then the remaining ones in memory).
//
// Doing things this way has performance advantages in that the middle-end
// (all of the machine-independent LLVM optimization passes) won't have
// to deal with the additional chunks of stack memory and code to copy
// things onto and off of the stack (not to mention the aliasing concerns
// when a local variable's address is taken and then passed in a function
// call).
bool CABIOracleX86_64_SysV::canPassDirectly(unsigned regsInt,
unsigned regsSSE,
ABIState &state)
{
if (regsInt + regsSSE == 1) // see comment above
return true;
if (regsInt <= state.availIntRegs() && regsSSE <= state.availSSERegs())
return true;
return false;
}
CABIParamInfo CABIOracleX86_64_SysV::analyzeABIParam(Btype *paramType,
ABIState &state)
{
llvm::Type *ptyp = paramType->type();
// The only situations in which we should be seeing AuxT types here is
// in cases where we're analyzing the signatures of builtin functions,
// meaning that there should be no structures or arrays.
assert(paramType->flavor() != Btype::AuxT || ptyp->isVoidTy() ||
!(ptyp->isStructTy() || ptyp->isArrayTy() || ptyp->isVectorTy() ||
ptyp->isEmptyTy() || ptyp->isIntegerTy(8) || ptyp->isIntegerTy(16)));
CABIParamDisp pdisp = classifyArgType(paramType);
if (pdisp == ParmIgnore) {
// Empty struct or array
llvm::Type *voidType = tm_->llvmVoidType();
return CABIParamInfo(voidType, ParmIgnore, AttrNone, -1);
}
int sigOff = state.argCount();
if (pdisp == ParmIndirect) {
// Value will be passed in memory on stack.
// Stack is always in address space 0.
llvm::Type *ptrTyp = llvm::PointerType::get(ptyp, 0);
state.addIndirectArg();
return CABIParamInfo(ptrTyp, ParmIndirect, AttrByVal, sigOff);
}
// Figure out what to do in the direct case
assert(pdisp == ParmDirect);
EightByteInfo ebi(paramType, tm_);
// Figure out how many registers it would take to pass this parm directly
unsigned regsInt = 0, regsSSE = 0;
ebi.getRegisterRequirements(&regsInt, &regsSSE);
// Make direct/indirect decision
CABIParamAttr attr = AttrNone;
if (canPassDirectly(regsInt, regsSSE, state)) {
std::vector<llvm::Type *> abiTypes;
for (auto &ebr : ebi.regions()) {
abiTypes.push_back(ebr.abiDirectType);
if (ebr.attr != AttrNone) {
assert(attr == AttrNone || attr == ebr.attr);
attr = ebr.attr;
}
if (ebr.getRegionTypDisp() == FlavSSE)
state.addDirectSSEArg();
else
state.addDirectIntArg();
}
return CABIParamInfo(abiTypes, ParmDirect, attr, sigOff);
} else {
state.addIndirectArg();
llvm::Type *ptrTyp = llvm::PointerType::get(ptyp, 0);
return CABIParamInfo(ptrTyp, ParmIndirect, AttrByVal, sigOff);
}
}
CABIParamInfo CABIOracleX86_64_SysV::analyzeABIReturn(Btype *resultType,
ABIState &state) {
llvm::Type *rtyp = resultType->type();
CABIParamDisp rdisp =
(rtyp == tm_->llvmVoidType() ? ParmIgnore
: classifyArgType(resultType));
if (rdisp == ParmIgnore) {
// This corresponds to a function with no returns or
// returning an empty composite.
llvm::Type *voidType = tm_->llvmVoidType();
return CABIParamInfo(voidType, ParmIgnore, AttrNone, -1);
}
if (rdisp == ParmIndirect) {
// Return value will be passed in memory, via a hidden
// struct return param.
// It is on stack, therefore address space 0.
llvm::Type *ptrTyp = llvm::PointerType::get(rtyp, 0);
state.addIndirectReturn();
return CABIParamInfo(ptrTyp, ParmIndirect, AttrStructReturn, 0);
}
// Figure out what to do in the direct case
assert(rdisp == ParmDirect);
EightByteInfo ebi(resultType, tm_);
auto &regions = ebi.regions();
if (regions.size() == 1) {
// Single value
return CABIParamInfo(regions[0].abiDirectType,
ParmDirect, regions[0].attr, -1);
}
// Two-element struct
assert(regions.size() == 2);
llvm::Type *abiTyp =
tm_->makeLLVMTwoElementStructType(regions[0].abiDirectType,
regions[1].abiDirectType);
return CABIParamInfo(abiTyp, ParmDirect, AttrNone, -1);
}
//......................................................................
CABIOracleARM_AAPCS::CABIOracleARM_AAPCS(TypeManager *typeManager)
: CABIOracleArgumentAnalyzer(typeManager) {}
// Given the number of registers that we think a param is going to consume, and
// a state object storing the registers used so far, canPassDirectly() makes a
// decision as to whether a given param can be passed directly in registers vs
// in memory.
//
// Note the first clause, "if (regsInt + regsSIMDFP == 1) return true". This may
// seem counter-intuitive (why no check against the state object?), but this way
// of doing things is the convention used by other front ends (e.g. clang). What
// is happening here is that for larger aggregate/array params (things that
// don't fit into a single register), we'll make the pass-through-memory
// semantics explicit in the function signature and generate the explict code to
// copy things into memory. For params that do fit into a single register,
// however, we just leave them all as by-value parameters and then assume that
// the back end will do the right thing (e.g. pass the first few in registers
// and then the remaining ones in memory).
//
// Doing things this way has performance advantages in that the middle-end
// (all of the machine-independent LLVM optimization passes) won't have
// to deal with the additional chunks of stack memory and code to copy
// things onto and off of the stack (not to mention the aliasing concerns
// when a local variable's address is taken and then passed in a function
// call).
bool CABIOracleARM_AAPCS::canPassDirectly(unsigned regsInt,
unsigned regsSIMDFP,
ABIState &state)
{
if (regsInt + regsSIMDFP == 1) // see comment above
return true;
if (regsInt <= state.availIntRegs() && regsSIMDFP <= state.availSIMDFPRegs())
return true;
return false;
}
CABIParamInfo CABIOracleARM_AAPCS::analyzeABIParam(Btype *paramType, ABIState &state)
{
llvm::Type *ptyp = paramType->type();
// The only situations in which we should be seeing AuxT types here is
// in cases where we're analyzing the signatures of builtin functions,
// meaning that there should be no structures or arrays.
assert(paramType->flavor() != Btype::AuxT || ptyp->isVoidTy() ||
!(ptyp->isStructTy() || ptyp->isArrayTy() || ptyp->isVectorTy() ||
ptyp->isEmptyTy() || ptyp->isIntegerTy(8) || ptyp->isIntegerTy(16)));
if (ptyp == tm_->llvmVoidType()) {
// Empty struct or array
llvm::Type *voidType = tm_->llvmVoidType();
return CABIParamInfo(voidType, ParmIgnore, AttrNone, -1);
}
// If ptyp is llvmVoidType, we may not able to get the size of it,
// so we can't combine the following if statement with the above one.
int64_t sz = tm_->typeSize(paramType);
if (sz == 0) {
// Empty struct or array
llvm::Type *voidType = tm_->llvmVoidType();
return CABIParamInfo(voidType, ParmIgnore, AttrNone, -1);
}
int sigOff = state.argCount();
// Go has only two floating point types: float32 and float64, so the size of
// an HFA does not exceed 32 bytes.
if (sz > 32) {
// Value will be passed in memory on stack.
// Stack is always in address space 0.
llvm::Type *ptrTyp = llvm::PointerType::get(ptyp, 0);
state.addIndirectArg();
return CABIParamInfo(ptrTyp, ParmIndirect, AttrDoCopy, sigOff);
}
EightByteInfo ebi(paramType, tm_);
auto &hfa = ebi.getHFA();
if (hfa.number != 0) {
// Is HFA.
llvm::Type * abiType = hfa.type;
if (hfa.number > 1) {
// If it contains multiple elements, make the param as an Array
// type. This ensures that an HFA is passed as a whole.
abiType = llvm::ArrayType::get(hfa.type, hfa.number);
}
if (canPassDirectly(0, hfa.number, state)) {
state.addDirectSIMDFPArg(hfa.number);
} else {
state.clearAvailSIMDFPRegs();
state.addIndirectArg();
}
// Whether or not an HFA can be passed in registers, we use
// ParmDirect. This is because HFA is passed by value on stack
// in indirect cases, and we happen to be able to reuse the
// processing logic of the direct cases.
return CABIParamInfo(abiType, ParmDirect, AttrNone, sigOff);
}
if (sz > 16) {
// Not an HFA,value will be passed in memory on stack.
// Stack is always in address space 0.
llvm::Type *ptrTyp = llvm::PointerType::get(ptyp, 0);
state.addIndirectArg();
return CABIParamInfo(ptrTyp, ParmIndirect, AttrDoCopy, sigOff);
}
// Direct case.
auto &regions = ebi.regions();
// Make direct/indirect decision
CABIParamAttr attr = AttrNone;
if (canPassDirectly(regions.size(), 0, state)) {
std::vector<llvm::Type *> abiTypes;
for (auto &ebr : regions) {
abiTypes.push_back(ebr.abiDirectType);
if (ebr.attr != AttrNone) {
assert(attr == AttrNone || attr == ebr.attr);
attr = ebr.attr;
}
state.addDirectIntArg();
}
return CABIParamInfo(abiTypes, ParmDirect, attr, sigOff);
} else {
state.clearAvailIntRegs();
state.addIndirectArg();
llvm::Type *abiType = regions[0].abiDirectType;
if (regions.size() > 1) {
// Convert the argument to an array type so that the backend considers it as a
// whole whether it can be passed through registers.
abiType = llvm::ArrayType::get(tm_->llvmArbitraryIntegerType(8), regions.size());
}
// Pass by value on stack, so use ParmDirect.
return CABIParamInfo(abiType, ParmDirect, AttrNone, sigOff);
}
}
CABIParamInfo CABIOracleARM_AAPCS::analyzeABIReturn(Btype *resultType,
ABIState &state) {
llvm::Type *rtyp = resultType->type();
if (rtyp == tm_->llvmVoidType()) {
// This corresponds to a function with no returns or
// returning an empty composite.
llvm::Type *voidType = tm_->llvmVoidType();
return CABIParamInfo(voidType, ParmIgnore, AttrNone, -1);
}
// If rtyp is llvmVoidType, we may not able to get the size of it,
// so we can't combine the following if statement with the above one.
int64_t sz = tm_->typeSize(resultType);
if (sz == 0) {
// This corresponds to a function with no returns or
// returning an empty composite.
llvm::Type *voidType = tm_->llvmVoidType();
return CABIParamInfo(voidType, ParmIgnore, AttrNone, -1);
}
// Go has only two floating point types: float32 and float64, so the size of
// an HFA does not exceed 32 bytes.
if (sz > 32) {
// Return value will be passed in memory, via a hidden
// struct return param.
// It is on stack, therefore address space 0.
llvm::Type *ptrTyp = llvm::PointerType::get(rtyp, 0);
// Indirect return value is passed by register R8, so doesn't occupy any int
// register.
state.addIndirectReturnForARM_AAPCS();
return CABIParamInfo(ptrTyp, ParmIndirect, AttrStructReturn, 0);
}
EightByteInfo ebi(resultType, tm_);
auto &hfa = ebi.getHFA();
if (hfa.number != 0) {
// Is HFA.
// If only one element, don't bother to make a llvm struct type.
if (hfa.number == 1) {
return CABIParamInfo(hfa.type, ParmDirect, AttrNone, -1);
}
std::vector<llvm::Type *> fields;
for (unsigned i = 0; i < hfa.number; ++i) {
fields.push_back(hfa.type);
}
llvm::Type *abiTyp = tm_->makeLLVMStructType(fields);
return CABIParamInfo(abiTyp, ParmDirect, AttrNone, -1);
}
// The return value is not an HFA and its size exceeds 16 bytes,
// be passed in memory, via a hidden struct return param.
if (sz > 16) {
llvm::Type *ptrTyp = llvm::PointerType::get(rtyp, 0);
state.addIndirectReturnForARM_AAPCS();
return CABIParamInfo(ptrTyp, ParmIndirect, AttrStructReturn, 0);
}
// Direct case
auto &regions = ebi.regions();
if (regions.size() == 1) {
// Single value
return CABIParamInfo(regions[0].abiDirectType, ParmDirect, regions[0].attr,
-1);
}
// Two-element struct
assert(regions.size() == 2);
llvm::Type *abiTyp = tm_->makeLLVMTwoElementStructType(
regions[0].abiDirectType, regions[1].abiDirectType);
return CABIParamInfo(abiTyp, ParmDirect, AttrNone, -1);
}
//......................................................................