//===-- abi-x86-64.cpp ----------------------------------------------------===// // // LDC – the LLVM D compiler // // This file is distributed under the BSD-style LDC license. See the LICENSE // file for details. // //===----------------------------------------------------------------------===// // // extern(C) implements the C calling convention for x86-64, as found in // http://www.x86-64.org/documentation/abi-0.99.pdf // // Note: // Where a discrepancy was found between llvm-gcc and the ABI documentation, // llvm-gcc behavior was used for compatibility (after it was verified that // regular gcc has the same behavior). // // LLVM gets it right for most types, but complex numbers, structs and static // arrays need some help. To make sure it gets those right we essentially // bitcast these types to a type to which LLVM assigns the appropriate // registers (using DMD's toArgTypes() machinery), and pass that instead. // Structs that are required to be passed in memory are marked with the ByVal // attribute to ensure no part of them ends up in registers when only a subset // of the desired registers are available. // //===----------------------------------------------------------------------===// #include "gen/abi-x86-64.h" #include "aggregate.h" #include "declaration.h" #include "ldcbindings.h" #include "mtype.h" #include "gen/abi-generic.h" #include "gen/abi-x86-64.h" #include "gen/abi.h" #include "gen/dvalue.h" #include "gen/irstate.h" #include "gen/llvm.h" #include "gen/llvmhelpers.h" #include "gen/logger.h" #include "gen/tollvm.h" #include "ir/irfunction.h" #include #include #include #include TypeTuple *toArgTypes(Type *t); // in dmd2/argtypes.c namespace { namespace dmd_abi { // Structs, static arrays and cfloats may be rewritten to exploit registers. // This function returns the rewritten type, or null if no transformation is // needed. LLType *getAbiType(Type *ty) { // First, check if there's any need of a transformation: if (!(ty->ty == Tcomplex32 || ty->ty == Tstruct || ty->ty == Tsarray)) { return nullptr; // Nothing to do } // Okay, we may need to transform. Figure out a canonical type: TypeTuple *argTypes = toArgTypes(ty); if (!argTypes || argTypes->arguments->empty()) { return nullptr; // don't rewrite } LLType *abiTy = nullptr; if (argTypes->arguments->size() == 1) { abiTy = DtoType((*argTypes->arguments->begin())->type); // don't rewrite to a single bit (assertions in tollvm.cpp), choose a byte // instead abiTy = i1ToI8(abiTy); } else { std::vector parts; for (auto param : *argTypes->arguments) { LLType *partType = DtoType(param->type); // round up the DMD argtype for an eightbyte of a struct to a // corresponding 64-bit type // this makes sure that 64 bits of the chosen register are used and thus // makes sure all potential padding bytes of a struct are copied if (partType->isIntegerTy()) { partType = LLType::getInt64Ty(gIR->context()); } else if (partType->isFloatTy()) { partType = LLType::getDoubleTy(gIR->context()); } parts.push_back(partType); } abiTy = LLStructType::get(gIR->context(), parts); } return abiTy; } bool passByVal(Type *ty) { TypeTuple *argTypes = toArgTypes(ty); if (!argTypes) { return false; } return argTypes->arguments->empty(); // empty => cannot be passed in registers } } // namespace dmd_abi LLType *getAbiType(Type *ty) { return dmd_abi::getAbiType(ty->toBasetype()); } struct RegCount { char int_regs, sse_regs; RegCount() : int_regs(6), sse_regs(8) {} explicit RegCount(LLType *ty) : int_regs(0), sse_regs(0) { if (LLStructType *structTy = isaStruct(ty)) { for (unsigned i = 0; i < structTy->getNumElements(); ++i) { RegCount elementRegCount(structTy->getElementType(i)); int_regs += elementRegCount.int_regs; sse_regs += elementRegCount.sse_regs; } assert(int_regs + sse_regs <= 2); } else { // not a struct if (ty->isIntegerTy() || ty->isPointerTy()) { ++int_regs; } else if (ty->isFloatingPointTy() || ty->isVectorTy()) { // X87 reals are passed on the stack if (!ty->isX86_FP80Ty()) { ++sse_regs; } } else { unsigned sizeInBits = gDataLayout->getTypeSizeInBits(ty); IF_LOG Logger::cout() << "SysV RegCount: assuming 1 GP register for type " << *ty << " (" << sizeInBits << " bits)\n"; assert(sizeInBits > 0 && sizeInBits <= 64); ++int_regs; } } } enum SubtractionResult { ArgumentFitsIn, ArgumentWouldFitInPartially, ArgumentDoesntFitIn }; SubtractionResult trySubtract(const IrFuncTyArg &arg) { const RegCount wanted(arg.ltype); const bool anyRegAvailable = (wanted.int_regs > 0 && int_regs > 0) || (wanted.sse_regs > 0 && sse_regs > 0); if (!anyRegAvailable) { return ArgumentDoesntFitIn; } if (int_regs < wanted.int_regs || sse_regs < wanted.sse_regs) { return ArgumentWouldFitInPartially; } int_regs -= wanted.int_regs; sse_regs -= wanted.sse_regs; return ArgumentFitsIn; } }; } /** * This type performs the actual struct/cfloat rewriting by simply storing to * memory so that it's then readable as the other type (i.e., bit-casting). */ struct X86_64_C_struct_rewrite : ABIRewrite { LLValue *put(DValue *v) override { LLValue *address = getAddressOf(v); LLType *abiTy = getAbiType(v->type); assert(abiTy && "Why are we rewriting a non-rewritten type?"); return loadFromMemory(address, abiTy, ".X86_64_C_struct_rewrite_putResult"); } LLValue *getLVal(Type *dty, LLValue *v) override { return DtoAllocaDump(v, dty, ".X86_64_C_struct_rewrite_dump"); } LLType *type(Type *t) override { return getAbiType(t); } }; /** * This type is used to force LLVM to pass a LL struct in memory, * on the function arguments stack. We need this to prevent LLVM * from passing a LL struct partially in registers, partially in * memory. * This is achieved by passing a pointer to the struct and using * the ByVal LLVM attribute. */ struct ImplicitByvalRewrite : ABIRewrite { LLValue *put(DValue *v) override { return getAddressOf(v); } LLValue *getLVal(Type *dty, LLValue *v) override { return v; } LLType *type(Type *t) override { return DtoPtrToType(t); } }; struct X86_64TargetABI : TargetABI { X86_64_C_struct_rewrite struct_rewrite; ImplicitByvalRewrite byvalRewrite; bool returnInArg(TypeFunction *tf) override; bool passByVal(Type *t) override; void rewriteFunctionType(TypeFunction *tf, IrFuncTy &fty) override; void rewriteVarargs(IrFuncTy &fty, std::vector &args) override; void rewriteArgument(IrFuncTy &fty, IrFuncTyArg &arg) override; void rewriteArgument(IrFuncTyArg &arg, RegCount ®Count); LLValue *prepareVaStart(DLValue *ap) override; void vaCopy(DLValue *dest, DValue *src) override; LLValue *prepareVaArg(DLValue *ap) override; Type *vaListType() override; const char *objcMsgSendFunc(Type *ret, IrFuncTy &fty) override; private: LLType *getValistType(); RegCount &getRegCount(IrFuncTy &fty) { return reinterpret_cast(fty.tag); } }; // The public getter for abi.cpp TargetABI *getX86_64TargetABI() { return new X86_64TargetABI; } bool X86_64TargetABI::returnInArg(TypeFunction *tf) { if (tf->isref) { return false; } Type *rt = tf->next; return passByVal(rt); } bool X86_64TargetABI::passByVal(Type *t) { return dmd_abi::passByVal(t->toBasetype()); } void X86_64TargetABI::rewriteArgument(IrFuncTy &fty, IrFuncTyArg &arg) { llvm_unreachable("Please use the other overload explicitly."); } void X86_64TargetABI::rewriteArgument(IrFuncTyArg &arg, RegCount ®Count) { LLType *originalLType = arg.ltype; Type *t = arg.type->toBasetype(); LLType *abiTy = getAbiType(t); if (abiTy && !LLTypeMemoryLayout::typesAreEquivalent(abiTy, originalLType)) { IF_LOG { Logger::println("Rewriting argument type %s", t->toChars()); LOG_SCOPE; Logger::cout() << *originalLType << " => " << *abiTy << '\n'; } arg.rewrite = &struct_rewrite; arg.ltype = abiTy; } if (regCount.trySubtract(arg) == RegCount::ArgumentWouldFitInPartially) { // pass LL structs implicitly ByVal, otherwise LLVM passes // them partially in registers, partially in memory assert(originalLType->isStructTy()); IF_LOG Logger::cout() << "Passing implicitly ByVal: " << arg.type->toChars() << " (" << *originalLType << ")\n"; arg.rewrite = &byvalRewrite; arg.ltype = originalLType->getPointerTo(); arg.attrs.addByVal(DtoAlignment(arg.type)); } } void X86_64TargetABI::rewriteFunctionType(TypeFunction *tf, IrFuncTy &fty) { RegCount ®Count = getRegCount(fty); regCount = RegCount(); // initialize // RETURN VALUE if (!fty.ret->byref && fty.ret->type->toBasetype()->ty != Tvoid) { Logger::println("x86-64 ABI: Transforming return type"); LOG_SCOPE; RegCount dummy; rewriteArgument(*fty.ret, dummy); } // IMPLICIT PARAMETERS if (fty.arg_sret) { regCount.int_regs--; } if (fty.arg_this || fty.arg_nest) { regCount.int_regs--; } if (fty.arg_arguments) { regCount.int_regs -= 2; // dynamic array } // EXPLICIT PARAMETERS Logger::println("x86-64 ABI: Transforming argument types"); LOG_SCOPE; // extern(D): reverse parameter order for non variadics, for DMD-compliance if (tf->linkage == LINKd && tf->varargs != 1 && fty.args.size() > 1) { fty.reverseParams = true; } int begin = 0, end = fty.args.size(), step = 1; if (fty.reverseParams) { begin = end - 1; end = -1; step = -1; } for (int i = begin; i != end; i += step) { IrFuncTyArg &arg = *fty.args[i]; if (arg.byref) { if (!arg.isByVal() && regCount.int_regs > 0) { regCount.int_regs--; } continue; } rewriteArgument(arg, regCount); } // regCount (fty.tag) is now in the state after all implicit & formal args, // ready to serve as initial state for each vararg call site, see below } void X86_64TargetABI::rewriteVarargs(IrFuncTy &fty, std::vector &args) { // use a dedicated RegCount copy for each call site and initialize it with // fty.tag RegCount regCount = getRegCount(fty); for (auto arg : args) { if (!arg->byref) { // don't rewrite ByVal arguments rewriteArgument(*arg, regCount); } } } /** * The System V AMD64 ABI uses a special native va_list type - a 24-bytes struct * passed by reference. * In druntime, the struct is defined as core.stdc.stdarg.__va_list; the * actually used core.stdc.stdarg.va_list type is a raw char* pointer though to * achieve byref semantics. * This requires a little bit of compiler magic in the following * implementations. */ LLType *X86_64TargetABI::getValistType() { LLType *uintType = LLType::getInt32Ty(gIR->context()); LLType *voidPointerType = getVoidPtrType(); std::vector parts; // struct __va_list { parts.push_back(uintType); // uint gp_offset; parts.push_back(uintType); // uint fp_offset; parts.push_back(voidPointerType); // void* overflow_arg_area; parts.push_back(voidPointerType); // void* reg_save_area; } return LLStructType::get(gIR->context(), parts); } LLValue *X86_64TargetABI::prepareVaStart(DLValue *ap) { // Since the user only created a char* pointer (ap) on the stack before // invoking va_start, we first need to allocate the actual __va_list struct // and set `ap` to its address. LLValue *valistmem = DtoRawAlloca(getValistType(), 0, "__va_list_mem"); DtoStore(valistmem, DtoBitCast(DtoLVal(ap), getPtrToType(valistmem->getType()))); // Pass a i8* pointer to the actual struct to LLVM's va_start intrinsic. return DtoBitCast(valistmem, getVoidPtrType()); } void X86_64TargetABI::vaCopy(DLValue *dest, DValue *src) { // Analog to va_start, we first need to allocate a new __va_list struct on the // stack and set `dest` to its address. LLValue *valistmem = DtoRawAlloca(getValistType(), 0, "__va_list_mem"); DtoStore(valistmem, DtoBitCast(DtoLVal(dest), getPtrToType(valistmem->getType()))); // Then fill the new struct with a bitcopy of the source struct. // `src` is a char* pointer to the source struct. DtoMemCpy(valistmem, DtoRVal(src)); } LLValue *X86_64TargetABI::prepareVaArg(DLValue *ap) { // Pass a i8* pointer to the actual __va_list struct to LLVM's va_arg // intrinsic. return DtoRVal(ap); } Type *X86_64TargetABI::vaListType() { // We need to pass the actual va_list type for correct mangling. Simply // using TypeIdentifier here is a bit wonky but works, as long as the name // is actually available in the scope (this is what DMD does, so if a better // solution is found there, this should be adapted). static const llvm::StringRef ident = "__va_list_tag"; return (createTypeIdentifier(Loc(), Identifier::idPool(ident.data(), ident.size()))) ->pointerTo(); } const char *X86_64TargetABI::objcMsgSendFunc(Type *ret, IrFuncTy &fty) { // see objc/message.h for objc_msgSend selection rules if (fty.arg_sret) { return "objc_msgSend_stret"; } if (ret) { // complex long double return if (ret->ty == Tcomplex80) { return "objc_msgSend_fp2ret"; } // long double return if (ret->ty == Tfloat80 || ret->ty == Timaginary80) { return "objc_msgSend_fpret"; } } return "objc_msgSend"; }