ARMCallLowering.cpp 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582
  1. //===- llvm/lib/Target/ARM/ARMCallLowering.cpp - Call lowering ------------===//
  2. //
  3. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
  4. // See https://llvm.org/LICENSE.txt for license information.
  5. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  6. //
  7. //===----------------------------------------------------------------------===//
  8. //
  9. /// \file
  10. /// This file implements the lowering of LLVM calls to machine code calls for
  11. /// GlobalISel.
  12. //
  13. //===----------------------------------------------------------------------===//
  14. #include "ARMCallLowering.h"
  15. #include "ARMBaseInstrInfo.h"
  16. #include "ARMISelLowering.h"
  17. #include "ARMSubtarget.h"
  18. #include "Utils/ARMBaseInfo.h"
  19. #include "llvm/ADT/SmallVector.h"
  20. #include "llvm/CodeGen/Analysis.h"
  21. #include "llvm/CodeGen/CallingConvLower.h"
  22. #include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
  23. #include "llvm/CodeGen/GlobalISel/Utils.h"
  24. #include "llvm/CodeGen/LowLevelType.h"
  25. #include "llvm/CodeGen/MachineBasicBlock.h"
  26. #include "llvm/CodeGen/MachineFrameInfo.h"
  27. #include "llvm/CodeGen/MachineFunction.h"
  28. #include "llvm/CodeGen/MachineInstrBuilder.h"
  29. #include "llvm/CodeGen/MachineMemOperand.h"
  30. #include "llvm/CodeGen/MachineOperand.h"
  31. #include "llvm/CodeGen/MachineRegisterInfo.h"
  32. #include "llvm/CodeGen/TargetRegisterInfo.h"
  33. #include "llvm/CodeGen/TargetSubtargetInfo.h"
  34. #include "llvm/CodeGen/ValueTypes.h"
  35. #include "llvm/IR/Attributes.h"
  36. #include "llvm/IR/DataLayout.h"
  37. #include "llvm/IR/DerivedTypes.h"
  38. #include "llvm/IR/Function.h"
  39. #include "llvm/IR/Type.h"
  40. #include "llvm/IR/Value.h"
  41. #include "llvm/Support/Casting.h"
  42. #include "llvm/Support/LowLevelTypeImpl.h"
  43. #include "llvm/Support/MachineValueType.h"
  44. #include <algorithm>
  45. #include <cassert>
  46. #include <cstdint>
  47. #include <utility>
  48. using namespace llvm;
  49. ARMCallLowering::ARMCallLowering(const ARMTargetLowering &TLI)
  50. : CallLowering(&TLI) {}
  51. static bool isSupportedType(const DataLayout &DL, const ARMTargetLowering &TLI,
  52. Type *T) {
  53. if (T->isArrayTy())
  54. return isSupportedType(DL, TLI, T->getArrayElementType());
  55. if (T->isStructTy()) {
  56. // For now we only allow homogeneous structs that we can manipulate with
  57. // G_MERGE_VALUES and G_UNMERGE_VALUES
  58. auto StructT = cast<StructType>(T);
  59. for (unsigned i = 1, e = StructT->getNumElements(); i != e; ++i)
  60. if (StructT->getElementType(i) != StructT->getElementType(0))
  61. return false;
  62. return isSupportedType(DL, TLI, StructT->getElementType(0));
  63. }
  64. EVT VT = TLI.getValueType(DL, T, true);
  65. if (!VT.isSimple() || VT.isVector() ||
  66. !(VT.isInteger() || VT.isFloatingPoint()))
  67. return false;
  68. unsigned VTSize = VT.getSimpleVT().getSizeInBits();
  69. if (VTSize == 64)
  70. // FIXME: Support i64 too
  71. return VT.isFloatingPoint();
  72. return VTSize == 1 || VTSize == 8 || VTSize == 16 || VTSize == 32;
  73. }
  74. namespace {
  75. /// Helper class for values going out through an ABI boundary (used for handling
  76. /// function return values and call parameters).
  77. struct ARMOutgoingValueHandler : public CallLowering::OutgoingValueHandler {
  78. ARMOutgoingValueHandler(MachineIRBuilder &MIRBuilder,
  79. MachineRegisterInfo &MRI, MachineInstrBuilder &MIB,
  80. CCAssignFn *AssignFn)
  81. : OutgoingValueHandler(MIRBuilder, MRI, AssignFn), MIB(MIB) {}
  82. Register getStackAddress(uint64_t Size, int64_t Offset,
  83. MachinePointerInfo &MPO) override {
  84. assert((Size == 1 || Size == 2 || Size == 4 || Size == 8) &&
  85. "Unsupported size");
  86. LLT p0 = LLT::pointer(0, 32);
  87. LLT s32 = LLT::scalar(32);
  88. auto SPReg = MIRBuilder.buildCopy(p0, Register(ARM::SP));
  89. auto OffsetReg = MIRBuilder.buildConstant(s32, Offset);
  90. auto AddrReg = MIRBuilder.buildPtrAdd(p0, SPReg, OffsetReg);
  91. MPO = MachinePointerInfo::getStack(MIRBuilder.getMF(), Offset);
  92. return AddrReg.getReg(0);
  93. }
  94. void assignValueToReg(Register ValVReg, Register PhysReg,
  95. CCValAssign &VA) override {
  96. assert(VA.isRegLoc() && "Value shouldn't be assigned to reg");
  97. assert(VA.getLocReg() == PhysReg && "Assigning to the wrong reg?");
  98. assert(VA.getValVT().getSizeInBits() <= 64 && "Unsupported value size");
  99. assert(VA.getLocVT().getSizeInBits() <= 64 && "Unsupported location size");
  100. Register ExtReg = extendRegister(ValVReg, VA);
  101. MIRBuilder.buildCopy(PhysReg, ExtReg);
  102. MIB.addUse(PhysReg, RegState::Implicit);
  103. }
  104. void assignValueToAddress(Register ValVReg, Register Addr, uint64_t Size,
  105. MachinePointerInfo &MPO, CCValAssign &VA) override {
  106. assert((Size == 1 || Size == 2 || Size == 4 || Size == 8) &&
  107. "Unsupported size");
  108. Register ExtReg = extendRegister(ValVReg, VA);
  109. auto MMO = MIRBuilder.getMF().getMachineMemOperand(
  110. MPO, MachineMemOperand::MOStore, VA.getLocVT().getStoreSize(),
  111. Align(1));
  112. MIRBuilder.buildStore(ExtReg, Addr, *MMO);
  113. }
  114. unsigned assignCustomValue(const CallLowering::ArgInfo &Arg,
  115. ArrayRef<CCValAssign> VAs) override {
  116. assert(Arg.Regs.size() == 1 && "Can't handle multple regs yet");
  117. CCValAssign VA = VAs[0];
  118. assert(VA.needsCustom() && "Value doesn't need custom handling");
  119. // Custom lowering for other types, such as f16, is currently not supported
  120. if (VA.getValVT() != MVT::f64)
  121. return 0;
  122. CCValAssign NextVA = VAs[1];
  123. assert(NextVA.needsCustom() && "Value doesn't need custom handling");
  124. assert(NextVA.getValVT() == MVT::f64 && "Unsupported type");
  125. assert(VA.getValNo() == NextVA.getValNo() &&
  126. "Values belong to different arguments");
  127. assert(VA.isRegLoc() && "Value should be in reg");
  128. assert(NextVA.isRegLoc() && "Value should be in reg");
  129. Register NewRegs[] = {MRI.createGenericVirtualRegister(LLT::scalar(32)),
  130. MRI.createGenericVirtualRegister(LLT::scalar(32))};
  131. MIRBuilder.buildUnmerge(NewRegs, Arg.Regs[0]);
  132. bool IsLittle = MIRBuilder.getMF().getSubtarget<ARMSubtarget>().isLittle();
  133. if (!IsLittle)
  134. std::swap(NewRegs[0], NewRegs[1]);
  135. assignValueToReg(NewRegs[0], VA.getLocReg(), VA);
  136. assignValueToReg(NewRegs[1], NextVA.getLocReg(), NextVA);
  137. return 1;
  138. }
  139. bool assignArg(unsigned ValNo, MVT ValVT, MVT LocVT,
  140. CCValAssign::LocInfo LocInfo,
  141. const CallLowering::ArgInfo &Info, ISD::ArgFlagsTy Flags,
  142. CCState &State) override {
  143. if (AssignFn(ValNo, ValVT, LocVT, LocInfo, Flags, State))
  144. return true;
  145. StackSize =
  146. std::max(StackSize, static_cast<uint64_t>(State.getNextStackOffset()));
  147. return false;
  148. }
  149. MachineInstrBuilder &MIB;
  150. uint64_t StackSize = 0;
  151. };
  152. } // end anonymous namespace
  153. void ARMCallLowering::splitToValueTypes(const ArgInfo &OrigArg,
  154. SmallVectorImpl<ArgInfo> &SplitArgs,
  155. MachineFunction &MF) const {
  156. const ARMTargetLowering &TLI = *getTLI<ARMTargetLowering>();
  157. LLVMContext &Ctx = OrigArg.Ty->getContext();
  158. const DataLayout &DL = MF.getDataLayout();
  159. const Function &F = MF.getFunction();
  160. SmallVector<EVT, 4> SplitVTs;
  161. ComputeValueVTs(TLI, DL, OrigArg.Ty, SplitVTs, nullptr, nullptr, 0);
  162. assert(OrigArg.Regs.size() == SplitVTs.size() && "Regs / types mismatch");
  163. if (SplitVTs.size() == 1) {
  164. // Even if there is no splitting to do, we still want to replace the
  165. // original type (e.g. pointer type -> integer).
  166. auto Flags = OrigArg.Flags[0];
  167. Flags.setOrigAlign(DL.getABITypeAlign(OrigArg.Ty));
  168. SplitArgs.emplace_back(OrigArg.Regs[0], SplitVTs[0].getTypeForEVT(Ctx),
  169. Flags, OrigArg.IsFixed);
  170. return;
  171. }
  172. // Create one ArgInfo for each virtual register.
  173. for (unsigned i = 0, e = SplitVTs.size(); i != e; ++i) {
  174. EVT SplitVT = SplitVTs[i];
  175. Type *SplitTy = SplitVT.getTypeForEVT(Ctx);
  176. auto Flags = OrigArg.Flags[0];
  177. Flags.setOrigAlign(DL.getABITypeAlign(SplitTy));
  178. bool NeedsConsecutiveRegisters =
  179. TLI.functionArgumentNeedsConsecutiveRegisters(
  180. SplitTy, F.getCallingConv(), F.isVarArg());
  181. if (NeedsConsecutiveRegisters) {
  182. Flags.setInConsecutiveRegs();
  183. if (i == e - 1)
  184. Flags.setInConsecutiveRegsLast();
  185. }
  186. // FIXME: We also want to split SplitTy further.
  187. Register PartReg = OrigArg.Regs[i];
  188. SplitArgs.emplace_back(PartReg, SplitTy, Flags, OrigArg.IsFixed);
  189. }
  190. }
  191. /// Lower the return value for the already existing \p Ret. This assumes that
  192. /// \p MIRBuilder's insertion point is correct.
  193. bool ARMCallLowering::lowerReturnVal(MachineIRBuilder &MIRBuilder,
  194. const Value *Val, ArrayRef<Register> VRegs,
  195. MachineInstrBuilder &Ret) const {
  196. if (!Val)
  197. // Nothing to do here.
  198. return true;
  199. auto &MF = MIRBuilder.getMF();
  200. const auto &F = MF.getFunction();
  201. auto DL = MF.getDataLayout();
  202. auto &TLI = *getTLI<ARMTargetLowering>();
  203. if (!isSupportedType(DL, TLI, Val->getType()))
  204. return false;
  205. ArgInfo OrigRetInfo(VRegs, Val->getType());
  206. setArgFlags(OrigRetInfo, AttributeList::ReturnIndex, DL, F);
  207. SmallVector<ArgInfo, 4> SplitRetInfos;
  208. splitToValueTypes(OrigRetInfo, SplitRetInfos, MF);
  209. CCAssignFn *AssignFn =
  210. TLI.CCAssignFnForReturn(F.getCallingConv(), F.isVarArg());
  211. ARMOutgoingValueHandler RetHandler(MIRBuilder, MF.getRegInfo(), Ret,
  212. AssignFn);
  213. return handleAssignments(MIRBuilder, SplitRetInfos, RetHandler);
  214. }
  215. bool ARMCallLowering::lowerReturn(MachineIRBuilder &MIRBuilder,
  216. const Value *Val, ArrayRef<Register> VRegs,
  217. FunctionLoweringInfo &FLI) const {
  218. assert(!Val == VRegs.empty() && "Return value without a vreg");
  219. auto const &ST = MIRBuilder.getMF().getSubtarget<ARMSubtarget>();
  220. unsigned Opcode = ST.getReturnOpcode();
  221. auto Ret = MIRBuilder.buildInstrNoInsert(Opcode).add(predOps(ARMCC::AL));
  222. if (!lowerReturnVal(MIRBuilder, Val, VRegs, Ret))
  223. return false;
  224. MIRBuilder.insertInstr(Ret);
  225. return true;
  226. }
  227. namespace {
  228. /// Helper class for values coming in through an ABI boundary (used for handling
  229. /// formal arguments and call return values).
  230. struct ARMIncomingValueHandler : public CallLowering::IncomingValueHandler {
  231. ARMIncomingValueHandler(MachineIRBuilder &MIRBuilder,
  232. MachineRegisterInfo &MRI, CCAssignFn AssignFn)
  233. : IncomingValueHandler(MIRBuilder, MRI, AssignFn) {}
  234. Register getStackAddress(uint64_t Size, int64_t Offset,
  235. MachinePointerInfo &MPO) override {
  236. assert((Size == 1 || Size == 2 || Size == 4 || Size == 8) &&
  237. "Unsupported size");
  238. auto &MFI = MIRBuilder.getMF().getFrameInfo();
  239. int FI = MFI.CreateFixedObject(Size, Offset, true);
  240. MPO = MachinePointerInfo::getFixedStack(MIRBuilder.getMF(), FI);
  241. return MIRBuilder.buildFrameIndex(LLT::pointer(MPO.getAddrSpace(), 32), FI)
  242. .getReg(0);
  243. }
  244. void assignValueToAddress(Register ValVReg, Register Addr, uint64_t Size,
  245. MachinePointerInfo &MPO, CCValAssign &VA) override {
  246. assert((Size == 1 || Size == 2 || Size == 4 || Size == 8) &&
  247. "Unsupported size");
  248. if (VA.getLocInfo() == CCValAssign::SExt ||
  249. VA.getLocInfo() == CCValAssign::ZExt) {
  250. // If the value is zero- or sign-extended, its size becomes 4 bytes, so
  251. // that's what we should load.
  252. Size = 4;
  253. assert(MRI.getType(ValVReg).isScalar() && "Only scalars supported atm");
  254. auto LoadVReg = buildLoad(LLT::scalar(32), Addr, Size, MPO);
  255. MIRBuilder.buildTrunc(ValVReg, LoadVReg);
  256. } else {
  257. // If the value is not extended, a simple load will suffice.
  258. buildLoad(ValVReg, Addr, Size, MPO);
  259. }
  260. }
  261. MachineInstrBuilder buildLoad(const DstOp &Res, Register Addr, uint64_t Size,
  262. MachinePointerInfo &MPO) {
  263. MachineFunction &MF = MIRBuilder.getMF();
  264. auto MMO = MF.getMachineMemOperand(MPO, MachineMemOperand::MOLoad, Size,
  265. inferAlignFromPtrInfo(MF, MPO));
  266. return MIRBuilder.buildLoad(Res, Addr, *MMO);
  267. }
  268. void assignValueToReg(Register ValVReg, Register PhysReg,
  269. CCValAssign &VA) override {
  270. assert(VA.isRegLoc() && "Value shouldn't be assigned to reg");
  271. assert(VA.getLocReg() == PhysReg && "Assigning to the wrong reg?");
  272. uint64_t ValSize = VA.getValVT().getFixedSizeInBits();
  273. uint64_t LocSize = VA.getLocVT().getFixedSizeInBits();
  274. assert(ValSize <= 64 && "Unsupported value size");
  275. assert(LocSize <= 64 && "Unsupported location size");
  276. markPhysRegUsed(PhysReg);
  277. if (ValSize == LocSize) {
  278. MIRBuilder.buildCopy(ValVReg, PhysReg);
  279. } else {
  280. assert(ValSize < LocSize && "Extensions not supported");
  281. // We cannot create a truncating copy, nor a trunc of a physical register.
  282. // Therefore, we need to copy the content of the physical register into a
  283. // virtual one and then truncate that.
  284. auto PhysRegToVReg = MIRBuilder.buildCopy(LLT::scalar(LocSize), PhysReg);
  285. MIRBuilder.buildTrunc(ValVReg, PhysRegToVReg);
  286. }
  287. }
  288. unsigned assignCustomValue(const ARMCallLowering::ArgInfo &Arg,
  289. ArrayRef<CCValAssign> VAs) override {
  290. assert(Arg.Regs.size() == 1 && "Can't handle multple regs yet");
  291. CCValAssign VA = VAs[0];
  292. assert(VA.needsCustom() && "Value doesn't need custom handling");
  293. // Custom lowering for other types, such as f16, is currently not supported
  294. if (VA.getValVT() != MVT::f64)
  295. return 0;
  296. CCValAssign NextVA = VAs[1];
  297. assert(NextVA.needsCustom() && "Value doesn't need custom handling");
  298. assert(NextVA.getValVT() == MVT::f64 && "Unsupported type");
  299. assert(VA.getValNo() == NextVA.getValNo() &&
  300. "Values belong to different arguments");
  301. assert(VA.isRegLoc() && "Value should be in reg");
  302. assert(NextVA.isRegLoc() && "Value should be in reg");
  303. Register NewRegs[] = {MRI.createGenericVirtualRegister(LLT::scalar(32)),
  304. MRI.createGenericVirtualRegister(LLT::scalar(32))};
  305. assignValueToReg(NewRegs[0], VA.getLocReg(), VA);
  306. assignValueToReg(NewRegs[1], NextVA.getLocReg(), NextVA);
  307. bool IsLittle = MIRBuilder.getMF().getSubtarget<ARMSubtarget>().isLittle();
  308. if (!IsLittle)
  309. std::swap(NewRegs[0], NewRegs[1]);
  310. MIRBuilder.buildMerge(Arg.Regs[0], NewRegs);
  311. return 1;
  312. }
  313. /// Marking a physical register as used is different between formal
  314. /// parameters, where it's a basic block live-in, and call returns, where it's
  315. /// an implicit-def of the call instruction.
  316. virtual void markPhysRegUsed(unsigned PhysReg) = 0;
  317. };
  318. struct FormalArgHandler : public ARMIncomingValueHandler {
  319. FormalArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,
  320. CCAssignFn AssignFn)
  321. : ARMIncomingValueHandler(MIRBuilder, MRI, AssignFn) {}
  322. void markPhysRegUsed(unsigned PhysReg) override {
  323. MIRBuilder.getMRI()->addLiveIn(PhysReg);
  324. MIRBuilder.getMBB().addLiveIn(PhysReg);
  325. }
  326. };
  327. } // end anonymous namespace
  328. bool ARMCallLowering::lowerFormalArguments(MachineIRBuilder &MIRBuilder,
  329. const Function &F,
  330. ArrayRef<ArrayRef<Register>> VRegs,
  331. FunctionLoweringInfo &FLI) const {
  332. auto &TLI = *getTLI<ARMTargetLowering>();
  333. auto Subtarget = TLI.getSubtarget();
  334. if (Subtarget->isThumb1Only())
  335. return false;
  336. // Quick exit if there aren't any args
  337. if (F.arg_empty())
  338. return true;
  339. if (F.isVarArg())
  340. return false;
  341. auto &MF = MIRBuilder.getMF();
  342. auto &MBB = MIRBuilder.getMBB();
  343. auto DL = MF.getDataLayout();
  344. for (auto &Arg : F.args()) {
  345. if (!isSupportedType(DL, TLI, Arg.getType()))
  346. return false;
  347. if (Arg.hasPassPointeeByValueCopyAttr())
  348. return false;
  349. }
  350. CCAssignFn *AssignFn =
  351. TLI.CCAssignFnForCall(F.getCallingConv(), F.isVarArg());
  352. FormalArgHandler ArgHandler(MIRBuilder, MIRBuilder.getMF().getRegInfo(),
  353. AssignFn);
  354. SmallVector<ArgInfo, 8> SplitArgInfos;
  355. unsigned Idx = 0;
  356. for (auto &Arg : F.args()) {
  357. ArgInfo OrigArgInfo(VRegs[Idx], Arg.getType());
  358. setArgFlags(OrigArgInfo, Idx + AttributeList::FirstArgIndex, DL, F);
  359. splitToValueTypes(OrigArgInfo, SplitArgInfos, MF);
  360. Idx++;
  361. }
  362. if (!MBB.empty())
  363. MIRBuilder.setInstr(*MBB.begin());
  364. if (!handleAssignments(MIRBuilder, SplitArgInfos, ArgHandler))
  365. return false;
  366. // Move back to the end of the basic block.
  367. MIRBuilder.setMBB(MBB);
  368. return true;
  369. }
  370. namespace {
  371. struct CallReturnHandler : public ARMIncomingValueHandler {
  372. CallReturnHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,
  373. MachineInstrBuilder MIB, CCAssignFn *AssignFn)
  374. : ARMIncomingValueHandler(MIRBuilder, MRI, AssignFn), MIB(MIB) {}
  375. void markPhysRegUsed(unsigned PhysReg) override {
  376. MIB.addDef(PhysReg, RegState::Implicit);
  377. }
  378. MachineInstrBuilder MIB;
  379. };
  380. // FIXME: This should move to the ARMSubtarget when it supports all the opcodes.
  381. unsigned getCallOpcode(const MachineFunction &MF, const ARMSubtarget &STI,
  382. bool isDirect) {
  383. if (isDirect)
  384. return STI.isThumb() ? ARM::tBL : ARM::BL;
  385. if (STI.isThumb())
  386. return gettBLXrOpcode(MF);
  387. if (STI.hasV5TOps())
  388. return getBLXOpcode(MF);
  389. if (STI.hasV4TOps())
  390. return ARM::BX_CALL;
  391. return ARM::BMOVPCRX_CALL;
  392. }
  393. } // end anonymous namespace
  394. bool ARMCallLowering::lowerCall(MachineIRBuilder &MIRBuilder, CallLoweringInfo &Info) const {
  395. MachineFunction &MF = MIRBuilder.getMF();
  396. const auto &TLI = *getTLI<ARMTargetLowering>();
  397. const auto &DL = MF.getDataLayout();
  398. const auto &STI = MF.getSubtarget<ARMSubtarget>();
  399. const TargetRegisterInfo *TRI = STI.getRegisterInfo();
  400. MachineRegisterInfo &MRI = MF.getRegInfo();
  401. if (STI.genLongCalls())
  402. return false;
  403. if (STI.isThumb1Only())
  404. return false;
  405. auto CallSeqStart = MIRBuilder.buildInstr(ARM::ADJCALLSTACKDOWN);
  406. // Create the call instruction so we can add the implicit uses of arg
  407. // registers, but don't insert it yet.
  408. bool IsDirect = !Info.Callee.isReg();
  409. auto CallOpcode = getCallOpcode(MF, STI, IsDirect);
  410. auto MIB = MIRBuilder.buildInstrNoInsert(CallOpcode);
  411. bool IsThumb = STI.isThumb();
  412. if (IsThumb)
  413. MIB.add(predOps(ARMCC::AL));
  414. MIB.add(Info.Callee);
  415. if (!IsDirect) {
  416. auto CalleeReg = Info.Callee.getReg();
  417. if (CalleeReg && !Register::isPhysicalRegister(CalleeReg)) {
  418. unsigned CalleeIdx = IsThumb ? 2 : 0;
  419. MIB->getOperand(CalleeIdx).setReg(constrainOperandRegClass(
  420. MF, *TRI, MRI, *STI.getInstrInfo(), *STI.getRegBankInfo(),
  421. *MIB.getInstr(), MIB->getDesc(), Info.Callee, CalleeIdx));
  422. }
  423. }
  424. MIB.addRegMask(TRI->getCallPreservedMask(MF, Info.CallConv));
  425. SmallVector<ArgInfo, 8> ArgInfos;
  426. for (auto Arg : Info.OrigArgs) {
  427. if (!isSupportedType(DL, TLI, Arg.Ty))
  428. return false;
  429. if (Arg.Flags[0].isByVal())
  430. return false;
  431. splitToValueTypes(Arg, ArgInfos, MF);
  432. }
  433. auto ArgAssignFn = TLI.CCAssignFnForCall(Info.CallConv, Info.IsVarArg);
  434. ARMOutgoingValueHandler ArgHandler(MIRBuilder, MRI, MIB, ArgAssignFn);
  435. if (!handleAssignments(MIRBuilder, ArgInfos, ArgHandler))
  436. return false;
  437. // Now we can add the actual call instruction to the correct basic block.
  438. MIRBuilder.insertInstr(MIB);
  439. if (!Info.OrigRet.Ty->isVoidTy()) {
  440. if (!isSupportedType(DL, TLI, Info.OrigRet.Ty))
  441. return false;
  442. ArgInfos.clear();
  443. splitToValueTypes(Info.OrigRet, ArgInfos, MF);
  444. auto RetAssignFn = TLI.CCAssignFnForReturn(Info.CallConv, Info.IsVarArg);
  445. CallReturnHandler RetHandler(MIRBuilder, MRI, MIB, RetAssignFn);
  446. if (!handleAssignments(MIRBuilder, ArgInfos, RetHandler))
  447. return false;
  448. }
  449. // We now know the size of the stack - update the ADJCALLSTACKDOWN
  450. // accordingly.
  451. CallSeqStart.addImm(ArgHandler.StackSize).addImm(0).add(predOps(ARMCC::AL));
  452. MIRBuilder.buildInstr(ARM::ADJCALLSTACKUP)
  453. .addImm(ArgHandler.StackSize)
  454. .addImm(0)
  455. .add(predOps(ARMCC::AL));
  456. return true;
  457. }