ARMExpandPseudoInsts.cpp revision c76c59840b7a4491afdcd2f35483f8d6e5ab533a
1//===-- ARMExpandPseudoInsts.cpp - Expand pseudo instructions -----*- C++ -*-=// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9// 10// This file contains a pass that expands pseudo instructions into target 11// instructions to allow proper scheduling, if-conversion, and other late 12// optimizations. This pass should be run after register allocation but before 13// the post-regalloc scheduling pass. 14// 15//===----------------------------------------------------------------------===// 16 17#define DEBUG_TYPE "arm-pseudo" 18#include "ARM.h" 19#include "ARMAddressingModes.h" 20#include "ARMBaseInstrInfo.h" 21#include "ARMBaseRegisterInfo.h" 22#include "ARMMachineFunctionInfo.h" 23#include "ARMRegisterInfo.h" 24#include "llvm/CodeGen/MachineFrameInfo.h" 25#include "llvm/CodeGen/MachineFunctionPass.h" 26#include "llvm/CodeGen/MachineInstrBuilder.h" 27#include "llvm/Target/TargetFrameInfo.h" 28#include "llvm/Target/TargetRegisterInfo.h" 29#include "llvm/Support/raw_ostream.h" // FIXME: for debug only. remove! 
30using namespace llvm; 31 32namespace { 33 class ARMExpandPseudo : public MachineFunctionPass { 34 public: 35 static char ID; 36 ARMExpandPseudo() : MachineFunctionPass(ID) {} 37 38 const ARMBaseInstrInfo *TII; 39 const TargetRegisterInfo *TRI; 40 const ARMSubtarget *STI; 41 42 virtual bool runOnMachineFunction(MachineFunction &Fn); 43 44 virtual const char *getPassName() const { 45 return "ARM pseudo instruction expansion pass"; 46 } 47 48 private: 49 void TransferImpOps(MachineInstr &OldMI, 50 MachineInstrBuilder &UseMI, MachineInstrBuilder &DefMI); 51 bool ExpandMBB(MachineBasicBlock &MBB); 52 void ExpandVLD(MachineBasicBlock::iterator &MBBI); 53 void ExpandVST(MachineBasicBlock::iterator &MBBI); 54 void ExpandLaneOp(MachineBasicBlock::iterator &MBBI); 55 void ExpandVTBL(MachineBasicBlock::iterator &MBBI, 56 unsigned Opc, bool IsExt, unsigned NumRegs); 57 }; 58 char ARMExpandPseudo::ID = 0; 59} 60 61/// TransferImpOps - Transfer implicit operands on the pseudo instruction to 62/// the instructions created from the expansion. 63void ARMExpandPseudo::TransferImpOps(MachineInstr &OldMI, 64 MachineInstrBuilder &UseMI, 65 MachineInstrBuilder &DefMI) { 66 const TargetInstrDesc &Desc = OldMI.getDesc(); 67 for (unsigned i = Desc.getNumOperands(), e = OldMI.getNumOperands(); 68 i != e; ++i) { 69 const MachineOperand &MO = OldMI.getOperand(i); 70 assert(MO.isReg() && MO.getReg()); 71 if (MO.isUse()) 72 UseMI.addOperand(MO); 73 else 74 DefMI.addOperand(MO); 75 } 76} 77 78namespace { 79 // Constants for register spacing in NEON load/store instructions. 80 // For quad-register load-lane and store-lane pseudo instructors, the 81 // spacing is initially assumed to be EvenDblSpc, and that is changed to 82 // OddDblSpc depending on the lane number operand. 83 enum NEONRegSpacing { 84 SingleSpc, 85 EvenDblSpc, 86 OddDblSpc 87 }; 88 89 // Entries for NEON load/store information table. The table is sorted by 90 // PseudoOpc for fast binary-search lookups. 
struct NEONLdStTableEntry {
  unsigned PseudoOpc;        // opcode of the pseudo instruction (lookup key)
  unsigned RealOpc;          // opcode of the instruction it expands to
  bool IsLoad;               // true for VLD* entries, false for VST* entries
  bool HasWriteBack;         // true for the _UPD forms, which carry extra
                             // write-back / am6offset operands
  NEONRegSpacing RegSpacing; // which D subregisters of the super-register
                             // are used (see GetDSubRegs)
  unsigned char NumRegs; // D registers loaded or stored
  unsigned char RegElts; // elements per D register; used for lane ops

  // Comparison methods for binary search of the table.
  // Entry-vs-entry ordering is used by the debug-only sortedness check.
  bool operator<(const NEONLdStTableEntry &TE) const {
    return PseudoOpc < TE.PseudoOpc;
  }
  // Entry-vs-opcode ordering, as needed by std::lower_bound with an opcode
  // as the search value.
  friend bool operator<(const NEONLdStTableEntry &TE, unsigned PseudoOpc) {
    return TE.PseudoOpc < PseudoOpc;
  }
  // Opcode-vs-entry ordering; marked unused because not every standard
  // library implementation references it.
  friend bool LLVM_ATTRIBUTE_UNUSED operator<(unsigned PseudoOpc,
                                              const NEONLdStTableEntry &TE) {
    return PseudoOpc < TE.PseudoOpc;
  }
};
}

// Table describing every NEON load/store pseudo instruction handled by this
// pass.  Columns: PseudoOpc, RealOpc, IsLoad, HasWriteBack, RegSpacing,
// NumRegs, RegElts.  The entries MUST stay sorted by the numeric value of
// PseudoOpc: LookupNEONLdSt binary-searches this array and asserts the
// ordering in debug builds.
static const NEONLdStTableEntry NEONLdStTable[] = {
{ ARM::VLD1DUPq16Pseudo, ARM::VLD1DUPq16, true, false, SingleSpc, 2, 4},
{ ARM::VLD1DUPq16Pseudo_UPD, ARM::VLD1DUPq16_UPD, true, true, SingleSpc, 2, 4},
{ ARM::VLD1DUPq32Pseudo, ARM::VLD1DUPq32, true, false, SingleSpc, 2, 2},
{ ARM::VLD1DUPq32Pseudo_UPD, ARM::VLD1DUPq32_UPD, true, true, SingleSpc, 2, 2},
{ ARM::VLD1DUPq8Pseudo, ARM::VLD1DUPq8, true, false, SingleSpc, 2, 8},
{ ARM::VLD1DUPq8Pseudo_UPD, ARM::VLD1DUPq8_UPD, true, true, SingleSpc, 2, 8},

{ ARM::VLD1LNq16Pseudo, ARM::VLD1LNd16, true, false, EvenDblSpc, 1, 4 },
{ ARM::VLD1LNq16Pseudo_UPD, ARM::VLD1LNd16_UPD, true, true, EvenDblSpc, 1, 4 },
{ ARM::VLD1LNq32Pseudo, ARM::VLD1LNd32, true, false, EvenDblSpc, 1, 2 },
{ ARM::VLD1LNq32Pseudo_UPD, ARM::VLD1LNd32_UPD, true, true, EvenDblSpc, 1, 2 },
{ ARM::VLD1LNq8Pseudo, ARM::VLD1LNd8, true, false, EvenDblSpc, 1, 8 },
{ ARM::VLD1LNq8Pseudo_UPD, ARM::VLD1LNd8_UPD, true, true, EvenDblSpc, 1, 8 },

{ ARM::VLD1d64QPseudo, ARM::VLD1d64Q, true, false, SingleSpc, 4, 1 },
{ ARM::VLD1d64QPseudo_UPD, ARM::VLD1d64Q_UPD, true, true, SingleSpc, 4, 1 },
{ ARM::VLD1d64TPseudo, ARM::VLD1d64T, true, false, SingleSpc, 3, 1 },
{ ARM::VLD1d64TPseudo_UPD, ARM::VLD1d64T_UPD, true, true, SingleSpc, 3, 1 },

{ ARM::VLD1q16Pseudo, ARM::VLD1q16, true, false, SingleSpc, 2, 4 },
{ ARM::VLD1q16Pseudo_UPD, ARM::VLD1q16_UPD, true, true, SingleSpc, 2, 4 },
{ ARM::VLD1q32Pseudo, ARM::VLD1q32, true, false, SingleSpc, 2, 2 },
{ ARM::VLD1q32Pseudo_UPD, ARM::VLD1q32_UPD, true, true, SingleSpc, 2, 2 },
{ ARM::VLD1q64Pseudo, ARM::VLD1q64, true, false, SingleSpc, 2, 1 },
{ ARM::VLD1q64Pseudo_UPD, ARM::VLD1q64_UPD, true, true, SingleSpc, 2, 1 },
{ ARM::VLD1q8Pseudo, ARM::VLD1q8, true, false, SingleSpc, 2, 8 },
{ ARM::VLD1q8Pseudo_UPD, ARM::VLD1q8_UPD, true, true, SingleSpc, 2, 8 },

{ ARM::VLD2DUPd16Pseudo, ARM::VLD2DUPd16, true, false, SingleSpc, 2, 4},
{ ARM::VLD2DUPd16Pseudo_UPD, ARM::VLD2DUPd16_UPD, true, true, SingleSpc, 2, 4},
{ ARM::VLD2DUPd32Pseudo, ARM::VLD2DUPd32, true, false, SingleSpc, 2, 2},
{ ARM::VLD2DUPd32Pseudo_UPD, ARM::VLD2DUPd32_UPD, true, true, SingleSpc, 2, 2},
{ ARM::VLD2DUPd8Pseudo, ARM::VLD2DUPd8, true, false, SingleSpc, 2, 8},
{ ARM::VLD2DUPd8Pseudo_UPD, ARM::VLD2DUPd8_UPD, true, true, SingleSpc, 2, 8},

{ ARM::VLD2LNd16Pseudo, ARM::VLD2LNd16, true, false, SingleSpc, 2, 4 },
{ ARM::VLD2LNd16Pseudo_UPD, ARM::VLD2LNd16_UPD, true, true, SingleSpc, 2, 4 },
{ ARM::VLD2LNd32Pseudo, ARM::VLD2LNd32, true, false, SingleSpc, 2, 2 },
{ ARM::VLD2LNd32Pseudo_UPD, ARM::VLD2LNd32_UPD, true, true, SingleSpc, 2, 2 },
{ ARM::VLD2LNd8Pseudo, ARM::VLD2LNd8, true, false, SingleSpc, 2, 8 },
{ ARM::VLD2LNd8Pseudo_UPD, ARM::VLD2LNd8_UPD, true, true, SingleSpc, 2, 8 },
{ ARM::VLD2LNq16Pseudo, ARM::VLD2LNq16, true, false, EvenDblSpc, 2, 4 },
{ ARM::VLD2LNq16Pseudo_UPD, ARM::VLD2LNq16_UPD, true, true, EvenDblSpc, 2, 4 },
{ ARM::VLD2LNq32Pseudo, ARM::VLD2LNq32, true, false, EvenDblSpc, 2, 2 },
{ ARM::VLD2LNq32Pseudo_UPD, ARM::VLD2LNq32_UPD, true, true, EvenDblSpc, 2, 2 },

{ ARM::VLD2d16Pseudo, ARM::VLD2d16, true, false, SingleSpc, 2, 4 },
{ ARM::VLD2d16Pseudo_UPD, ARM::VLD2d16_UPD, true, true, SingleSpc, 2, 4 },
{ ARM::VLD2d32Pseudo, ARM::VLD2d32, true, false, SingleSpc, 2, 2 },
{ ARM::VLD2d32Pseudo_UPD, ARM::VLD2d32_UPD, true, true, SingleSpc, 2, 2 },
{ ARM::VLD2d8Pseudo, ARM::VLD2d8, true, false, SingleSpc, 2, 8 },
{ ARM::VLD2d8Pseudo_UPD, ARM::VLD2d8_UPD, true, true, SingleSpc, 2, 8 },

{ ARM::VLD2q16Pseudo, ARM::VLD2q16, true, false, SingleSpc, 4, 4 },
{ ARM::VLD2q16Pseudo_UPD, ARM::VLD2q16_UPD, true, true, SingleSpc, 4, 4 },
{ ARM::VLD2q32Pseudo, ARM::VLD2q32, true, false, SingleSpc, 4, 2 },
{ ARM::VLD2q32Pseudo_UPD, ARM::VLD2q32_UPD, true, true, SingleSpc, 4, 2 },
{ ARM::VLD2q8Pseudo, ARM::VLD2q8, true, false, SingleSpc, 4, 8 },
{ ARM::VLD2q8Pseudo_UPD, ARM::VLD2q8_UPD, true, true, SingleSpc, 4, 8 },

{ ARM::VLD3DUPd16Pseudo, ARM::VLD3DUPd16, true, false, SingleSpc, 3, 4},
{ ARM::VLD3DUPd16Pseudo_UPD, ARM::VLD3DUPd16_UPD, true, true, SingleSpc, 3, 4},
{ ARM::VLD3DUPd32Pseudo, ARM::VLD3DUPd32, true, false, SingleSpc, 3, 2},
{ ARM::VLD3DUPd32Pseudo_UPD, ARM::VLD3DUPd32_UPD, true, true, SingleSpc, 3, 2},
{ ARM::VLD3DUPd8Pseudo, ARM::VLD3DUPd8, true, false, SingleSpc, 3, 8},
{ ARM::VLD3DUPd8Pseudo_UPD, ARM::VLD3DUPd8_UPD, true, true, SingleSpc, 3, 8},

{ ARM::VLD3LNd16Pseudo, ARM::VLD3LNd16, true, false, SingleSpc, 3, 4 },
{ ARM::VLD3LNd16Pseudo_UPD, ARM::VLD3LNd16_UPD, true, true, SingleSpc, 3, 4 },
{ ARM::VLD3LNd32Pseudo, ARM::VLD3LNd32, true, false, SingleSpc, 3, 2 },
{ ARM::VLD3LNd32Pseudo_UPD, ARM::VLD3LNd32_UPD, true, true, SingleSpc, 3, 2 },
{ ARM::VLD3LNd8Pseudo, ARM::VLD3LNd8, true, false, SingleSpc, 3, 8 },
{ ARM::VLD3LNd8Pseudo_UPD, ARM::VLD3LNd8_UPD, true, true, SingleSpc, 3, 8 },
{ ARM::VLD3LNq16Pseudo, ARM::VLD3LNq16, true, false, EvenDblSpc, 3, 4 },
{ ARM::VLD3LNq16Pseudo_UPD, ARM::VLD3LNq16_UPD, true, true, EvenDblSpc, 3, 4 },
{ ARM::VLD3LNq32Pseudo, ARM::VLD3LNq32, true, false, EvenDblSpc, 3, 2 },
{ ARM::VLD3LNq32Pseudo_UPD, ARM::VLD3LNq32_UPD, true, true, EvenDblSpc, 3, 2 },

{ ARM::VLD3d16Pseudo, ARM::VLD3d16, true, false, SingleSpc, 3, 4 },
{ ARM::VLD3d16Pseudo_UPD, ARM::VLD3d16_UPD, true, true, SingleSpc, 3, 4 },
{ ARM::VLD3d32Pseudo, ARM::VLD3d32, true, false, SingleSpc, 3, 2 },
{ ARM::VLD3d32Pseudo_UPD, ARM::VLD3d32_UPD, true, true, SingleSpc, 3, 2 },
{ ARM::VLD3d8Pseudo, ARM::VLD3d8, true, false, SingleSpc, 3, 8 },
{ ARM::VLD3d8Pseudo_UPD, ARM::VLD3d8_UPD, true, true, SingleSpc, 3, 8 },

{ ARM::VLD3q16Pseudo_UPD, ARM::VLD3q16_UPD, true, true, EvenDblSpc, 3, 4 },
{ ARM::VLD3q16oddPseudo_UPD, ARM::VLD3q16_UPD, true, true, OddDblSpc, 3, 4 },
{ ARM::VLD3q32Pseudo_UPD, ARM::VLD3q32_UPD, true, true, EvenDblSpc, 3, 2 },
{ ARM::VLD3q32oddPseudo_UPD, ARM::VLD3q32_UPD, true, true, OddDblSpc, 3, 2 },
{ ARM::VLD3q8Pseudo_UPD, ARM::VLD3q8_UPD, true, true, EvenDblSpc, 3, 8 },
{ ARM::VLD3q8oddPseudo_UPD, ARM::VLD3q8_UPD, true, true, OddDblSpc, 3, 8 },

{ ARM::VLD4DUPd16Pseudo, ARM::VLD4DUPd16, true, false, SingleSpc, 4, 4},
{ ARM::VLD4DUPd16Pseudo_UPD, ARM::VLD4DUPd16_UPD, true, true, SingleSpc, 4, 4},
{ ARM::VLD4DUPd32Pseudo, ARM::VLD4DUPd32, true, false, SingleSpc, 4, 2},
{ ARM::VLD4DUPd32Pseudo_UPD, ARM::VLD4DUPd32_UPD, true, true, SingleSpc, 4, 2},
{ ARM::VLD4DUPd8Pseudo, ARM::VLD4DUPd8, true, false, SingleSpc, 4, 8},
{ ARM::VLD4DUPd8Pseudo_UPD, ARM::VLD4DUPd8_UPD, true, true, SingleSpc, 4, 8},

{ ARM::VLD4LNd16Pseudo, ARM::VLD4LNd16, true, false, SingleSpc, 4, 4 },
{ ARM::VLD4LNd16Pseudo_UPD, ARM::VLD4LNd16_UPD, true, true, SingleSpc, 4, 4 },
{ ARM::VLD4LNd32Pseudo, ARM::VLD4LNd32, true, false, SingleSpc, 4, 2 },
{ ARM::VLD4LNd32Pseudo_UPD, ARM::VLD4LNd32_UPD, true, true, SingleSpc, 4, 2 },
{ ARM::VLD4LNd8Pseudo, ARM::VLD4LNd8, true, false, SingleSpc, 4, 8 },
{ ARM::VLD4LNd8Pseudo_UPD, ARM::VLD4LNd8_UPD, true, true, SingleSpc, 4, 8 },
{ ARM::VLD4LNq16Pseudo, ARM::VLD4LNq16, true, false, EvenDblSpc, 4, 4 },
{ ARM::VLD4LNq16Pseudo_UPD, ARM::VLD4LNq16_UPD, true, true, EvenDblSpc, 4, 4 },
{ ARM::VLD4LNq32Pseudo, ARM::VLD4LNq32, true, false, EvenDblSpc, 4, 2 },
{ ARM::VLD4LNq32Pseudo_UPD, ARM::VLD4LNq32_UPD, true, true, EvenDblSpc, 4, 2 },

{ ARM::VLD4d16Pseudo, ARM::VLD4d16, true, false, SingleSpc, 4, 4 },
{ ARM::VLD4d16Pseudo_UPD, ARM::VLD4d16_UPD, true, true, SingleSpc, 4, 4 },
{ ARM::VLD4d32Pseudo, ARM::VLD4d32, true, false, SingleSpc, 4, 2 },
{ ARM::VLD4d32Pseudo_UPD, ARM::VLD4d32_UPD, true, true, SingleSpc, 4, 2 },
{ ARM::VLD4d8Pseudo, ARM::VLD4d8, true, false, SingleSpc, 4, 8 },
{ ARM::VLD4d8Pseudo_UPD, ARM::VLD4d8_UPD, true, true, SingleSpc, 4, 8 },

{ ARM::VLD4q16Pseudo_UPD, ARM::VLD4q16_UPD, true, true, EvenDblSpc, 4, 4 },
{ ARM::VLD4q16oddPseudo_UPD, ARM::VLD4q16_UPD, true, true, OddDblSpc, 4, 4 },
{ ARM::VLD4q32Pseudo_UPD, ARM::VLD4q32_UPD, true, true, EvenDblSpc, 4, 2 },
{ ARM::VLD4q32oddPseudo_UPD, ARM::VLD4q32_UPD, true, true, OddDblSpc, 4, 2 },
{ ARM::VLD4q8Pseudo_UPD, ARM::VLD4q8_UPD, true, true, EvenDblSpc, 4, 8 },
{ ARM::VLD4q8oddPseudo_UPD, ARM::VLD4q8_UPD, true, true, OddDblSpc, 4, 8 },

{ ARM::VST1LNq16Pseudo, ARM::VST1LNd16, false, false, EvenDblSpc, 1, 4 },
{ ARM::VST1LNq16Pseudo_UPD, ARM::VST1LNd16_UPD,false, true, EvenDblSpc, 1, 4 },
{ ARM::VST1LNq32Pseudo, ARM::VST1LNd32, false, false, EvenDblSpc, 1, 2 },
{ ARM::VST1LNq32Pseudo_UPD, ARM::VST1LNd32_UPD,false, true, EvenDblSpc, 1, 2 },
{ ARM::VST1LNq8Pseudo, ARM::VST1LNd8, false, false, EvenDblSpc, 1, 8 },
{ ARM::VST1LNq8Pseudo_UPD, ARM::VST1LNd8_UPD, false, true, EvenDblSpc, 1, 8 },

{ ARM::VST1d64QPseudo, ARM::VST1d64Q, false, false, SingleSpc, 4, 1 },
{ ARM::VST1d64QPseudo_UPD, ARM::VST1d64Q_UPD, false, true, SingleSpc, 4, 1 },
{ ARM::VST1d64TPseudo, ARM::VST1d64T, false, false, SingleSpc, 3, 1 },
{ ARM::VST1d64TPseudo_UPD, ARM::VST1d64T_UPD, false, true, SingleSpc, 3, 1 },

{ ARM::VST1q16Pseudo, ARM::VST1q16, false, false, SingleSpc, 2, 4 },
{ ARM::VST1q16Pseudo_UPD, ARM::VST1q16_UPD, false, true, SingleSpc, 2, 4 },
{ ARM::VST1q32Pseudo, ARM::VST1q32, false, false, SingleSpc, 2, 2 },
{ ARM::VST1q32Pseudo_UPD, ARM::VST1q32_UPD, false, true, SingleSpc, 2, 2 },
{ ARM::VST1q64Pseudo, ARM::VST1q64, false, false, SingleSpc, 2, 1 },
{ ARM::VST1q64Pseudo_UPD, ARM::VST1q64_UPD, false, true, SingleSpc, 2, 1 },
{ ARM::VST1q8Pseudo, ARM::VST1q8, false, false, SingleSpc, 2, 8 },
{ ARM::VST1q8Pseudo_UPD, ARM::VST1q8_UPD, false, true, SingleSpc, 2, 8 },

{ ARM::VST2LNd16Pseudo, ARM::VST2LNd16, false, false, SingleSpc, 2, 4 },
{ ARM::VST2LNd16Pseudo_UPD, ARM::VST2LNd16_UPD, false, true, SingleSpc, 2, 4 },
{ ARM::VST2LNd32Pseudo, ARM::VST2LNd32, false, false, SingleSpc, 2, 2 },
{ ARM::VST2LNd32Pseudo_UPD, ARM::VST2LNd32_UPD, false, true, SingleSpc, 2, 2 },
{ ARM::VST2LNd8Pseudo, ARM::VST2LNd8, false, false, SingleSpc, 2, 8 },
{ ARM::VST2LNd8Pseudo_UPD, ARM::VST2LNd8_UPD, false, true, SingleSpc, 2, 8 },
{ ARM::VST2LNq16Pseudo, ARM::VST2LNq16, false, false, EvenDblSpc, 2, 4},
{ ARM::VST2LNq16Pseudo_UPD, ARM::VST2LNq16_UPD, false, true, EvenDblSpc, 2, 4},
{ ARM::VST2LNq32Pseudo, ARM::VST2LNq32, false, false, EvenDblSpc, 2, 2},
{ ARM::VST2LNq32Pseudo_UPD, ARM::VST2LNq32_UPD, false, true, EvenDblSpc, 2, 2},

{ ARM::VST2d16Pseudo, ARM::VST2d16, false, false, SingleSpc, 2, 4 },
{ ARM::VST2d16Pseudo_UPD, ARM::VST2d16_UPD, false, true, SingleSpc, 2, 4 },
{ ARM::VST2d32Pseudo, ARM::VST2d32, false, false, SingleSpc, 2, 2 },
{ ARM::VST2d32Pseudo_UPD, ARM::VST2d32_UPD, false, true, SingleSpc, 2, 2 },
{ ARM::VST2d8Pseudo, ARM::VST2d8, false, false, SingleSpc, 2, 8 },
{ ARM::VST2d8Pseudo_UPD, ARM::VST2d8_UPD, false, true, SingleSpc, 2, 8 },

{ ARM::VST2q16Pseudo, ARM::VST2q16, false, false, SingleSpc, 4, 4 },
{ ARM::VST2q16Pseudo_UPD, ARM::VST2q16_UPD, false, true, SingleSpc, 4, 4 },
{ ARM::VST2q32Pseudo, ARM::VST2q32, false, false, SingleSpc, 4, 2 },
{ ARM::VST2q32Pseudo_UPD, ARM::VST2q32_UPD, false, true, SingleSpc, 4, 2 },
{ ARM::VST2q8Pseudo, ARM::VST2q8, false, false, SingleSpc, 4, 8 },
{ ARM::VST2q8Pseudo_UPD, ARM::VST2q8_UPD, false, true, SingleSpc, 4, 8 },

{ ARM::VST3LNd16Pseudo, ARM::VST3LNd16, false, false, SingleSpc, 3, 4 },
{ ARM::VST3LNd16Pseudo_UPD, ARM::VST3LNd16_UPD, false, true, SingleSpc, 3, 4 },
{ ARM::VST3LNd32Pseudo, ARM::VST3LNd32, false, false, SingleSpc, 3, 2 },
{ ARM::VST3LNd32Pseudo_UPD, ARM::VST3LNd32_UPD, false, true, SingleSpc, 3, 2 },
{ ARM::VST3LNd8Pseudo, ARM::VST3LNd8, false, false, SingleSpc, 3, 8 },
{ ARM::VST3LNd8Pseudo_UPD, ARM::VST3LNd8_UPD, false, true, SingleSpc, 3, 8 },
{ ARM::VST3LNq16Pseudo, ARM::VST3LNq16, false, false, EvenDblSpc, 3, 4},
{ ARM::VST3LNq16Pseudo_UPD, ARM::VST3LNq16_UPD, false, true, EvenDblSpc, 3, 4},
{ ARM::VST3LNq32Pseudo, ARM::VST3LNq32, false, false, EvenDblSpc, 3, 2},
{ ARM::VST3LNq32Pseudo_UPD, ARM::VST3LNq32_UPD, false, true, EvenDblSpc, 3, 2},

{ ARM::VST3d16Pseudo, ARM::VST3d16, false, false, SingleSpc, 3, 4 },
{ ARM::VST3d16Pseudo_UPD, ARM::VST3d16_UPD, false, true, SingleSpc, 3, 4 },
{ ARM::VST3d32Pseudo, ARM::VST3d32, false, false, SingleSpc, 3, 2 },
{ ARM::VST3d32Pseudo_UPD, ARM::VST3d32_UPD, false, true, SingleSpc, 3, 2 },
{ ARM::VST3d8Pseudo, ARM::VST3d8, false, false, SingleSpc, 3, 8 },
{ ARM::VST3d8Pseudo_UPD, ARM::VST3d8_UPD, false, true, SingleSpc, 3, 8 },

{ ARM::VST3q16Pseudo_UPD, ARM::VST3q16_UPD, false, true, EvenDblSpc, 3, 4 },
{ ARM::VST3q16oddPseudo_UPD, ARM::VST3q16_UPD, false, true, OddDblSpc, 3, 4 },
{ ARM::VST3q32Pseudo_UPD, ARM::VST3q32_UPD, false, true, EvenDblSpc, 3, 2 },
{ ARM::VST3q32oddPseudo_UPD, ARM::VST3q32_UPD, false, true, OddDblSpc, 3, 2 },
{ ARM::VST3q8Pseudo_UPD, ARM::VST3q8_UPD, false, true, EvenDblSpc, 3, 8 },
{ ARM::VST3q8oddPseudo_UPD, ARM::VST3q8_UPD, false, true, OddDblSpc, 3, 8 },

{ ARM::VST4LNd16Pseudo, ARM::VST4LNd16, false, false, SingleSpc, 4, 4 },
{ ARM::VST4LNd16Pseudo_UPD, ARM::VST4LNd16_UPD, false, true, SingleSpc, 4, 4 },
{ ARM::VST4LNd32Pseudo, ARM::VST4LNd32, false, false, SingleSpc, 4, 2 },
{ ARM::VST4LNd32Pseudo_UPD, ARM::VST4LNd32_UPD, false, true, SingleSpc, 4, 2 },
{ ARM::VST4LNd8Pseudo, ARM::VST4LNd8, false, false, SingleSpc, 4, 8 },
{ ARM::VST4LNd8Pseudo_UPD, ARM::VST4LNd8_UPD, false, true, SingleSpc, 4, 8 },
{ ARM::VST4LNq16Pseudo, ARM::VST4LNq16, false, false, EvenDblSpc, 4, 4},
{ ARM::VST4LNq16Pseudo_UPD, ARM::VST4LNq16_UPD, false, true, EvenDblSpc, 4, 4},
{ ARM::VST4LNq32Pseudo, ARM::VST4LNq32, false, false, EvenDblSpc, 4, 2},
{ ARM::VST4LNq32Pseudo_UPD, ARM::VST4LNq32_UPD, false, true, EvenDblSpc, 4, 2},

{ ARM::VST4d16Pseudo, ARM::VST4d16, false, false, SingleSpc, 4, 4 },
{ ARM::VST4d16Pseudo_UPD, ARM::VST4d16_UPD, false, true, SingleSpc, 4, 4 },
{ ARM::VST4d32Pseudo, ARM::VST4d32, false, false, SingleSpc, 4, 2 },
{ ARM::VST4d32Pseudo_UPD, ARM::VST4d32_UPD, false, true, SingleSpc, 4, 2 },
{ ARM::VST4d8Pseudo, ARM::VST4d8, false, false, SingleSpc, 4, 8 },
{ ARM::VST4d8Pseudo_UPD, ARM::VST4d8_UPD, false, true, SingleSpc, 4, 8 },

{ ARM::VST4q16Pseudo_UPD, ARM::VST4q16_UPD, false, true, EvenDblSpc, 4, 4 },
{ ARM::VST4q16oddPseudo_UPD, ARM::VST4q16_UPD, false, true, OddDblSpc, 4, 4 },
{ ARM::VST4q32Pseudo_UPD, ARM::VST4q32_UPD, false, true, EvenDblSpc, 4, 2 },
{ ARM::VST4q32oddPseudo_UPD, ARM::VST4q32_UPD, false, true, OddDblSpc, 4, 2 },
{ ARM::VST4q8Pseudo_UPD, ARM::VST4q8_UPD, false, true, EvenDblSpc, 4, 8 },
{ ARM::VST4q8oddPseudo_UPD , ARM::VST4q8_UPD, false, true, OddDblSpc, 4, 8 }
};

/// LookupNEONLdSt - Search the NEONLdStTable for information about a NEON
/// load or store pseudo instruction.
338static const NEONLdStTableEntry *LookupNEONLdSt(unsigned Opcode) { 339 unsigned NumEntries = array_lengthof(NEONLdStTable); 340 341#ifndef NDEBUG 342 // Make sure the table is sorted. 343 static bool TableChecked = false; 344 if (!TableChecked) { 345 for (unsigned i = 0; i != NumEntries-1; ++i) 346 assert(NEONLdStTable[i] < NEONLdStTable[i+1] && 347 "NEONLdStTable is not sorted!"); 348 TableChecked = true; 349 } 350#endif 351 352 const NEONLdStTableEntry *I = 353 std::lower_bound(NEONLdStTable, NEONLdStTable + NumEntries, Opcode); 354 if (I != NEONLdStTable + NumEntries && I->PseudoOpc == Opcode) 355 return I; 356 return NULL; 357} 358 359/// GetDSubRegs - Get 4 D subregisters of a Q, QQ, or QQQQ register, 360/// corresponding to the specified register spacing. Not all of the results 361/// are necessarily valid, e.g., a Q register only has 2 D subregisters. 362static void GetDSubRegs(unsigned Reg, NEONRegSpacing RegSpc, 363 const TargetRegisterInfo *TRI, unsigned &D0, 364 unsigned &D1, unsigned &D2, unsigned &D3) { 365 if (RegSpc == SingleSpc) { 366 D0 = TRI->getSubReg(Reg, ARM::dsub_0); 367 D1 = TRI->getSubReg(Reg, ARM::dsub_1); 368 D2 = TRI->getSubReg(Reg, ARM::dsub_2); 369 D3 = TRI->getSubReg(Reg, ARM::dsub_3); 370 } else if (RegSpc == EvenDblSpc) { 371 D0 = TRI->getSubReg(Reg, ARM::dsub_0); 372 D1 = TRI->getSubReg(Reg, ARM::dsub_2); 373 D2 = TRI->getSubReg(Reg, ARM::dsub_4); 374 D3 = TRI->getSubReg(Reg, ARM::dsub_6); 375 } else { 376 assert(RegSpc == OddDblSpc && "unknown register spacing"); 377 D0 = TRI->getSubReg(Reg, ARM::dsub_1); 378 D1 = TRI->getSubReg(Reg, ARM::dsub_3); 379 D2 = TRI->getSubReg(Reg, ARM::dsub_5); 380 D3 = TRI->getSubReg(Reg, ARM::dsub_7); 381 } 382} 383 384/// ExpandVLD - Translate VLD pseudo instructions with Q, QQ or QQQQ register 385/// operands to real VLD instructions with D register operands. 
386void ARMExpandPseudo::ExpandVLD(MachineBasicBlock::iterator &MBBI) { 387 MachineInstr &MI = *MBBI; 388 MachineBasicBlock &MBB = *MI.getParent(); 389 390 const NEONLdStTableEntry *TableEntry = LookupNEONLdSt(MI.getOpcode()); 391 assert(TableEntry && TableEntry->IsLoad && "NEONLdStTable lookup failed"); 392 NEONRegSpacing RegSpc = TableEntry->RegSpacing; 393 unsigned NumRegs = TableEntry->NumRegs; 394 395 MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(), 396 TII->get(TableEntry->RealOpc)); 397 unsigned OpIdx = 0; 398 399 bool DstIsDead = MI.getOperand(OpIdx).isDead(); 400 unsigned DstReg = MI.getOperand(OpIdx++).getReg(); 401 unsigned D0, D1, D2, D3; 402 GetDSubRegs(DstReg, RegSpc, TRI, D0, D1, D2, D3); 403 MIB.addReg(D0, RegState::Define | getDeadRegState(DstIsDead)) 404 .addReg(D1, RegState::Define | getDeadRegState(DstIsDead)); 405 if (NumRegs > 2) 406 MIB.addReg(D2, RegState::Define | getDeadRegState(DstIsDead)); 407 if (NumRegs > 3) 408 MIB.addReg(D3, RegState::Define | getDeadRegState(DstIsDead)); 409 410 if (TableEntry->HasWriteBack) 411 MIB.addOperand(MI.getOperand(OpIdx++)); 412 413 // Copy the addrmode6 operands. 414 MIB.addOperand(MI.getOperand(OpIdx++)); 415 MIB.addOperand(MI.getOperand(OpIdx++)); 416 // Copy the am6offset operand. 417 if (TableEntry->HasWriteBack) 418 MIB.addOperand(MI.getOperand(OpIdx++)); 419 420 // For an instruction writing double-spaced subregs, the pseudo instruction 421 // has an extra operand that is a use of the super-register. Record the 422 // operand index and skip over it. 423 unsigned SrcOpIdx = 0; 424 if (RegSpc == EvenDblSpc || RegSpc == OddDblSpc) 425 SrcOpIdx = OpIdx++; 426 427 // Copy the predicate operands. 428 MIB.addOperand(MI.getOperand(OpIdx++)); 429 MIB.addOperand(MI.getOperand(OpIdx++)); 430 431 // Copy the super-register source operand used for double-spaced subregs over 432 // to the new instruction as an implicit operand. 
433 if (SrcOpIdx != 0) { 434 MachineOperand MO = MI.getOperand(SrcOpIdx); 435 MO.setImplicit(true); 436 MIB.addOperand(MO); 437 } 438 // Add an implicit def for the super-register. 439 MIB.addReg(DstReg, RegState::ImplicitDefine | getDeadRegState(DstIsDead)); 440 TransferImpOps(MI, MIB, MIB); 441 MI.eraseFromParent(); 442} 443 444/// ExpandVST - Translate VST pseudo instructions with Q, QQ or QQQQ register 445/// operands to real VST instructions with D register operands. 446void ARMExpandPseudo::ExpandVST(MachineBasicBlock::iterator &MBBI) { 447 MachineInstr &MI = *MBBI; 448 MachineBasicBlock &MBB = *MI.getParent(); 449 450 const NEONLdStTableEntry *TableEntry = LookupNEONLdSt(MI.getOpcode()); 451 assert(TableEntry && !TableEntry->IsLoad && "NEONLdStTable lookup failed"); 452 NEONRegSpacing RegSpc = TableEntry->RegSpacing; 453 unsigned NumRegs = TableEntry->NumRegs; 454 455 MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(), 456 TII->get(TableEntry->RealOpc)); 457 unsigned OpIdx = 0; 458 if (TableEntry->HasWriteBack) 459 MIB.addOperand(MI.getOperand(OpIdx++)); 460 461 // Copy the addrmode6 operands. 462 MIB.addOperand(MI.getOperand(OpIdx++)); 463 MIB.addOperand(MI.getOperand(OpIdx++)); 464 // Copy the am6offset operand. 465 if (TableEntry->HasWriteBack) 466 MIB.addOperand(MI.getOperand(OpIdx++)); 467 468 bool SrcIsKill = MI.getOperand(OpIdx).isKill(); 469 unsigned SrcReg = MI.getOperand(OpIdx++).getReg(); 470 unsigned D0, D1, D2, D3; 471 GetDSubRegs(SrcReg, RegSpc, TRI, D0, D1, D2, D3); 472 MIB.addReg(D0).addReg(D1); 473 if (NumRegs > 2) 474 MIB.addReg(D2); 475 if (NumRegs > 3) 476 MIB.addReg(D3); 477 478 // Copy the predicate operands. 479 MIB.addOperand(MI.getOperand(OpIdx++)); 480 MIB.addOperand(MI.getOperand(OpIdx++)); 481 482 if (SrcIsKill) 483 // Add an implicit kill for the super-reg. 
484 (*MIB).addRegisterKilled(SrcReg, TRI, true); 485 TransferImpOps(MI, MIB, MIB); 486 MI.eraseFromParent(); 487} 488 489/// ExpandLaneOp - Translate VLD*LN and VST*LN instructions with Q, QQ or QQQQ 490/// register operands to real instructions with D register operands. 491void ARMExpandPseudo::ExpandLaneOp(MachineBasicBlock::iterator &MBBI) { 492 MachineInstr &MI = *MBBI; 493 MachineBasicBlock &MBB = *MI.getParent(); 494 495 const NEONLdStTableEntry *TableEntry = LookupNEONLdSt(MI.getOpcode()); 496 assert(TableEntry && "NEONLdStTable lookup failed"); 497 NEONRegSpacing RegSpc = TableEntry->RegSpacing; 498 unsigned NumRegs = TableEntry->NumRegs; 499 unsigned RegElts = TableEntry->RegElts; 500 501 MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(), 502 TII->get(TableEntry->RealOpc)); 503 unsigned OpIdx = 0; 504 // The lane operand is always the 3rd from last operand, before the 2 505 // predicate operands. 506 unsigned Lane = MI.getOperand(MI.getDesc().getNumOperands() - 3).getImm(); 507 508 // Adjust the lane and spacing as needed for Q registers. 
509 assert(RegSpc != OddDblSpc && "unexpected register spacing for VLD/VST-lane"); 510 if (RegSpc == EvenDblSpc && Lane >= RegElts) { 511 RegSpc = OddDblSpc; 512 Lane -= RegElts; 513 } 514 assert(Lane < RegElts && "out of range lane for VLD/VST-lane"); 515 516 unsigned D0, D1, D2, D3; 517 unsigned DstReg = 0; 518 bool DstIsDead = false; 519 if (TableEntry->IsLoad) { 520 DstIsDead = MI.getOperand(OpIdx).isDead(); 521 DstReg = MI.getOperand(OpIdx++).getReg(); 522 GetDSubRegs(DstReg, RegSpc, TRI, D0, D1, D2, D3); 523 MIB.addReg(D0, RegState::Define | getDeadRegState(DstIsDead)); 524 if (NumRegs > 1) 525 MIB.addReg(D1, RegState::Define | getDeadRegState(DstIsDead)); 526 if (NumRegs > 2) 527 MIB.addReg(D2, RegState::Define | getDeadRegState(DstIsDead)); 528 if (NumRegs > 3) 529 MIB.addReg(D3, RegState::Define | getDeadRegState(DstIsDead)); 530 } 531 532 if (TableEntry->HasWriteBack) 533 MIB.addOperand(MI.getOperand(OpIdx++)); 534 535 // Copy the addrmode6 operands. 536 MIB.addOperand(MI.getOperand(OpIdx++)); 537 MIB.addOperand(MI.getOperand(OpIdx++)); 538 // Copy the am6offset operand. 539 if (TableEntry->HasWriteBack) 540 MIB.addOperand(MI.getOperand(OpIdx++)); 541 542 // Grab the super-register source. 543 MachineOperand MO = MI.getOperand(OpIdx++); 544 if (!TableEntry->IsLoad) 545 GetDSubRegs(MO.getReg(), RegSpc, TRI, D0, D1, D2, D3); 546 547 // Add the subregs as sources of the new instruction. 548 unsigned SrcFlags = (getUndefRegState(MO.isUndef()) | 549 getKillRegState(MO.isKill())); 550 MIB.addReg(D0, SrcFlags); 551 if (NumRegs > 1) 552 MIB.addReg(D1, SrcFlags); 553 if (NumRegs > 2) 554 MIB.addReg(D2, SrcFlags); 555 if (NumRegs > 3) 556 MIB.addReg(D3, SrcFlags); 557 558 // Add the lane number operand. 559 MIB.addImm(Lane); 560 OpIdx += 1; 561 562 // Copy the predicate operands. 563 MIB.addOperand(MI.getOperand(OpIdx++)); 564 MIB.addOperand(MI.getOperand(OpIdx++)); 565 566 // Copy the super-register source to be an implicit source. 
567 MO.setImplicit(true); 568 MIB.addOperand(MO); 569 if (TableEntry->IsLoad) 570 // Add an implicit def for the super-register. 571 MIB.addReg(DstReg, RegState::ImplicitDefine | getDeadRegState(DstIsDead)); 572 TransferImpOps(MI, MIB, MIB); 573 MI.eraseFromParent(); 574} 575 576/// ExpandVTBL - Translate VTBL and VTBX pseudo instructions with Q or QQ 577/// register operands to real instructions with D register operands. 578void ARMExpandPseudo::ExpandVTBL(MachineBasicBlock::iterator &MBBI, 579 unsigned Opc, bool IsExt, unsigned NumRegs) { 580 MachineInstr &MI = *MBBI; 581 MachineBasicBlock &MBB = *MI.getParent(); 582 583 MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(Opc)); 584 unsigned OpIdx = 0; 585 586 // Transfer the destination register operand. 587 MIB.addOperand(MI.getOperand(OpIdx++)); 588 if (IsExt) 589 MIB.addOperand(MI.getOperand(OpIdx++)); 590 591 bool SrcIsKill = MI.getOperand(OpIdx).isKill(); 592 unsigned SrcReg = MI.getOperand(OpIdx++).getReg(); 593 unsigned D0, D1, D2, D3; 594 GetDSubRegs(SrcReg, SingleSpc, TRI, D0, D1, D2, D3); 595 MIB.addReg(D0).addReg(D1); 596 if (NumRegs > 2) 597 MIB.addReg(D2); 598 if (NumRegs > 3) 599 MIB.addReg(D3); 600 601 // Copy the other source register operand. 602 MIB.addOperand(MI.getOperand(OpIdx++)); 603 604 // Copy the predicate operands. 605 MIB.addOperand(MI.getOperand(OpIdx++)); 606 MIB.addOperand(MI.getOperand(OpIdx++)); 607 608 if (SrcIsKill) 609 // Add an implicit kill for the super-reg. 
610 (*MIB).addRegisterKilled(SrcReg, TRI, true); 611 TransferImpOps(MI, MIB, MIB); 612 MI.eraseFromParent(); 613} 614 615bool ARMExpandPseudo::ExpandMBB(MachineBasicBlock &MBB) { 616 bool Modified = false; 617 618 MachineBasicBlock::iterator MBBI = MBB.begin(), E = MBB.end(); 619 while (MBBI != E) { 620 MachineInstr &MI = *MBBI; 621 MachineBasicBlock::iterator NMBBI = llvm::next(MBBI); 622 623 bool ModifiedOp = true; 624 unsigned Opcode = MI.getOpcode(); 625 switch (Opcode) { 626 default: 627 ModifiedOp = false; 628 break; 629 630 case ARM::Int_eh_sjlj_dispatchsetup: { 631 MachineFunction &MF = *MI.getParent()->getParent(); 632 const ARMBaseInstrInfo *AII = 633 static_cast<const ARMBaseInstrInfo*>(TII); 634 const ARMBaseRegisterInfo &RI = AII->getRegisterInfo(); 635 // For functions using a base pointer, we rematerialize it (via the frame 636 // pointer) here since eh.sjlj.setjmp and eh.sjlj.longjmp don't do it 637 // for us. Otherwise, expand to nothing. 638 if (RI.hasBasePointer(MF)) { 639 ARMFunctionInfo *AFI = MF.getInfo<ARMFunctionInfo>(); 640 int32_t NumBytes = AFI->getFramePtrSpillOffset(); 641 unsigned FramePtr = RI.getFrameRegister(MF); 642 assert(MF.getTarget().getFrameInfo()->hasFP(MF) && 643 "base pointer without frame pointer?"); 644 645 if (AFI->isThumb2Function()) { 646 llvm::emitT2RegPlusImmediate(MBB, MBBI, MI.getDebugLoc(), ARM::R6, 647 FramePtr, -NumBytes, ARMCC::AL, 0, *TII); 648 } else if (AFI->isThumbFunction()) { 649 llvm::emitThumbRegPlusImmediate(MBB, MBBI, ARM::R6, 650 FramePtr, -NumBytes, 651 *TII, RI, MI.getDebugLoc()); 652 } else { 653 llvm::emitARMRegPlusImmediate(MBB, MBBI, MI.getDebugLoc(), ARM::R6, 654 FramePtr, -NumBytes, ARMCC::AL, 0, 655 *TII); 656 } 657 // If there's dynamic realignment, adjust for it. 
658 if (RI.needsStackRealignment(MF)) { 659 MachineFrameInfo *MFI = MF.getFrameInfo(); 660 unsigned MaxAlign = MFI->getMaxAlignment(); 661 assert (!AFI->isThumb1OnlyFunction()); 662 // Emit bic r6, r6, MaxAlign 663 unsigned bicOpc = AFI->isThumbFunction() ? 664 ARM::t2BICri : ARM::BICri; 665 AddDefaultCC(AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(), 666 TII->get(bicOpc), ARM::R6) 667 .addReg(ARM::R6, RegState::Kill) 668 .addImm(MaxAlign-1))); 669 } 670 671 } 672 MI.eraseFromParent(); 673 break; 674 } 675 676 case ARM::MOVsrl_flag: 677 case ARM::MOVsra_flag: { 678 // These are just fancy MOVs insructions. 679 AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVs), 680 MI.getOperand(0).getReg()) 681 .addOperand(MI.getOperand(1)) 682 .addReg(0) 683 .addImm(ARM_AM::getSORegOpc((Opcode == ARM::MOVsrl_flag ? ARM_AM::lsr 684 : ARM_AM::asr), 1))) 685 .addReg(ARM::CPSR, RegState::Define); 686 MI.eraseFromParent(); 687 break; 688 } 689 case ARM::RRX: { 690 // This encodes as "MOVs Rd, Rm, rrx 691 MachineInstrBuilder MIB = 692 AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVs), 693 MI.getOperand(0).getReg()) 694 .addOperand(MI.getOperand(1)) 695 .addOperand(MI.getOperand(1)) 696 .addImm(ARM_AM::getSORegOpc(ARM_AM::rrx, 0))) 697 .addReg(0); 698 TransferImpOps(MI, MIB, MIB); 699 MI.eraseFromParent(); 700 break; 701 } 702 case ARM::tLDRpci_pic: 703 case ARM::t2LDRpci_pic: { 704 unsigned NewLdOpc = (Opcode == ARM::tLDRpci_pic) 705 ? 
ARM::tLDRpci : ARM::t2LDRpci; 706 unsigned DstReg = MI.getOperand(0).getReg(); 707 bool DstIsDead = MI.getOperand(0).isDead(); 708 MachineInstrBuilder MIB1 = 709 AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(), 710 TII->get(NewLdOpc), DstReg) 711 .addOperand(MI.getOperand(1))); 712 (*MIB1).setMemRefs(MI.memoperands_begin(), MI.memoperands_end()); 713 MachineInstrBuilder MIB2 = BuildMI(MBB, MBBI, MI.getDebugLoc(), 714 TII->get(ARM::tPICADD)) 715 .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead)) 716 .addReg(DstReg) 717 .addOperand(MI.getOperand(2)); 718 TransferImpOps(MI, MIB1, MIB2); 719 MI.eraseFromParent(); 720 break; 721 } 722 723 case ARM::MOVi32imm: 724 case ARM::MOVCCi32imm: 725 case ARM::t2MOVi32imm: 726 case ARM::t2MOVCCi32imm: { 727 unsigned PredReg = 0; 728 ARMCC::CondCodes Pred = llvm::getInstrPredicate(&MI, PredReg); 729 unsigned DstReg = MI.getOperand(0).getReg(); 730 bool DstIsDead = MI.getOperand(0).isDead(); 731 bool isCC = Opcode == ARM::MOVCCi32imm || Opcode == ARM::t2MOVCCi32imm; 732 const MachineOperand &MO = MI.getOperand(isCC ? 2 : 1); 733 MachineInstrBuilder LO16, HI16; 734 735 if (!STI->hasV6T2Ops() && 736 (Opcode == ARM::MOVi32imm || Opcode == ARM::MOVCCi32imm)) { 737 // Expand into a movi + orr. 
738 LO16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVi), DstReg); 739 HI16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::ORRri)) 740 .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead)) 741 .addReg(DstReg); 742 743 assert (MO.isImm() && "MOVi32imm w/ non-immediate source operand!"); 744 unsigned ImmVal = (unsigned)MO.getImm(); 745 unsigned SOImmValV1 = ARM_AM::getSOImmTwoPartFirst(ImmVal); 746 unsigned SOImmValV2 = ARM_AM::getSOImmTwoPartSecond(ImmVal); 747 LO16 = LO16.addImm(SOImmValV1); 748 HI16 = HI16.addImm(SOImmValV2); 749 (*LO16).setMemRefs(MI.memoperands_begin(), MI.memoperands_end()); 750 (*HI16).setMemRefs(MI.memoperands_begin(), MI.memoperands_end()); 751 LO16.addImm(Pred).addReg(PredReg).addReg(0); 752 HI16.addImm(Pred).addReg(PredReg).addReg(0); 753 TransferImpOps(MI, LO16, HI16); 754 MI.eraseFromParent(); 755 break; 756 } 757 758 bool isThumb = 759 (Opcode == ARM::t2MOVi32imm || Opcode == ARM::t2MOVCCi32imm); 760 761 LO16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), 762 TII->get(isThumb ? ARM::t2MOVi16 : ARM::MOVi16), 763 DstReg); 764 HI16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), 765 TII->get(isThumb ? 
ARM::t2MOVTi16 : ARM::MOVTi16)) 766 .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead)) 767 .addReg(DstReg); 768 769 if (MO.isImm()) { 770 unsigned Imm = MO.getImm(); 771 unsigned Lo16 = Imm & 0xffff; 772 unsigned Hi16 = (Imm >> 16) & 0xffff; 773 LO16 = LO16.addImm(Lo16); 774 HI16 = HI16.addImm(Hi16); 775 } else { 776 const GlobalValue *GV = MO.getGlobal(); 777 unsigned TF = MO.getTargetFlags(); 778 LO16 = LO16.addGlobalAddress(GV, MO.getOffset(), TF | ARMII::MO_LO16); 779 HI16 = HI16.addGlobalAddress(GV, MO.getOffset(), TF | ARMII::MO_HI16); 780 } 781 (*LO16).setMemRefs(MI.memoperands_begin(), MI.memoperands_end()); 782 (*HI16).setMemRefs(MI.memoperands_begin(), MI.memoperands_end()); 783 LO16.addImm(Pred).addReg(PredReg); 784 HI16.addImm(Pred).addReg(PredReg); 785 TransferImpOps(MI, LO16, HI16); 786 MI.eraseFromParent(); 787 break; 788 } 789 790 case ARM::VMOVQQ: { 791 unsigned DstReg = MI.getOperand(0).getReg(); 792 bool DstIsDead = MI.getOperand(0).isDead(); 793 unsigned EvenDst = TRI->getSubReg(DstReg, ARM::qsub_0); 794 unsigned OddDst = TRI->getSubReg(DstReg, ARM::qsub_1); 795 unsigned SrcReg = MI.getOperand(1).getReg(); 796 bool SrcIsKill = MI.getOperand(1).isKill(); 797 unsigned EvenSrc = TRI->getSubReg(SrcReg, ARM::qsub_0); 798 unsigned OddSrc = TRI->getSubReg(SrcReg, ARM::qsub_1); 799 MachineInstrBuilder Even = 800 AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(), 801 TII->get(ARM::VMOVQ)) 802 .addReg(EvenDst, 803 RegState::Define | getDeadRegState(DstIsDead)) 804 .addReg(EvenSrc, getKillRegState(SrcIsKill))); 805 MachineInstrBuilder Odd = 806 AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(), 807 TII->get(ARM::VMOVQ)) 808 .addReg(OddDst, 809 RegState::Define | getDeadRegState(DstIsDead)) 810 .addReg(OddSrc, getKillRegState(SrcIsKill))); 811 TransferImpOps(MI, Even, Odd); 812 MI.eraseFromParent(); 813 break; 814 } 815 816 case ARM::VLDMQIA: 817 case ARM::VLDMQDB: { 818 unsigned NewOpc = (Opcode == ARM::VLDMQIA) ? 
ARM::VLDMDIA : ARM::VLDMDDB; 819 MachineInstrBuilder MIB = 820 BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(NewOpc)); 821 unsigned OpIdx = 0; 822 823 // Grab the Q register destination. 824 bool DstIsDead = MI.getOperand(OpIdx).isDead(); 825 unsigned DstReg = MI.getOperand(OpIdx++).getReg(); 826 827 // Copy the source register. 828 MIB.addOperand(MI.getOperand(OpIdx++)); 829 830 // Copy the predicate operands. 831 MIB.addOperand(MI.getOperand(OpIdx++)); 832 MIB.addOperand(MI.getOperand(OpIdx++)); 833 834 // Add the destination operands (D subregs). 835 unsigned D0 = TRI->getSubReg(DstReg, ARM::dsub_0); 836 unsigned D1 = TRI->getSubReg(DstReg, ARM::dsub_1); 837 MIB.addReg(D0, RegState::Define | getDeadRegState(DstIsDead)) 838 .addReg(D1, RegState::Define | getDeadRegState(DstIsDead)); 839 840 // Add an implicit def for the super-register. 841 MIB.addReg(DstReg, RegState::ImplicitDefine | getDeadRegState(DstIsDead)); 842 TransferImpOps(MI, MIB, MIB); 843 MI.eraseFromParent(); 844 break; 845 } 846 847 case ARM::VSTMQIA: 848 case ARM::VSTMQDB: { 849 unsigned NewOpc = (Opcode == ARM::VSTMQIA) ? ARM::VSTMDIA : ARM::VSTMDDB; 850 MachineInstrBuilder MIB = 851 BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(NewOpc)); 852 unsigned OpIdx = 0; 853 854 // Grab the Q register source. 855 bool SrcIsKill = MI.getOperand(OpIdx).isKill(); 856 unsigned SrcReg = MI.getOperand(OpIdx++).getReg(); 857 858 // Copy the destination register. 859 MIB.addOperand(MI.getOperand(OpIdx++)); 860 861 // Copy the predicate operands. 862 MIB.addOperand(MI.getOperand(OpIdx++)); 863 MIB.addOperand(MI.getOperand(OpIdx++)); 864 865 // Add the source operands (D subregs). 866 unsigned D0 = TRI->getSubReg(SrcReg, ARM::dsub_0); 867 unsigned D1 = TRI->getSubReg(SrcReg, ARM::dsub_1); 868 MIB.addReg(D0).addReg(D1); 869 870 if (SrcIsKill) 871 // Add an implicit kill for the Q register. 
872 (*MIB).addRegisterKilled(SrcReg, TRI, true); 873 874 TransferImpOps(MI, MIB, MIB); 875 MI.eraseFromParent(); 876 break; 877 } 878 case ARM::VDUPfqf: 879 case ARM::VDUPfdf:{ 880 unsigned NewOpc = Opcode == ARM::VDUPfqf ? ARM::VDUPLNfq : ARM::VDUPLNfd; 881 MachineInstrBuilder MIB = 882 BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(NewOpc)); 883 unsigned OpIdx = 0; 884 unsigned SrcReg = MI.getOperand(1).getReg(); 885 unsigned Lane = getARMRegisterNumbering(SrcReg) & 1; 886 unsigned DReg = TRI->getMatchingSuperReg(SrcReg, 887 Lane & 1 ? ARM::ssub_1 : ARM::ssub_0, &ARM::DPR_VFP2RegClass); 888 // The lane is [0,1] for the containing DReg superregister. 889 // Copy the dst/src register operands. 890 MIB.addOperand(MI.getOperand(OpIdx++)); 891 MIB.addReg(DReg); 892 ++OpIdx; 893 // Add the lane select operand. 894 MIB.addImm(Lane); 895 // Add the predicate operands. 896 MIB.addOperand(MI.getOperand(OpIdx++)); 897 MIB.addOperand(MI.getOperand(OpIdx++)); 898 899 TransferImpOps(MI, MIB, MIB); 900 MI.eraseFromParent(); 901 break; 902 } 903 904 case ARM::VLD1q8Pseudo: 905 case ARM::VLD1q16Pseudo: 906 case ARM::VLD1q32Pseudo: 907 case ARM::VLD1q64Pseudo: 908 case ARM::VLD1q8Pseudo_UPD: 909 case ARM::VLD1q16Pseudo_UPD: 910 case ARM::VLD1q32Pseudo_UPD: 911 case ARM::VLD1q64Pseudo_UPD: 912 case ARM::VLD2d8Pseudo: 913 case ARM::VLD2d16Pseudo: 914 case ARM::VLD2d32Pseudo: 915 case ARM::VLD2q8Pseudo: 916 case ARM::VLD2q16Pseudo: 917 case ARM::VLD2q32Pseudo: 918 case ARM::VLD2d8Pseudo_UPD: 919 case ARM::VLD2d16Pseudo_UPD: 920 case ARM::VLD2d32Pseudo_UPD: 921 case ARM::VLD2q8Pseudo_UPD: 922 case ARM::VLD2q16Pseudo_UPD: 923 case ARM::VLD2q32Pseudo_UPD: 924 case ARM::VLD3d8Pseudo: 925 case ARM::VLD3d16Pseudo: 926 case ARM::VLD3d32Pseudo: 927 case ARM::VLD1d64TPseudo: 928 case ARM::VLD3d8Pseudo_UPD: 929 case ARM::VLD3d16Pseudo_UPD: 930 case ARM::VLD3d32Pseudo_UPD: 931 case ARM::VLD1d64TPseudo_UPD: 932 case ARM::VLD3q8Pseudo_UPD: 933 case ARM::VLD3q16Pseudo_UPD: 934 case 
ARM::VLD3q32Pseudo_UPD: 935 case ARM::VLD3q8oddPseudo_UPD: 936 case ARM::VLD3q16oddPseudo_UPD: 937 case ARM::VLD3q32oddPseudo_UPD: 938 case ARM::VLD4d8Pseudo: 939 case ARM::VLD4d16Pseudo: 940 case ARM::VLD4d32Pseudo: 941 case ARM::VLD1d64QPseudo: 942 case ARM::VLD4d8Pseudo_UPD: 943 case ARM::VLD4d16Pseudo_UPD: 944 case ARM::VLD4d32Pseudo_UPD: 945 case ARM::VLD1d64QPseudo_UPD: 946 case ARM::VLD4q8Pseudo_UPD: 947 case ARM::VLD4q16Pseudo_UPD: 948 case ARM::VLD4q32Pseudo_UPD: 949 case ARM::VLD4q8oddPseudo_UPD: 950 case ARM::VLD4q16oddPseudo_UPD: 951 case ARM::VLD4q32oddPseudo_UPD: 952 case ARM::VLD1DUPq8Pseudo: 953 case ARM::VLD1DUPq16Pseudo: 954 case ARM::VLD1DUPq32Pseudo: 955 case ARM::VLD1DUPq8Pseudo_UPD: 956 case ARM::VLD1DUPq16Pseudo_UPD: 957 case ARM::VLD1DUPq32Pseudo_UPD: 958 case ARM::VLD2DUPd8Pseudo: 959 case ARM::VLD2DUPd16Pseudo: 960 case ARM::VLD2DUPd32Pseudo: 961 case ARM::VLD2DUPd8Pseudo_UPD: 962 case ARM::VLD2DUPd16Pseudo_UPD: 963 case ARM::VLD2DUPd32Pseudo_UPD: 964 case ARM::VLD3DUPd8Pseudo: 965 case ARM::VLD3DUPd16Pseudo: 966 case ARM::VLD3DUPd32Pseudo: 967 case ARM::VLD3DUPd8Pseudo_UPD: 968 case ARM::VLD3DUPd16Pseudo_UPD: 969 case ARM::VLD3DUPd32Pseudo_UPD: 970 case ARM::VLD4DUPd8Pseudo: 971 case ARM::VLD4DUPd16Pseudo: 972 case ARM::VLD4DUPd32Pseudo: 973 case ARM::VLD4DUPd8Pseudo_UPD: 974 case ARM::VLD4DUPd16Pseudo_UPD: 975 case ARM::VLD4DUPd32Pseudo_UPD: 976 ExpandVLD(MBBI); 977 break; 978 979 case ARM::VST1q8Pseudo: 980 case ARM::VST1q16Pseudo: 981 case ARM::VST1q32Pseudo: 982 case ARM::VST1q64Pseudo: 983 case ARM::VST1q8Pseudo_UPD: 984 case ARM::VST1q16Pseudo_UPD: 985 case ARM::VST1q32Pseudo_UPD: 986 case ARM::VST1q64Pseudo_UPD: 987 case ARM::VST2d8Pseudo: 988 case ARM::VST2d16Pseudo: 989 case ARM::VST2d32Pseudo: 990 case ARM::VST2q8Pseudo: 991 case ARM::VST2q16Pseudo: 992 case ARM::VST2q32Pseudo: 993 case ARM::VST2d8Pseudo_UPD: 994 case ARM::VST2d16Pseudo_UPD: 995 case ARM::VST2d32Pseudo_UPD: 996 case ARM::VST2q8Pseudo_UPD: 997 case 
ARM::VST2q16Pseudo_UPD: 998 case ARM::VST2q32Pseudo_UPD: 999 case ARM::VST3d8Pseudo: 1000 case ARM::VST3d16Pseudo: 1001 case ARM::VST3d32Pseudo: 1002 case ARM::VST1d64TPseudo: 1003 case ARM::VST3d8Pseudo_UPD: 1004 case ARM::VST3d16Pseudo_UPD: 1005 case ARM::VST3d32Pseudo_UPD: 1006 case ARM::VST1d64TPseudo_UPD: 1007 case ARM::VST3q8Pseudo_UPD: 1008 case ARM::VST3q16Pseudo_UPD: 1009 case ARM::VST3q32Pseudo_UPD: 1010 case ARM::VST3q8oddPseudo_UPD: 1011 case ARM::VST3q16oddPseudo_UPD: 1012 case ARM::VST3q32oddPseudo_UPD: 1013 case ARM::VST4d8Pseudo: 1014 case ARM::VST4d16Pseudo: 1015 case ARM::VST4d32Pseudo: 1016 case ARM::VST1d64QPseudo: 1017 case ARM::VST4d8Pseudo_UPD: 1018 case ARM::VST4d16Pseudo_UPD: 1019 case ARM::VST4d32Pseudo_UPD: 1020 case ARM::VST1d64QPseudo_UPD: 1021 case ARM::VST4q8Pseudo_UPD: 1022 case ARM::VST4q16Pseudo_UPD: 1023 case ARM::VST4q32Pseudo_UPD: 1024 case ARM::VST4q8oddPseudo_UPD: 1025 case ARM::VST4q16oddPseudo_UPD: 1026 case ARM::VST4q32oddPseudo_UPD: 1027 ExpandVST(MBBI); 1028 break; 1029 1030 case ARM::VLD1LNq8Pseudo: 1031 case ARM::VLD1LNq16Pseudo: 1032 case ARM::VLD1LNq32Pseudo: 1033 case ARM::VLD1LNq8Pseudo_UPD: 1034 case ARM::VLD1LNq16Pseudo_UPD: 1035 case ARM::VLD1LNq32Pseudo_UPD: 1036 case ARM::VLD2LNd8Pseudo: 1037 case ARM::VLD2LNd16Pseudo: 1038 case ARM::VLD2LNd32Pseudo: 1039 case ARM::VLD2LNq16Pseudo: 1040 case ARM::VLD2LNq32Pseudo: 1041 case ARM::VLD2LNd8Pseudo_UPD: 1042 case ARM::VLD2LNd16Pseudo_UPD: 1043 case ARM::VLD2LNd32Pseudo_UPD: 1044 case ARM::VLD2LNq16Pseudo_UPD: 1045 case ARM::VLD2LNq32Pseudo_UPD: 1046 case ARM::VLD3LNd8Pseudo: 1047 case ARM::VLD3LNd16Pseudo: 1048 case ARM::VLD3LNd32Pseudo: 1049 case ARM::VLD3LNq16Pseudo: 1050 case ARM::VLD3LNq32Pseudo: 1051 case ARM::VLD3LNd8Pseudo_UPD: 1052 case ARM::VLD3LNd16Pseudo_UPD: 1053 case ARM::VLD3LNd32Pseudo_UPD: 1054 case ARM::VLD3LNq16Pseudo_UPD: 1055 case ARM::VLD3LNq32Pseudo_UPD: 1056 case ARM::VLD4LNd8Pseudo: 1057 case ARM::VLD4LNd16Pseudo: 1058 case 
ARM::VLD4LNd32Pseudo: 1059 case ARM::VLD4LNq16Pseudo: 1060 case ARM::VLD4LNq32Pseudo: 1061 case ARM::VLD4LNd8Pseudo_UPD: 1062 case ARM::VLD4LNd16Pseudo_UPD: 1063 case ARM::VLD4LNd32Pseudo_UPD: 1064 case ARM::VLD4LNq16Pseudo_UPD: 1065 case ARM::VLD4LNq32Pseudo_UPD: 1066 case ARM::VST1LNq8Pseudo: 1067 case ARM::VST1LNq16Pseudo: 1068 case ARM::VST1LNq32Pseudo: 1069 case ARM::VST1LNq8Pseudo_UPD: 1070 case ARM::VST1LNq16Pseudo_UPD: 1071 case ARM::VST1LNq32Pseudo_UPD: 1072 case ARM::VST2LNd8Pseudo: 1073 case ARM::VST2LNd16Pseudo: 1074 case ARM::VST2LNd32Pseudo: 1075 case ARM::VST2LNq16Pseudo: 1076 case ARM::VST2LNq32Pseudo: 1077 case ARM::VST2LNd8Pseudo_UPD: 1078 case ARM::VST2LNd16Pseudo_UPD: 1079 case ARM::VST2LNd32Pseudo_UPD: 1080 case ARM::VST2LNq16Pseudo_UPD: 1081 case ARM::VST2LNq32Pseudo_UPD: 1082 case ARM::VST3LNd8Pseudo: 1083 case ARM::VST3LNd16Pseudo: 1084 case ARM::VST3LNd32Pseudo: 1085 case ARM::VST3LNq16Pseudo: 1086 case ARM::VST3LNq32Pseudo: 1087 case ARM::VST3LNd8Pseudo_UPD: 1088 case ARM::VST3LNd16Pseudo_UPD: 1089 case ARM::VST3LNd32Pseudo_UPD: 1090 case ARM::VST3LNq16Pseudo_UPD: 1091 case ARM::VST3LNq32Pseudo_UPD: 1092 case ARM::VST4LNd8Pseudo: 1093 case ARM::VST4LNd16Pseudo: 1094 case ARM::VST4LNd32Pseudo: 1095 case ARM::VST4LNq16Pseudo: 1096 case ARM::VST4LNq32Pseudo: 1097 case ARM::VST4LNd8Pseudo_UPD: 1098 case ARM::VST4LNd16Pseudo_UPD: 1099 case ARM::VST4LNd32Pseudo_UPD: 1100 case ARM::VST4LNq16Pseudo_UPD: 1101 case ARM::VST4LNq32Pseudo_UPD: 1102 ExpandLaneOp(MBBI); 1103 break; 1104 1105 case ARM::VTBL2Pseudo: 1106 ExpandVTBL(MBBI, ARM::VTBL2, false, 2); break; 1107 case ARM::VTBL3Pseudo: 1108 ExpandVTBL(MBBI, ARM::VTBL3, false, 3); break; 1109 case ARM::VTBL4Pseudo: 1110 ExpandVTBL(MBBI, ARM::VTBL4, false, 4); break; 1111 case ARM::VTBX2Pseudo: 1112 ExpandVTBL(MBBI, ARM::VTBX2, true, 2); break; 1113 case ARM::VTBX3Pseudo: 1114 ExpandVTBL(MBBI, ARM::VTBX3, true, 3); break; 1115 case ARM::VTBX4Pseudo: 1116 ExpandVTBL(MBBI, ARM::VTBX4, true, 4); break; 
1117 } 1118 1119 if (ModifiedOp) 1120 Modified = true; 1121 MBBI = NMBBI; 1122 } 1123 1124 return Modified; 1125} 1126 1127bool ARMExpandPseudo::runOnMachineFunction(MachineFunction &MF) { 1128 TII = static_cast<const ARMBaseInstrInfo*>(MF.getTarget().getInstrInfo()); 1129 TRI = MF.getTarget().getRegisterInfo(); 1130 STI = &MF.getTarget().getSubtarget<ARMSubtarget>(); 1131 1132 bool Modified = false; 1133 for (MachineFunction::iterator MFI = MF.begin(), E = MF.end(); MFI != E; 1134 ++MFI) 1135 Modified |= ExpandMBB(*MFI); 1136 return Modified; 1137} 1138 1139/// createARMExpandPseudoPass - returns an instance of the pseudo instruction 1140/// expansion pass. 1141FunctionPass *llvm::createARMExpandPseudoPass() { 1142 return new ARMExpandPseudo(); 1143} 1144