AMDGPUISelLowering.cpp revision da25cd3e6de8f21005590c2de49868f883cf2410
1f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===-- AMDGPUISelLowering.cpp - AMDGPU Common DAG lowering functions -----===//
2f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
3f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//                     The LLVM Compiler Infrastructure
4f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
5f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard// This file is distributed under the University of Illinois Open Source
6f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard// License. See LICENSE.TXT for details.
7f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
8f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===----------------------------------------------------------------------===//
9f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
10f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard/// \file
11f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard/// \brief This is the parent TargetLowering class for hardware code gen
12f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard/// targets.
13f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
14f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===----------------------------------------------------------------------===//
15f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
16f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "AMDGPUISelLowering.h"
17e7397ee81ad07cab36362bab5a086f20acc60a80Tom Stellard#include "AMDGPU.h"
1890c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig#include "AMDGPURegisterInfo.h"
1990c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig#include "AMDGPUSubtarget.h"
205c35290fa35ae234fed02496404cb0fc37e1c8a5Benjamin Kramer#include "AMDILIntrinsicInfo.h"
21f502c292f6edd6b0562a93cc67cd241f52a57d54Tom Stellard#include "R600MachineFunctionInfo.h"
22e7397ee81ad07cab36362bab5a086f20acc60a80Tom Stellard#include "SIMachineFunctionInfo.h"
2390c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig#include "llvm/CodeGen/CallingConvLower.h"
24f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/CodeGen/MachineFunction.h"
25f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/CodeGen/MachineRegisterInfo.h"
26f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/CodeGen/SelectionDAG.h"
27f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/CodeGen/TargetLoweringObjectFileImpl.h"
28e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard#include "llvm/IR/DataLayout.h"
29f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
30f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardusing namespace llvm;
31f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
3290c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig#include "AMDGPUGenCallingConv.inc"
3390c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig
34f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardAMDGPUTargetLowering::AMDGPUTargetLowering(TargetMachine &TM) :
35f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  TargetLowering(TM, new TargetLoweringObjectFileELF()) {
36f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
37f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Initialize target lowering borrowed from AMDIL
38f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  InitAMDILLowering();
39f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
40f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // We need to custom lower some of the intrinsics
41f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);
42f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
43f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Library functions.  These default to Expand, but we have instructions
44f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // for them.
45f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::FCEIL,  MVT::f32, Legal);
46f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::FEXP2,  MVT::f32, Legal);
47f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::FPOW,   MVT::f32, Legal);
48f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::FLOG2,  MVT::f32, Legal);
49f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::FABS,   MVT::f32, Legal);
50f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::FFLOOR, MVT::f32, Legal);
51f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::FRINT,  MVT::f32, Legal);
52f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
53ba534c21437ba133cb9d6b3f9dae80fa9c4f0cb7Tom Stellard  // The hardware supports ROTR, but not ROTL
54ba534c21437ba133cb9d6b3f9dae80fa9c4f0cb7Tom Stellard  setOperationAction(ISD::ROTL, MVT::i32, Expand);
55ba534c21437ba133cb9d6b3f9dae80fa9c4f0cb7Tom Stellard
56f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Lower floating point store/load to integer store/load to reduce the number
57f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // of patterns in tablegen.
58f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::STORE, MVT::f32, Promote);
59f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  AddPromotedToType(ISD::STORE, MVT::f32, MVT::i32);
60f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
61fc047278c160cf15d99502d8170d431cfcfe8a5bTom Stellard  setOperationAction(ISD::STORE, MVT::v2f32, Promote);
62fc047278c160cf15d99502d8170d431cfcfe8a5bTom Stellard  AddPromotedToType(ISD::STORE, MVT::v2f32, MVT::v2i32);
63fc047278c160cf15d99502d8170d431cfcfe8a5bTom Stellard
64f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::STORE, MVT::v4f32, Promote);
65f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  AddPromotedToType(ISD::STORE, MVT::v4f32, MVT::v4i32);
66f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
6768e132866236f5d59271d2c7ffb77a9c8e743752Tom Stellard  setOperationAction(ISD::STORE, MVT::f64, Promote);
6868e132866236f5d59271d2c7ffb77a9c8e743752Tom Stellard  AddPromotedToType(ISD::STORE, MVT::f64, MVT::i64);
6968e132866236f5d59271d2c7ffb77a9c8e743752Tom Stellard
704c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  setTruncStoreAction(MVT::v2i32, MVT::v2i16, Custom);
714c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  setTruncStoreAction(MVT::v2i32, MVT::v2i8, Custom);
724c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  setTruncStoreAction(MVT::v4i32, MVT::v4i8, Custom);
734c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  // XXX: This can be change to Custom, once ExpandVectorStores can
744c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  // handle 64-bit stores.
754c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  setTruncStoreAction(MVT::v4i32, MVT::v4i16, Expand);
764c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard
77f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::LOAD, MVT::f32, Promote);
78f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  AddPromotedToType(ISD::LOAD, MVT::f32, MVT::i32);
79f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
80ac85f3f65ce67f71bb8e4626e0a50d818500e426Tom Stellard  setOperationAction(ISD::LOAD, MVT::v2f32, Promote);
81ac85f3f65ce67f71bb8e4626e0a50d818500e426Tom Stellard  AddPromotedToType(ISD::LOAD, MVT::v2f32, MVT::v2i32);
82ac85f3f65ce67f71bb8e4626e0a50d818500e426Tom Stellard
83f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::LOAD, MVT::v4f32, Promote);
84f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  AddPromotedToType(ISD::LOAD, MVT::v4f32, MVT::v4i32);
85f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
8668e132866236f5d59271d2c7ffb77a9c8e743752Tom Stellard  setOperationAction(ISD::LOAD, MVT::f64, Promote);
8768e132866236f5d59271d2c7ffb77a9c8e743752Tom Stellard  AddPromotedToType(ISD::LOAD, MVT::f64, MVT::i64);
8868e132866236f5d59271d2c7ffb77a9c8e743752Tom Stellard
89a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  setOperationAction(ISD::CONCAT_VECTORS, MVT::v4i32, Custom);
90a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  setOperationAction(ISD::CONCAT_VECTORS, MVT::v4f32, Custom);
91a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  setOperationAction(ISD::EXTRACT_SUBVECTOR, MVT::v2i32, Custom);
92a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  setOperationAction(ISD::EXTRACT_SUBVECTOR, MVT::v2f32, Custom);
93692ee102ebef535d311c35d53457028083e5c5beTom Stellard
9430d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::EXTLOAD, MVT::v2i8, Expand);
9530d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::SEXTLOAD, MVT::v2i8, Expand);
9630d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::ZEXTLOAD, MVT::v2i8, Expand);
9730d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::EXTLOAD, MVT::v4i8, Expand);
9830d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::SEXTLOAD, MVT::v4i8, Expand);
9930d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::ZEXTLOAD, MVT::v4i8, Expand);
10030d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::EXTLOAD, MVT::v2i16, Expand);
10130d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::SEXTLOAD, MVT::v2i16, Expand);
10230d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::ZEXTLOAD, MVT::v2i16, Expand);
10330d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::EXTLOAD, MVT::v4i16, Expand);
10430d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::SEXTLOAD, MVT::v4i16, Expand);
10530d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard  setLoadExtAction(ISD::ZEXTLOAD, MVT::v4i16, Expand);
10630d84d8dfa0433088d541c66b92af0da3855bc9cTom Stellard
107d7a472c9c696ebf010835d9254fb15036e558d84Tom Stellard  setOperationAction(ISD::FNEG, MVT::v2f32, Expand);
108d7a472c9c696ebf010835d9254fb15036e558d84Tom Stellard  setOperationAction(ISD::FNEG, MVT::v4f32, Expand);
109d7a472c9c696ebf010835d9254fb15036e558d84Tom Stellard
11045b14e341a8a85e877d001bbd43f5e2b25b61cb8Christian Konig  setOperationAction(ISD::MUL, MVT::i64, Expand);
11145b14e341a8a85e877d001bbd43f5e2b25b61cb8Christian Konig
112f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::UDIV, MVT::i32, Expand);
113f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::UDIVREM, MVT::i32, Custom);
114f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  setOperationAction(ISD::UREM, MVT::i32, Expand);
115f5660aab413539bd94cfea8cd88fed80c54cd984Tom Stellard  setOperationAction(ISD::VSELECT, MVT::v2f32, Expand);
116f5660aab413539bd94cfea8cd88fed80c54cd984Tom Stellard  setOperationAction(ISD::VSELECT, MVT::v4f32, Expand);
117f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry
1185464a92861c76f1e091cd219dee71ce9858eb195Tom Stellard  static const MVT::SimpleValueType IntTypes[] = {
1195464a92861c76f1e091cd219dee71ce9858eb195Tom Stellard    MVT::v2i32, MVT::v4i32
120f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry  };
1210991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard  const size_t NumIntTypes = array_lengthof(IntTypes);
122f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry
1230991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard  for (unsigned int x  = 0; x < NumIntTypes; ++x) {
1245464a92861c76f1e091cd219dee71ce9858eb195Tom Stellard    MVT::SimpleValueType VT = IntTypes[x];
125f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    //Expand the following operations for the current type by default
126f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::ADD,  VT, Expand);
127f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::AND,  VT, Expand);
128e3d60ac33421a69545e2989b890899d76a918d2fTom Stellard    setOperationAction(ISD::FP_TO_SINT, VT, Expand);
129e3d60ac33421a69545e2989b890899d76a918d2fTom Stellard    setOperationAction(ISD::FP_TO_UINT, VT, Expand);
130f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::MUL,  VT, Expand);
131f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::OR,   VT, Expand);
132f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::SHL,  VT, Expand);
133e3d60ac33421a69545e2989b890899d76a918d2fTom Stellard    setOperationAction(ISD::SINT_TO_FP, VT, Expand);
134f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::SRL,  VT, Expand);
135f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::SRA,  VT, Expand);
136f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::SUB,  VT, Expand);
137f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::UDIV, VT, Expand);
138e3d60ac33421a69545e2989b890899d76a918d2fTom Stellard    setOperationAction(ISD::UINT_TO_FP, VT, Expand);
139f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::UREM, VT, Expand);
140f5660aab413539bd94cfea8cd88fed80c54cd984Tom Stellard    setOperationAction(ISD::VSELECT, VT, Expand);
141f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry    setOperationAction(ISD::XOR,  VT, Expand);
142f97c7fef52098bbd6a7ccc69657d112a36d77660Aaron Watry  }
1430991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard
1445464a92861c76f1e091cd219dee71ce9858eb195Tom Stellard  static const MVT::SimpleValueType FloatTypes[] = {
1455464a92861c76f1e091cd219dee71ce9858eb195Tom Stellard    MVT::v2f32, MVT::v4f32
1460991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard  };
1470991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard  const size_t NumFloatTypes = array_lengthof(FloatTypes);
1480991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard
1490991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard  for (unsigned int x = 0; x < NumFloatTypes; ++x) {
1505464a92861c76f1e091cd219dee71ce9858eb195Tom Stellard    MVT::SimpleValueType VT = FloatTypes[x];
1510991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard    setOperationAction(ISD::FADD, VT, Expand);
1520991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard    setOperationAction(ISD::FDIV, VT, Expand);
15384c0bd9803547b1cb09a20032bbc151a718b9457Tom Stellard    setOperationAction(ISD::FFLOOR, VT, Expand);
1540991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard    setOperationAction(ISD::FMUL, VT, Expand);
1553cae823f69f083c5eef19f0ea3128c48d7807c9bTom Stellard    setOperationAction(ISD::FRINT, VT, Expand);
1560991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard    setOperationAction(ISD::FSUB, VT, Expand);
1570991c314d7c1a2052963dc89af1d2f07134488b6Tom Stellard  }
158f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
159f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
1602b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard//===----------------------------------------------------------------------===//
1612b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard// Target Information
1622b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard//===----------------------------------------------------------------------===//
1632b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard
1642b272a1c8cb6d9f02223a598495d84cd9d75b13dTom StellardMVT AMDGPUTargetLowering::getVectorIdxTy() const {
1652b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard  return MVT::i32;
1662b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard}
1672b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard
1682b272a1c8cb6d9f02223a598495d84cd9d75b13dTom Stellard
169f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===---------------------------------------------------------------------===//
1701f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard// Target Properties
1711f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard//===---------------------------------------------------------------------===//
1721f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard
1731f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellardbool AMDGPUTargetLowering::isFAbsFree(EVT VT) const {
1741f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard  assert(VT.isFloatingPoint());
1751f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard  return VT == MVT::f32;
1761f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard}
1771f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard
1781f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellardbool AMDGPUTargetLowering::isFNegFree(EVT VT) const {
1791f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard  assert(VT.isFloatingPoint());
1801f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard  return VT == MVT::f32;
1811f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard}
1821f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard
1831f67c63cb23ba5d405452d72bb8892df6b7ccd4fTom Stellard//===---------------------------------------------------------------------===//
184f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard// TargetLowering Callbacks
185f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===---------------------------------------------------------------------===//
186f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
18790c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konigvoid AMDGPUTargetLowering::AnalyzeFormalArguments(CCState &State,
18890c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig                             const SmallVectorImpl<ISD::InputArg> &Ins) const {
18990c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig
19090c64cbaa124e0e8541680efeaa56f0e6eb78d9aChristian Konig  State.AnalyzeFormalArguments(Ins, CC_AMDGPU);
191f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
192f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
193f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::LowerReturn(
194f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     SDValue Chain,
195f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     CallingConv::ID CallConv,
196f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     bool isVarArg,
197f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     const SmallVectorImpl<ISD::OutputArg> &Outs,
198f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     const SmallVectorImpl<SDValue> &OutVals,
199ac6d9bec671252dd1e596fa71180ff6b39d06b5dAndrew Trick                                     SDLoc DL, SelectionDAG &DAG) const {
200f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return DAG.getNode(AMDGPUISD::RET_FLAG, DL, MVT::Other, Chain);
201f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
202f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
203f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===---------------------------------------------------------------------===//
204f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard// Target specific lowering
205f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===---------------------------------------------------------------------===//
206f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
207f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG)
208f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    const {
209f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  switch (Op.getOpcode()) {
210f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  default:
211f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    Op.getNode()->dump();
212f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    assert(0 && "Custom lowering code for this"
213f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard        "instruction is not implemented yet!");
214f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    break;
215f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // AMDIL DAG lowering
216f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SDIV: return LowerSDIV(Op, DAG);
217f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SREM: return LowerSREM(Op, DAG);
218f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SIGN_EXTEND_INREG: return LowerSIGN_EXTEND_INREG(Op, DAG);
219f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::BRCOND: return LowerBRCOND(Op, DAG);
220f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // AMDGPU DAG lowering
221a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  case ISD::CONCAT_VECTORS: return LowerCONCAT_VECTORS(Op, DAG);
222a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  case ISD::EXTRACT_SUBVECTOR: return LowerEXTRACT_SUBVECTOR(Op, DAG);
223f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::INTRINSIC_WO_CHAIN: return LowerINTRINSIC_WO_CHAIN(Op, DAG);
2244c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  case ISD::STORE: return LowerVectorStore(Op, DAG);
225f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::UDIVREM: return LowerUDIVREM(Op, DAG);
226f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
227f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return Op;
228f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
229f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
230e3d4cbc7d25061441adafa47450a31571c87bf85Tom StellardSDValue AMDGPUTargetLowering::LowerGlobalAddress(AMDGPUMachineFunction* MFI,
231e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard                                                 SDValue Op,
232e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard                                                 SelectionDAG &DAG) const {
233e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard
234e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  const DataLayout *TD = getTargetMachine().getDataLayout();
235e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  GlobalAddressSDNode *G = cast<GlobalAddressSDNode>(Op);
236da25cd3e6de8f21005590c2de49868f883cf2410Tom Stellard
237da25cd3e6de8f21005590c2de49868f883cf2410Tom Stellard  assert(G->getAddressSpace() == AMDGPUAS::LOCAL_ADDRESS);
238e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  // XXX: What does the value of G->getOffset() mean?
239e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  assert(G->getOffset() == 0 &&
240e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard         "Do not know what to do with an non-zero offset");
241e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard
242e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  unsigned Offset = MFI->LDSSize;
243e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  const GlobalValue *GV = G->getGlobal();
244e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  uint64_t Size = TD->getTypeAllocSize(GV->getType()->getElementType());
245e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard
246e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  // XXX: Account for alignment?
247e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard  MFI->LDSSize += Size;
248e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard
249da25cd3e6de8f21005590c2de49868f883cf2410Tom Stellard  return DAG.getConstant(Offset, getPointerTy(G->getAddressSpace()));
250e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard}
251e3d4cbc7d25061441adafa47450a31571c87bf85Tom Stellard
252a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellardvoid AMDGPUTargetLowering::ExtractVectorElements(SDValue Op, SelectionDAG &DAG,
253a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                                         SmallVectorImpl<SDValue> &Args,
254a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                                         unsigned Start,
255a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                                         unsigned Count) const {
256a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  EVT VT = Op.getValueType();
257a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  for (unsigned i = Start, e = Start + Count; i != e; ++i) {
258a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard    Args.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, SDLoc(Op),
259a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                               VT.getVectorElementType(),
260a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                               Op, DAG.getConstant(i, MVT::i32)));
261a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  }
262a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard}
263a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
264a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom StellardSDValue AMDGPUTargetLowering::LowerCONCAT_VECTORS(SDValue Op,
265a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                                                  SelectionDAG &DAG) const {
266a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  SmallVector<SDValue, 8> Args;
267a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  SDValue A = Op.getOperand(0);
268a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  SDValue B = Op.getOperand(1);
269a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
270a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  ExtractVectorElements(A, DAG, Args, 0,
271a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                        A.getValueType().getVectorNumElements());
272a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  ExtractVectorElements(B, DAG, Args, 0,
273a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                        B.getValueType().getVectorNumElements());
274a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
275a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  return DAG.getNode(ISD::BUILD_VECTOR, SDLoc(Op), Op.getValueType(),
276a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                     &Args[0], Args.size());
277a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard}
278a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
279a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom StellardSDValue AMDGPUTargetLowering::LowerEXTRACT_SUBVECTOR(SDValue Op,
280a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                                                     SelectionDAG &DAG) const {
281a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
282a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  SmallVector<SDValue, 8> Args;
283a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  EVT VT = Op.getValueType();
284a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  unsigned Start = cast<ConstantSDNode>(Op.getOperand(1))->getZExtValue();
285a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  ExtractVectorElements(Op.getOperand(0), DAG, Args, Start,
286a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                        VT.getVectorNumElements());
287a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
288a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard  return DAG.getNode(ISD::BUILD_VECTOR, SDLoc(Op), Op.getValueType(),
289a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard                     &Args[0], Args.size());
290a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard}
291a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
292a41520cf9b9cefed2091a0624a34c5f7fdb42a68Tom Stellard
293f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::LowerINTRINSIC_WO_CHAIN(SDValue Op,
294f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    SelectionDAG &DAG) const {
295f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  unsigned IntrinsicID = cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue();
296ac6d9bec671252dd1e596fa71180ff6b39d06b5dAndrew Trick  SDLoc DL(Op);
297f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  EVT VT = Op.getValueType();
298f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
299f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  switch (IntrinsicID) {
300f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    default: return Op;
301f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDIL_abs:
302f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return LowerIntrinsicIABS(Op, DAG);
303f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDIL_exp:
304f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(ISD::FEXP2, DL, VT, Op.getOperand(1));
305f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDGPU_lrp:
306f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return LowerIntrinsicLRP(Op, DAG);
307f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDIL_fraction:
308f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::FRACT, DL, VT, Op.getOperand(1));
309f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDIL_max:
310f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::FMAX, DL, VT, Op.getOperand(1),
311f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  Op.getOperand(2));
312f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDGPU_imax:
313f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::SMAX, DL, VT, Op.getOperand(1),
314f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  Op.getOperand(2));
315f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDGPU_umax:
316f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::UMAX, DL, VT, Op.getOperand(1),
317f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  Op.getOperand(2));
318f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDIL_min:
319f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::FMIN, DL, VT, Op.getOperand(1),
320f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  Op.getOperand(2));
321f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDGPU_imin:
322f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::SMIN, DL, VT, Op.getOperand(1),
323f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  Op.getOperand(2));
324f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDGPU_umin:
325f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::UMIN, DL, VT, Op.getOperand(1),
326f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  Op.getOperand(2));
327f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    case AMDGPUIntrinsic::AMDIL_round_nearest:
328f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(ISD::FRINT, DL, VT, Op.getOperand(1));
329f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
330f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
331f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
332f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard///IABS(a) = SMAX(sub(0, a), a)
333f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::LowerIntrinsicIABS(SDValue Op,
334f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    SelectionDAG &DAG) const {
335f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
336ac6d9bec671252dd1e596fa71180ff6b39d06b5dAndrew Trick  SDLoc DL(Op);
337f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  EVT VT = Op.getValueType();
338f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Neg = DAG.getNode(ISD::SUB, DL, VT, DAG.getConstant(0, VT),
339f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                              Op.getOperand(1));
340f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
341f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return DAG.getNode(AMDGPUISD::SMAX, DL, VT, Neg, Op.getOperand(1));
342f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
343f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
344f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard/// Linear Interpolation
345f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard/// LRP(a, b, c) = muladd(a,  b, (1 - a) * c)
346f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::LowerIntrinsicLRP(SDValue Op,
347f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    SelectionDAG &DAG) const {
348ac6d9bec671252dd1e596fa71180ff6b39d06b5dAndrew Trick  SDLoc DL(Op);
349f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  EVT VT = Op.getValueType();
350f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue OneSubA = DAG.getNode(ISD::FSUB, DL, VT,
351f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                DAG.getConstantFP(1.0f, MVT::f32),
352f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                Op.getOperand(1));
353f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue OneSubAC = DAG.getNode(ISD::FMUL, DL, VT, OneSubA,
354f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                    Op.getOperand(3));
355e3111964a0902bc38440980b0915b189f829c395Vincent Lejeune  return DAG.getNode(ISD::FADD, DL, VT,
356e3111964a0902bc38440980b0915b189f829c395Vincent Lejeune      DAG.getNode(ISD::FMUL, DL, VT, Op.getOperand(1), Op.getOperand(2)),
357e3111964a0902bc38440980b0915b189f829c395Vincent Lejeune      OneSubAC);
358f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
359f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
360f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard/// \brief Generate Min/Max node
361f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::LowerMinMax(SDValue Op,
362f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    SelectionDAG &DAG) const {
363ac6d9bec671252dd1e596fa71180ff6b39d06b5dAndrew Trick  SDLoc DL(Op);
364f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  EVT VT = Op.getValueType();
365f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
366f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue LHS = Op.getOperand(0);
367f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue RHS = Op.getOperand(1);
368f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue True = Op.getOperand(2);
369f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue False = Op.getOperand(3);
370f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue CC = Op.getOperand(4);
371f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
372f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  if (VT != MVT::f32 ||
373f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      !((LHS == True && RHS == False) || (LHS == False && RHS == True))) {
374f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return SDValue();
375f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
376f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
377f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  ISD::CondCode CCOpcode = cast<CondCodeSDNode>(CC)->get();
378f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  switch (CCOpcode) {
379f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETOEQ:
380f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETONE:
381f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETUNE:
382f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETNE:
383f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETUEQ:
384f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETEQ:
385f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETFALSE:
386f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETFALSE2:
387f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETTRUE:
388f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETTRUE2:
389f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETUO:
390f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETO:
391f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    assert(0 && "Operation should already be optimised !");
392f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETULE:
393f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETULT:
394f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETOLE:
395f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETOLT:
396f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETLE:
397f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETLT: {
398f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    if (LHS == True)
399f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::FMIN, DL, VT, LHS, RHS);
400f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    else
401f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::FMAX, DL, VT, LHS, RHS);
402f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
403f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETGT:
404f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETGE:
405f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETUGE:
406f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETOGE:
407f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETUGT:
408f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETOGT: {
409f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    if (LHS == True)
410f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::FMAX, DL, VT, LHS, RHS);
411f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    else
412f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return DAG.getNode(AMDGPUISD::FMIN, DL, VT, LHS, RHS);
413f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
414f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  case ISD::SETCC_INVALID:
415f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    assert(0 && "Invalid setcc condcode !");
416f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
417f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return Op;
418f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
419f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
420f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
421f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
422f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::LowerUDIVREM(SDValue Op,
423f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    SelectionDAG &DAG) const {
424ac6d9bec671252dd1e596fa71180ff6b39d06b5dAndrew Trick  SDLoc DL(Op);
425f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  EVT VT = Op.getValueType();
426f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
427f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Num = Op.getOperand(0);
428f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Den = Op.getOperand(1);
429f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
430f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SmallVector<SDValue, 8> Results;
431f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
432f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // RCP =  URECIP(Den) = 2^32 / Den + e
433f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // e is rounding error.
434f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue RCP = DAG.getNode(AMDGPUISD::URECIP, DL, VT, Den);
435f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
436f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // RCP_LO = umulo(RCP, Den) */
437f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue RCP_LO = DAG.getNode(ISD::UMULO, DL, VT, RCP, Den);
438f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
439f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // RCP_HI = mulhu (RCP, Den) */
440f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue RCP_HI = DAG.getNode(ISD::MULHU, DL, VT, RCP, Den);
441f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
442f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // NEG_RCP_LO = -RCP_LO
443f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue NEG_RCP_LO = DAG.getNode(ISD::SUB, DL, VT, DAG.getConstant(0, VT),
444f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                     RCP_LO);
445f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
446f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // ABS_RCP_LO = (RCP_HI == 0 ? NEG_RCP_LO : RCP_LO)
447f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue ABS_RCP_LO = DAG.getSelectCC(DL, RCP_HI, DAG.getConstant(0, VT),
448f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                           NEG_RCP_LO, RCP_LO,
449f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                           ISD::SETEQ);
450f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Calculate the rounding error from the URECIP instruction
451f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // E = mulhu(ABS_RCP_LO, RCP)
452f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue E = DAG.getNode(ISD::MULHU, DL, VT, ABS_RCP_LO, RCP);
453f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
454f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // RCP_A_E = RCP + E
455f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue RCP_A_E = DAG.getNode(ISD::ADD, DL, VT, RCP, E);
456f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
457f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // RCP_S_E = RCP - E
458f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue RCP_S_E = DAG.getNode(ISD::SUB, DL, VT, RCP, E);
459f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
460f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Tmp0 = (RCP_HI == 0 ? RCP_A_E : RCP_SUB_E)
461f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Tmp0 = DAG.getSelectCC(DL, RCP_HI, DAG.getConstant(0, VT),
462f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     RCP_A_E, RCP_S_E,
463f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     ISD::SETEQ);
464f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Quotient = mulhu(Tmp0, Num)
465f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Quotient = DAG.getNode(ISD::MULHU, DL, VT, Tmp0, Num);
466f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
467f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Num_S_Remainder = Quotient * Den
468f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Num_S_Remainder = DAG.getNode(ISD::UMULO, DL, VT, Quotient, Den);
469f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
470f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Remainder = Num - Num_S_Remainder
471f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Remainder = DAG.getNode(ISD::SUB, DL, VT, Num, Num_S_Remainder);
472f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
473f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Remainder_GE_Den = (Remainder >= Den ? -1 : 0)
474f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Remainder_GE_Den = DAG.getSelectCC(DL, Remainder, Den,
475f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                 DAG.getConstant(-1, VT),
476f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                 DAG.getConstant(0, VT),
477f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                 ISD::SETGE);
478f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Remainder_GE_Zero = (Remainder >= 0 ? -1 : 0)
479f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Remainder_GE_Zero = DAG.getSelectCC(DL, Remainder,
480f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  DAG.getConstant(0, VT),
481f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  DAG.getConstant(-1, VT),
482f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  DAG.getConstant(0, VT),
483f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  ISD::SETGE);
484f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Tmp1 = Remainder_GE_Den & Remainder_GE_Zero
485f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Tmp1 = DAG.getNode(ISD::AND, DL, VT, Remainder_GE_Den,
486f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                               Remainder_GE_Zero);
487f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
488f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Calculate Division result:
489f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
490f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Quotient_A_One = Quotient + 1
491f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Quotient_A_One = DAG.getNode(ISD::ADD, DL, VT, Quotient,
492f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                         DAG.getConstant(1, VT));
493f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
494f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Quotient_S_One = Quotient - 1
495f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Quotient_S_One = DAG.getNode(ISD::SUB, DL, VT, Quotient,
496f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                         DAG.getConstant(1, VT));
497f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
498f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Div = (Tmp1 == 0 ? Quotient : Quotient_A_One)
499f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Div = DAG.getSelectCC(DL, Tmp1, DAG.getConstant(0, VT),
500f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     Quotient, Quotient_A_One, ISD::SETEQ);
501f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
502f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Div = (Remainder_GE_Zero == 0 ? Quotient_S_One : Div)
503f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  Div = DAG.getSelectCC(DL, Remainder_GE_Zero, DAG.getConstant(0, VT),
504f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                            Quotient_S_One, Div, ISD::SETEQ);
505f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
506f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Calculate Rem result:
507f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
508f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Remainder_S_Den = Remainder - Den
509f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Remainder_S_Den = DAG.getNode(ISD::SUB, DL, VT, Remainder, Den);
510f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
511f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Remainder_A_Den = Remainder + Den
512f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Remainder_A_Den = DAG.getNode(ISD::ADD, DL, VT, Remainder, Den);
513f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
514f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Rem = (Tmp1 == 0 ? Remainder : Remainder_S_Den)
515f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Rem = DAG.getSelectCC(DL, Tmp1, DAG.getConstant(0, VT),
516f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                    Remainder, Remainder_S_Den, ISD::SETEQ);
517f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
518f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // Rem = (Remainder_GE_Zero == 0 ? Remainder_A_Den : Rem)
519f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  Rem = DAG.getSelectCC(DL, Remainder_GE_Zero, DAG.getConstant(0, VT),
520f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                            Remainder_A_Den, Rem, ISD::SETEQ);
521f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  SDValue Ops[2];
522f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  Ops[0] = Div;
523f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  Ops[1] = Rem;
524f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return DAG.getMergeValues(Ops, 2, DL);
525f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
526f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
5274c52d450dc3968267d1f089d36397fc785dcc7b4Tom StellardSDValue AMDGPUTargetLowering::LowerVectorStore(const SDValue &Op,
5284c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard                                               SelectionDAG &DAG) const {
5294c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  StoreSDNode *Store = dyn_cast<StoreSDNode>(Op);
5304c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  EVT MemVT = Store->getMemoryVT();
5314c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  unsigned MemBits = MemVT.getSizeInBits();
5324c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard
5334c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  // Byte stores are really expensive, so if possible, try to pack
5344c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  // 32-bit vector truncatating store into an i32 store.
5354c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  // XXX: We could also handle optimize other vector bitwidths
5364c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  if (!MemVT.isVector() || MemBits > 32) {
5374c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    return SDValue();
5384c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  }
5394c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard
5404c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  SDLoc DL(Op);
5414c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  const SDValue &Value = Store->getValue();
5424c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  EVT VT = Value.getValueType();
5434c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  const SDValue &Ptr = Store->getBasePtr();
5444c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  EVT MemEltVT = MemVT.getVectorElementType();
5454c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  unsigned MemEltBits = MemEltVT.getSizeInBits();
5464c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  unsigned MemNumElements = MemVT.getVectorNumElements();
5474c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  EVT PackedVT = EVT::getIntegerVT(*DAG.getContext(), MemVT.getSizeInBits());
5484c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  SDValue Mask;
5494c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  switch(MemEltBits) {
5504c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  case 8:
5514c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    Mask = DAG.getConstant(0xFF, PackedVT);
5524c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    break;
5534c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  case 16:
5544c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    Mask = DAG.getConstant(0xFFFF, PackedVT);
5554c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    break;
5564c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  default:
5574c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    llvm_unreachable("Cannot lower this vector store");
5584c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  }
5594c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  SDValue PackedValue;
5604c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  for (unsigned i = 0; i < MemNumElements; ++i) {
5614c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    EVT ElemVT = VT.getVectorElementType();
5624c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    SDValue Elt = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, ElemVT, Value,
5634c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard                              DAG.getConstant(i, MVT::i32));
5644c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    Elt = DAG.getZExtOrTrunc(Elt, DL, PackedVT);
5654c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    Elt = DAG.getNode(ISD::AND, DL, PackedVT, Elt, Mask);
5664c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    SDValue Shift = DAG.getConstant(MemEltBits * i, PackedVT);
5674c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    Elt = DAG.getNode(ISD::SHL, DL, PackedVT, Elt, Shift);
5684c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    if (i == 0) {
5694c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard      PackedValue = Elt;
5704c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    } else {
5714c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard      PackedValue = DAG.getNode(ISD::OR, DL, PackedVT, PackedValue, Elt);
5724c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard    }
5734c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  }
5744c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard  return DAG.getStore(Store->getChain(), DL, PackedValue, Ptr,
5754c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard                      MachinePointerInfo(Store->getMemOperand()->getValue()),
5764c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard                      Store->isVolatile(),  Store->isNonTemporal(),
5774c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard                      Store->getAlignment());
5784c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard}
5794c52d450dc3968267d1f089d36397fc785dcc7b4Tom Stellard
580f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===----------------------------------------------------------------------===//
581f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard// Helper functions
582f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===----------------------------------------------------------------------===//
583f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
584f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardbool AMDGPUTargetLowering::isHWTrueValue(SDValue Op) const {
585f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  if (ConstantFPSDNode * CFP = dyn_cast<ConstantFPSDNode>(Op)) {
586f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return CFP->isExactlyValue(1.0);
587f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
588f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
589f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return C->isAllOnesValue();
590f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
591f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return false;
592f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
593f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
594f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardbool AMDGPUTargetLowering::isHWFalseValue(SDValue Op) const {
595f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  if (ConstantFPSDNode * CFP = dyn_cast<ConstantFPSDNode>(Op)) {
596f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return CFP->getValueAPF().isZero();
597f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
598f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
599f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return C->isNullValue();
600f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
601f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return false;
602f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
603f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
604f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardSDValue AMDGPUTargetLowering::CreateLiveInRegister(SelectionDAG &DAG,
605f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                  const TargetRegisterClass *RC,
606f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                                   unsigned Reg, EVT VT) const {
607f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  MachineFunction &MF = DAG.getMachineFunction();
608f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  MachineRegisterInfo &MRI = MF.getRegInfo();
609f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  unsigned VirtualRegister;
610f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  if (!MRI.isLiveIn(Reg)) {
611f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    VirtualRegister = MRI.createVirtualRegister(RC);
612f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    MRI.addLiveIn(Reg, VirtualRegister);
613f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  } else {
614f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    VirtualRegister = MRI.getLiveInVirtReg(Reg);
615f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
616f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return DAG.getRegister(VirtualRegister, VT);
617f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
618f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
619f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#define NODE_NAME_CASE(node) case AMDGPUISD::node: return #node;
620f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
621f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardconst char* AMDGPUTargetLowering::getTargetNodeName(unsigned Opcode) const {
622f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  switch (Opcode) {
623f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  default: return 0;
624f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // AMDIL DAG nodes
625f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(CALL);
626f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(UMUL);
627f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(DIV_INF);
628f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(RET_FLAG);
629f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(BRANCH_COND);
630f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
631f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  // AMDGPU DAG nodes
632f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(DWORDADDR)
633f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(FRACT)
634f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(FMAX)
635f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(SMAX)
636f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(UMAX)
637f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(FMIN)
638f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(SMIN)
639f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(UMIN)
640f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(URECIP)
641f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  NODE_NAME_CASE(EXPORT)
642c7e1888d93f4cb2982266986f3af7e99df631fa1Tom Stellard  NODE_NAME_CASE(CONST_ADDRESS)
643c0b0c677a1138f0a5ce1435fc1e70cef38fd95c8Tom Stellard  NODE_NAME_CASE(REGISTER_LOAD)
644c0b0c677a1138f0a5ce1435fc1e70cef38fd95c8Tom Stellard  NODE_NAME_CASE(REGISTER_STORE)
64568db37b952be497c94c7aa98cf26f3baadb5afd3Tom Stellard  NODE_NAME_CASE(LOAD_CONSTANT)
64668db37b952be497c94c7aa98cf26f3baadb5afd3Tom Stellard  NODE_NAME_CASE(LOAD_INPUT)
64768db37b952be497c94c7aa98cf26f3baadb5afd3Tom Stellard  NODE_NAME_CASE(SAMPLE)
64868db37b952be497c94c7aa98cf26f3baadb5afd3Tom Stellard  NODE_NAME_CASE(SAMPLEB)
64968db37b952be497c94c7aa98cf26f3baadb5afd3Tom Stellard  NODE_NAME_CASE(SAMPLED)
65068db37b952be497c94c7aa98cf26f3baadb5afd3Tom Stellard  NODE_NAME_CASE(SAMPLEL)
651ec484277dd04399d7b2ea37508e39fc4998bc9a7Tom Stellard  NODE_NAME_CASE(STORE_MSKOR)
652f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
653f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
654