[PATCH RFC 3/4] R600: Implement iterative algorithm for udivrem

Jan Vesely jan.vesely at rutgers.edu
Fri Apr 25 12:08:37 PDT 2014


Initial implementation, rather slow

Signed-off-by: Jan Vesely <jan.vesely at rutgers.edu>
---
 lib/Target/R600/AMDGPUISelLowering.cpp | 50 ++++++++++++++++++++++++++++++++++
 1 file changed, 50 insertions(+)

diff --git a/lib/Target/R600/AMDGPUISelLowering.cpp b/lib/Target/R600/AMDGPUISelLowering.cpp
index 01d1eaf..a004b91 100644
--- a/lib/Target/R600/AMDGPUISelLowering.cpp
+++ b/lib/Target/R600/AMDGPUISelLowering.cpp
@@ -429,6 +429,56 @@ void AMDGPUTargetLowering::ReplaceNodeResults(SDNode *N,
     Results.push_back(UDIVREM.getValue(1));
     break;
   }
+  case ISD::UDIVREM: {
+    SDValue Op = SDValue(N, 0);
+    SDLoc DL(Op);
+    EVT VT = Op.getValueType();
+    EVT HalfVT = VT.getHalfSizedIntegerVT(*DAG.getContext());
+
+    //HiLo split
+    SDValue LHS_Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, HalfVT,
+      N->getOperand(0), DAG.getConstant(0, HalfVT));
+    SDValue LHS_Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, HalfVT,
+      N->getOperand(0), DAG.getConstant(1, HalfVT));
+
+    SDValue RHS = N->getOperand(1);
+
+    SDValue DIV = DAG.getConstant(0, VT);
+    SDValue REM = DAG.getConstant(0, VT);
+
+    const unsigned bitWidth = VT.getSizeInBits();
+    const unsigned halfBitWidth = HalfVT.getSizeInBits();
+
+    SDValue one = DAG.getConstant(1, HalfVT);
+    SDValue one_VT = DAG.getConstant(1, VT);
+    for (unsigned i = 0; i < bitWidth; ++i) {
+      SDValue POS = DAG.getConstant((bitWidth - i - 1) % halfBitWidth, HalfVT);
+      // Get Value of high bit
+      SDValue HBit = DAG.getNode(ISD::SRL, DL, HalfVT,
+        i < halfBitWidth ? LHS_Hi : LHS_Lo, POS);
+      HBit = DAG.getNode(ISD::AND, DL, HalfVT, HBit, one);
+      HBit = DAG.getNode(ISD::ZERO_EXTEND, DL, VT, HBit);
+
+      // Add the high bit to shifted remainder
+      REM = DAG.getNode(ISD::SHL, DL, VT, REM, one);
+      REM = DAG.getNode(ISD::OR, DL, VT, REM, HBit);
+
+      // Update DIV
+      SDValue ShDIV = DAG.getNode(ISD::SHL, DL, VT, DIV, one);
+      SDValue ShDIV_plus = DAG.getNode(ISD::OR, DL, VT, ShDIV, one_VT);
+
+      DIV = DAG.getSelectCC(DL, REM, RHS, ShDIV_plus, ShDIV, ISD::SETGE);
+
+      // Update REM
+      SDValue REM_sub = DAG.getNode(ISD::SUB, DL, VT, REM, RHS);
+
+      REM = DAG.getSelectCC(DL, REM, RHS, REM_sub, REM, ISD::SETGE);
+    }
+
+    Results.push_back(DIV);
+    Results.push_back(REM);
+    break;
+  }
   default:
     return;
   }
-- 
1.9.0




More information about the llvm-commits mailing list