
Introduce infrastructure for an incremental port of SelectionDAG atomic load/store handling

This is the first patch in a large sequence. The eventual goal is to have unordered atomic loads and stores - and possibly ordered atomics as well - handled through the normal ISEL codepaths for loads and stores. Today, they're handled with instances of AtomicSDNode, which means every transform has to be duplicated to work for unordered atomics. The benefit of the current design is that it's harder to introduce a silent miscompile by adding a transform which forgets about atomicity. See the thread on llvm-dev titled "FYI: proposed changes to atomic load/store in SelectionDAG" for further context.
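For concreteness, here is the kind of IR in question (a minimal sketch; the function name is illustrative). Today the unordered load below is built as an ATOMIC_LOAD AtomicSDNode; the goal is for it to be built as an ordinary LoadSDNode whose MachineMemOperand is flagged atomic:

    define i64 @load_unordered(i64* %p) {
      %v = load atomic i64, i64* %p unordered, align 8
      ret i64 %v
    }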

Note that this patch is NFC unless the experimental flag is set.

The basic strategy I plan on taking is:

    1) Introduce infrastructure and a flag for testing (this patch).
    2) Audit uses of isVolatile, and apply isAtomic conservatively*.
    3) Piecemeal, conservatively* update generic code and x86 backend code in individual reviews, with tests for cases which didn't check volatile but can be found by inspection.
    4) Flip the flag at the end (with minimal diffs).
    5) Work through the todo list identified in (2) and (3), exposing the performance opportunities.

(*) The "conservative" bit here is aimed at minimizing the number of diffs involved in (4). Ideally, there'd be none. In practice, getting it down to something reviewable by a human is the actual goal. Note that there are (currently) no paths which produce LoadSDNode or StoreSDNode with atomic MMOs, so we don't need to worry about preserving any behaviour there.

We've taken a very similar strategy twice before, with success - once at the IR level, and once at the MI level (post-ISEL).

Differential Revision: https://reviews.llvm.org/D66309



git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@371441 91177308-0d34-0410-b5e6-96231b3b80d8
Philip Reames, 6 years ago
Commit 4113e2297d

+ 0 - 2
include/llvm/CodeGen/SelectionDAGNodes.h

@@ -2197,8 +2197,6 @@ public:
       : MemSDNode(NodeTy, Order, dl, VTs, MemVT, MMO) {
     LSBaseSDNodeBits.AddressingMode = AM;
     assert(getAddressingMode() == AM && "Value truncated");
-    assert((!MMO->isAtomic() || MMO->isVolatile()) &&
-           "use an AtomicSDNode instead for non-volatile atomics");
   }
 
   const SDValue &getOffset() const {

+ 19 - 0
include/llvm/CodeGen/TargetLowering.h

@@ -3716,6 +3716,25 @@ public:
     return MachineMemOperand::MONone;
   }
 
+  /// Should SelectionDAG lower an atomic store of the given kind as a normal
+  /// StoreSDNode (as opposed to an AtomicSDNode)?  NOTE: The intention is to
+  /// eventually migrate all targets to using StoreSDNodes, but porting is
+  /// being done one target at a time.
+  virtual bool lowerAtomicStoreAsStoreSDNode(const StoreInst &SI) const {
+    assert(SI.isAtomic() && "violated precondition");
+    return false;
+  }
+
+  /// Should SelectionDAG lower an atomic load of the given kind as a normal
+  /// LoadSDNode (as opposed to an AtomicSDNode)?  NOTE: The intention is to
+  /// eventually migrate all targets to using LoadSDNodes, but porting is
+  /// being done one target at a time.
+  virtual bool lowerAtomicLoadAsLoadSDNode(const LoadInst &LI) const {
+    assert(LI.isAtomic() && "violated precondition");
+    return false;
+  }
+
+
   /// This callback is invoked by the type legalizer to legalize nodes with an
   /// illegal operand type but legal result types.  It replaces the
   /// LowerOperation callback in the type Legalizer.  The reason we can not do

+ 29 - 4
lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

@@ -4658,9 +4658,26 @@ void SelectionDAGBuilder::visitAtomicLoad(const LoadInst &I) {
                            AAMDNodes(), nullptr, SSID, Order);
 
   InChain = TLI.prepareVolatileOrAtomicLoad(InChain, dl, DAG);
-  SDValue L =
-      DAG.getAtomic(ISD::ATOMIC_LOAD, dl, MemVT, MemVT, InChain,
-                    getValue(I.getPointerOperand()), MMO);
+
+  SDValue Ptr = getValue(I.getPointerOperand());
+
+  if (TLI.lowerAtomicLoadAsLoadSDNode(I)) {
+    // TODO: Once this is better exercised by tests, it should be merged with
+    // the normal path for loads to prevent future divergence.
+    SDValue L = DAG.getLoad(MemVT, dl, InChain, Ptr, MMO);
+    if (MemVT != VT)
+      L = DAG.getPtrExtOrTrunc(L, dl, VT);
+
+    setValue(&I, L);
+    if (!I.isUnordered()) {
+      SDValue OutChain = L.getValue(1);
+      DAG.setRoot(OutChain);
+    }
+    return;
+  }
+
+  SDValue L = DAG.getAtomic(ISD::ATOMIC_LOAD, dl, MemVT, MemVT, InChain,
+                            Ptr, MMO);
 
   SDValue OutChain = L.getValue(1);
   if (MemVT != VT)
@@ -4699,9 +4716,17 @@ void SelectionDAGBuilder::visitAtomicStore(const StoreInst &I) {
   SDValue Val = getValue(I.getValueOperand());
   if (Val.getValueType() != MemVT)
     Val = DAG.getPtrExtOrTrunc(Val, dl, MemVT);
+  SDValue Ptr = getValue(I.getPointerOperand());
 
+  if (TLI.lowerAtomicStoreAsStoreSDNode(I)) {
+    // TODO: Once this is better exercised by tests, it should be merged with
+    // the normal path for stores to prevent future divergence.
+    SDValue S = DAG.getStore(InChain, dl, Val, Ptr, MMO);
+    DAG.setRoot(S);
+    return;
+  }
   SDValue OutChain = DAG.getAtomic(ISD::ATOMIC_STORE, dl, MemVT, InChain,
-                                   getValue(I.getPointerOperand()), Val, MMO);
+                                   Ptr, Val, MMO);
 
   DAG.setRoot(OutChain);
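With the new hook returning true, visitAtomicStore routes an unordered atomic store like the following through DAG.getStore, producing a plain StoreSDNode (a minimal IR sketch; the function name is illustrative):

    define void @store_unordered(i64* %p, i64 %v) {
      store atomic i64 %v, i64* %p unordered, align 8
      ret void
    }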

+ 19 - 0
lib/Target/X86/X86ISelLowering.cpp

@@ -92,6 +92,13 @@ static cl::opt<bool> MulConstantOptimization(
              "SHIFT, LEA, etc."),
     cl::Hidden);
 
+static cl::opt<bool> ExperimentalUnorderedISEL(
+    "x86-experimental-unordered-atomic-isel", cl::init(false),
+    cl::desc("Use LoadSDNode and StoreSDNode instead of "
+             "AtomicSDNode for unordered atomic loads and "
+             "stores respectively."),
+    cl::Hidden);
+
 /// Call this when the user attempts to do something unsupported, like
 /// returning a double without SSE2 enabled on x86_64. This is not fatal, unlike
 /// report_fatal_error, so calling code should attempt to recover without
@@ -26493,6 +26500,18 @@ X86TargetLowering::lowerIdempotentRMWIntoFencedLoad(AtomicRMWInst *AI) const {
   return Loaded;
 }
 
+bool X86TargetLowering::lowerAtomicStoreAsStoreSDNode(const StoreInst &SI) const {
+  if (!SI.isUnordered())
+    return false;
+  return ExperimentalUnorderedISEL;
+}
+bool X86TargetLowering::lowerAtomicLoadAsLoadSDNode(const LoadInst &LI) const {
+  if (!LI.isUnordered())
+    return false;
+  return ExperimentalUnorderedISEL;
+}
+
+
 /// Emit a locked operation on a stack location which does not change any
 /// memory location, but does involve a lock prefix.  Location is chosen to be
 /// a) very likely accessed only by a single thread to minimize cache traffic,
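Note that the X86 overrides return true only for unordered accesses, so even with the flag set, anything stronger keeps the AtomicSDNode path. For example, a monotonic load such as this sketch is unaffected:

    define i64 @load_monotonic(i64* %p) {
      %v = load atomic i64, i64* %p monotonic, align 8
      ret i64 %v
    }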

+ 3 - 0
lib/Target/X86/X86ISelLowering.h

@@ -1388,6 +1388,9 @@ namespace llvm {
     LoadInst *
     lowerIdempotentRMWIntoFencedLoad(AtomicRMWInst *AI) const override;
 
+    bool lowerAtomicStoreAsStoreSDNode(const StoreInst &SI) const override;
+    bool lowerAtomicLoadAsLoadSDNode(const LoadInst &LI) const override;
+
     bool needsCmpXchgNb(Type *MemType) const;
 
     void SetupEntryBlockForSjLj(MachineInstr &MI, MachineBasicBlock *MBB,

+ 571 - 38
test/CodeGen/X86/atomic-unordered.ll

(Diff too large to display.)
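Since the test diff is too large to render here, a representative case in the style of that file might look like the following (a sketch, not copied from the test; the CHECK lines assume the usual x86-64 lowering of an unordered i64 load to a plain movq):

    ; RUN: llc -mtriple=x86_64-unknown-linux-gnu -x86-experimental-unordered-atomic-isel < %s | FileCheck %s
    define i64 @load_i64(i64* %p) {
    ; CHECK-LABEL: load_i64:
    ; CHECK: movq (%rdi), %rax
      %v = load atomic i64, i64* %p unordered, align 8
      ret i64 %v
    }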


(Some files were omitted because too many files changed in this diff.)