@@ -585,7 +585,7 @@ getOperationOrderings(MemSDNode *N, const NVPTXSubtarget *Subtarget) {
585585 // |------------------------------------------------------|-------------------------------|
586586 // | cuda::atomic_load | fence.sc.<scope>; |
587587 // | (memory_order_seq_cst, cuda::thread_scope_<scope>) | ld.acquire.<scope>; |
588- // |------------------------------------------------------|-------------------------------|
588+ // |------------------------------------------------------|-------------------------------|
589589 // | cuda::atomic_store | fence.sc.<scope>; |
590590 // | (memory_order_seq_cst, cuda::thread_scope_<scope>) | st.release.<scope>; |
591591 // |------------------------------------------------------|-------------------------------|
@@ -1868,7 +1868,7 @@ bool NVPTXDAGToDAGISel::tryStoreParam(SDNode *N) {
18681868 case 1 : {
18691869 MVT::SimpleValueType MemTy = Mem->getMemoryVT ().getSimpleVT ().SimpleTy ;
18701870 SDValue Imm = Ops[0 ];
1871- if (MemTy != MVT::f16 && MemTy != MVT::v2f16 &&
1871+ if (MemTy != MVT::f16 && MemTy != MVT::v2f16 && MemTy != MVT:: bf16 &&
18721872 (isa<ConstantSDNode>(Imm) || isa<ConstantFPSDNode>(Imm))) {
18731873 // Convert immediate to target constant
18741874 if (MemTy == MVT::f32 || MemTy == MVT::f64 ) {
@@ -2824,8 +2824,8 @@ void NVPTXDAGToDAGISel::SelectCpAsyncBulkPrefetchL2(SDNode *N) {
28242824 SDLoc DL (N);
28252825 SmallVector<SDValue, 4 > Ops (N->ops ().slice (2 , NumArgs));
28262826 Ops.push_back (N->getOperand (0 )); // Chain operand
2827-
2828- unsigned Opcode = IsCacheHint
2827+
2828+ unsigned Opcode = IsCacheHint
28292829 ? NVPTX::CP_ASYNC_BULK_PREFETCH_CH
28302830 : NVPTX::CP_ASYNC_BULK_PREFETCH;
28312831 ReplaceNode (N, CurDAG->getMachineNode (Opcode, DL, N->getVTList (), Ops));
0 commit comments