microsoft
diff --git a/cmake/onnxruntime_rocm_hipify.cmake b/cmake/onnxruntime_rocm_hipify.cmake
Lines changed: 1 addition & 0 deletions
diff --git a/onnxruntime/contrib_ops/cuda/bert/attention_impl.cu b/onnxruntime/contrib_ops/cuda/bert/attention_impl.cu
Lines changed: 1 addition & 1 deletion
@@ -9,6 +9,7 @@ set(contrib_ops_excluded_files
   "bert/attention.h"
   "bert/attention_impl.cu"
   "bert/attention_softmax.h"
+  "bert/attention_softmax.cu"
   "bert/decoder_masked_multihead_attention.h"
   "bert/decoder_masked_multihead_attention.cc"
   "bert/decoder_masked_self_attention.h"
 
@@ -44,7 +44,7 @@ limitations under the License.
 #include "contrib_ops/cuda/bert/cutlass_fmha/memory_efficient_attention.h"
 
 using namespace onnxruntime::cuda;
-using namespace cub;
+using namespace onnxruntime::contrib::attention_softmax_cuda;
 
 namespace onnxruntime {
 namespace contrib {