We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent af7009e commit b17216c
Copy full SHA for b17216c
csrc/gpu/aten/operators/xetla/kernels/include/subgroup/tile/impl/load_xe.hpp
@@ -398,9 +398,9 @@ tile_load(tile_t& tile, payload_t& payload) {
398
static constexpr gpu_arch arch_tag = payload_t::arch_tag;
399
400
using load_store_attr = load_store_attr_t<msg_type::block_1d, arch_tag>;
401
- static constexpr uint32_t max_load_vec_len = std::min(
402
- uint32_t(tile_t::block_elems * sizeof(dtype)),
403
- load_store_attr::max_load_vec_len);
+
+ static constexpr uint32_t max_load_vec_len =
+ load_store_attr::max_load_vec_len;
404
405
static constexpr uint32_t max_load_vec_elems =
406
max_load_vec_len / sizeof(dtype);
0 commit comments