@@ -672,7 +672,8 @@ def AMDGPU_PermlanePermAttr : EnumAttr<AMDGPU_Dialect, AMDGPU_PermlanePerm,
672672def AMDGPU_PermlaneOp : AMDGPU_Op<"permlane", [Pure, AllTypesMatch<["result", "src"]>]> {
673673 let summary = "AMDGPU permlane op";
674674 let description = [{
675- High-level wrapper on `rocdl.permlane.*` variants.
675+ High-level wrapper on `rocdl.permlane.*` variants for permutations
676+ on rows of lanes in a subgroup.
676677
677678 Supports arbitrary int/float/vector types, which will be repacked to i32 and
678679 one or more `rocdl.permlane.*` ops during lowering.
@@ -689,14 +690,13 @@ def AMDGPU_PermlaneOp : AMDGPU_Op<"permlane", [Pure, AllTypesMatch<["result", "s
689690 Operands:
690691 * `$src`: Vector register to permute across lanes of the subgroup.
691692 * `$kind`: The kind of permutation operation.
692- * `$fetch_inactive`: Optional. Used to dertermine behavior of invalid lanes (disabled thread or out-of-range).
693- `fetch_inactive = false`: If source lane is invalid, use `bound_ctrl` to determine the source value.
694- `fetch_inactive = true`: If the source lane is disabled, fetch the source value anyway
695- (ignoring `bound_ctrl`). If the source lane is out-of-range, behavior is decided by `bound_ctrl`.
693+ * `$fetch_inactive`: Optional. Used to determine behavior of a fetch from a disabled lane.
694+ `fetch_inactive = false`: If the source lane is disabled, use `bound_ctrl` to determine the source value.
695+ `fetch_inactive = true`: If the source lane is disabled, fetch the source value anyway (ignoring `bound_ctrl`).
696696 * `$bound_ctrl`: Optional. Used to determine what a thread should do if its source operand is from
697- a disabled thread or invalid input : use the value zero, or disable the write.
698- `bound_ctrl = false`: Do not write when source is invalid or out-of-range.
699- `bound_ctrl = true`: Use zero as input if source is invalid or out-of-range
697+ a disabled lane: use the value zero, or disable the write.
698+ `bound_ctrl = false`: Do not write when source is from a disabled lane.
699+ `bound_ctrl = true`: Use zero as input if source is from a disabled lane.
700700
701701 Note: Lowering is only supported on gfx950 and up.
702702 }];
0 commit comments