|
| 1 | +/*========================== begin_copyright_notice ============================ |
| 2 | +
|
| 3 | +Copyright (C) 2022-2024 Intel Corporation |
| 4 | +
|
| 5 | +SPDX-License-Identifier: MIT |
| 6 | +
|
| 7 | +============================= end_copyright_notice ===========================*/ |
| 8 | + |
| 9 | +#include "common/LLVMWarningsPush.hpp" |
| 10 | +#include <llvm/IR/PatternMatch.h> |
| 11 | +#include <llvm/Pass.h> |
| 12 | +#include <llvm/Support/Debug.h> |
| 13 | +#include <llvm/Support/raw_ostream.h> |
| 14 | +#include "common/LLVMWarningsPop.hpp" |
| 15 | +#include "GenISAIntrinsics/GenIntrinsics.h" |
| 16 | +#include "Compiler/CISACodeGen/ShaderCodeGen.hpp" |
| 17 | +#include "Compiler/MetaDataUtilsWrapper.h" |
| 18 | +#include "Compiler/CISACodeGen/CSWalkOrder.hpp" |
| 19 | +#include "Probe/Assertion.h" |
| 20 | + |
| 21 | +using namespace llvm; |
| 22 | +using namespace IGC; |
| 23 | + |
| 24 | + |
| 25 | +void IGC::overrideWalkOrderKeysInPass( |
| 26 | + bool is_pow2_x, bool is_pow2_y, bool is_pow2_z, |
| 27 | + SComputeShaderWalkOrder& walkOrderStruct, |
| 28 | + CodeGenContext* ctx) |
| 29 | +{ |
| 30 | + ThreadIDLayout& threadIDLayout = walkOrderStruct.m_threadIDLayout; |
| 31 | + CS_WALK_ORDER& walkOrder = walkOrderStruct.m_walkOrder; |
| 32 | + bool& enableHWGenerateLID = walkOrderStruct.m_enableHWGenerateLID; |
| 33 | + |
| 34 | + ModuleMetaData* MMD = ctx->getModuleMetaData(); |
| 35 | + const CPlatform& platform = ctx->platform; |
| 36 | + const CDriverInfo& driverInfo = ctx->m_DriverInfo; |
| 37 | + |
| 38 | + if ((IGC_IS_FLAG_ENABLED(ForceTileY) || MMD->csInfo.forceTileYWalk) && |
| 39 | + platform.supportHWGenerateTID() && driverInfo.SupportHWGenerateTID()) |
| 40 | + { |
| 41 | + threadIDLayout = ThreadIDLayout::TileY; |
| 42 | + walkOrder = CS_WALK_ORDER::WO_YXZ; |
| 43 | + enableHWGenerateLID = enableHWGenerateLIDInPass(walkOrder, is_pow2_x, is_pow2_y, is_pow2_z); |
| 44 | + } |
| 45 | + |
| 46 | + if (MMD->csInfo.walkOrderEnabled) |
| 47 | + { |
| 48 | + walkOrder = (CS_WALK_ORDER)MMD->csInfo.walkOrderOverride; |
| 49 | + enableHWGenerateLID = enableHWGenerateLIDInPass(walkOrder, is_pow2_x, is_pow2_y, is_pow2_z); |
| 50 | + } |
| 51 | + |
| 52 | + if (IGC_IS_FLAG_ENABLED(OverrideCsWalkOrderEnable)) |
| 53 | + { |
| 54 | + walkOrder = (CS_WALK_ORDER)IGC_GET_FLAG_VALUE(OverrideCsWalkOrder); |
| 55 | + enableHWGenerateLID = enableHWGenerateLIDInPass(walkOrder, is_pow2_x, is_pow2_y, is_pow2_z); |
| 56 | + } |
| 57 | + |
| 58 | + if (IGC_IS_FLAG_ENABLED(OverrideCsTileLayoutEnable)) |
| 59 | + { |
| 60 | + threadIDLayout = (ThreadIDLayout)IGC_IS_FLAG_ENABLED(OverrideCsTileLayout); |
| 61 | + } |
| 62 | +} |
| 63 | + |
| 64 | +bool IGC::enableHWGenerateLIDInPass( |
| 65 | + CS_WALK_ORDER walk_order, |
| 66 | + bool is_pow2_x, bool is_pow2_y, bool is_pow2_z) |
| 67 | +{ |
| 68 | + bool bEnableHWGenerateLID = false; |
| 69 | + |
| 70 | + switch (walk_order) |
| 71 | + { |
| 72 | + case CS_WALK_ORDER::WO_XYZ: |
| 73 | + case CS_WALK_ORDER::WO_YXZ: |
| 74 | + bEnableHWGenerateLID = (is_pow2_x && is_pow2_y); |
| 75 | + break; |
| 76 | + |
| 77 | + case CS_WALK_ORDER::WO_XZY: |
| 78 | + case CS_WALK_ORDER::WO_ZXY: |
| 79 | + bEnableHWGenerateLID = (is_pow2_x && is_pow2_z); |
| 80 | + break; |
| 81 | + |
| 82 | + case CS_WALK_ORDER::WO_YZX: |
| 83 | + case CS_WALK_ORDER::WO_ZYX: |
| 84 | + bEnableHWGenerateLID = (is_pow2_y && is_pow2_z); |
| 85 | + break; |
| 86 | + } |
| 87 | + return bEnableHWGenerateLID; |
| 88 | +} |
| 89 | + |
| 90 | +Optional<CS_WALK_ORDER> |
| 91 | +IGC::selectBestWalkOrderInPass( |
| 92 | + ThreadIDLayout Layout, |
| 93 | + bool is_pow2_x, bool is_pow2_y, bool is_pow2_z) |
| 94 | +{ |
| 95 | + constexpr uint UNDEF = std::numeric_limits<uint>::max(); |
| 96 | + uint order0 = UNDEF; |
| 97 | + uint order1 = UNDEF; |
| 98 | + if (Layout == ThreadIDLayout::TileY) |
| 99 | + { |
| 100 | + IGC_ASSERT(is_pow2_y); |
| 101 | + order0 = 1; |
| 102 | + order1 = (is_pow2_x ? 0 : (is_pow2_z ? 2 : UNDEF)); |
| 103 | + } |
| 104 | + else |
| 105 | + { |
| 106 | + //below is from HAS p-code except tileY |
| 107 | + //try to find walk_order so that HW can generate LID |
| 108 | + if (is_pow2_x) |
| 109 | + { |
| 110 | + // (pow2,pow2,z) or (pow2,y,pow2) or illegal |
| 111 | + order0 = 0; |
| 112 | + order1 = (is_pow2_y ? 1 : (is_pow2_z ? 2 : UNDEF)); |
| 113 | + } |
| 114 | + else if (is_pow2_y) |
| 115 | + { |
| 116 | + // (x,pow2,pow2) or illegal |
| 117 | + order0 = 1; |
| 118 | + order1 = (is_pow2_z ? 2 : UNDEF); |
| 119 | + } |
| 120 | + } |
| 121 | + |
| 122 | + if (order1 != UNDEF) |
| 123 | + { |
| 124 | + // select walkorder |
| 125 | + return getWalkOrderInPass(order0, order1); |
| 126 | + } |
| 127 | + |
| 128 | + return None; |
| 129 | +} |
| 130 | + |
| 131 | +void IGC::setEmitLocalMaskInPass(SGVUsage channelNum, EMIT_LOCAL_MASK& emitMask) |
| 132 | +{ |
| 133 | + //only 4 patterns are supported: None; X; XY; XYZ |
| 134 | + switch (channelNum) |
| 135 | + { |
| 136 | + case THREAD_ID_IN_GROUP_X: |
| 137 | + emitMask = (EMIT_LOCAL_MASK::EM_NONE == emitMask) ? EMIT_LOCAL_MASK::EM_X : emitMask; |
| 138 | + break; |
| 139 | + case THREAD_ID_IN_GROUP_Y: |
| 140 | + emitMask = (EMIT_LOCAL_MASK::EM_NONE == emitMask || EMIT_LOCAL_MASK::EM_X == emitMask) ? |
| 141 | + EMIT_LOCAL_MASK::EM_XY : emitMask; |
| 142 | + break; |
| 143 | + case THREAD_ID_IN_GROUP_Z: |
| 144 | + emitMask = EMIT_LOCAL_MASK::EM_XYZ; |
| 145 | + break; |
| 146 | + default: |
| 147 | + break; |
| 148 | + } |
| 149 | +} |
| 150 | + |
| 151 | +//order0: the internal walk dim |
| 152 | +//order1: the intermediate walk dim |
| 153 | +//e.g.: 1, 0 means, YXZ walkorder |
| 154 | +CS_WALK_ORDER IGC::getWalkOrderInPass(uint order0, uint order1) |
| 155 | +{ |
| 156 | + auto getWalkOrderValue = [](uint order0, uint order1) constexpr { |
| 157 | + return (order0 << 4 | order1 << 2); |
| 158 | + }; |
| 159 | + |
| 160 | + switch (getWalkOrderValue(order0, order1)) |
| 161 | + { |
| 162 | + case getWalkOrderValue(0, 1): return CS_WALK_ORDER::WO_XYZ; //012 |
| 163 | + case getWalkOrderValue(0, 2): return CS_WALK_ORDER::WO_XZY; //021 |
| 164 | + case getWalkOrderValue(1, 0): return CS_WALK_ORDER::WO_YXZ; //102 |
| 165 | + case getWalkOrderValue(1, 2): return CS_WALK_ORDER::WO_YZX; //120 |
| 166 | + case getWalkOrderValue(2, 0): return CS_WALK_ORDER::WO_ZXY; //201 |
| 167 | + case getWalkOrderValue(2, 1): return CS_WALK_ORDER::WO_ZYX; //210 |
| 168 | + default: |
| 169 | + IGC_ASSERT_MESSAGE(0, "unhandled case!"); |
| 170 | + return CS_WALK_ORDER::WO_XYZ; |
| 171 | + } |
| 172 | +} |
0 commit comments