intel
diff --git a/IGC/Compiler/CISACodeGen/EmitVISAPass.cpp b/IGC/Compiler/CISACodeGen/EmitVISAPass.cpp
Lines changed: 39 additions & 85 deletions
@@ -737,8 +737,9 @@ bool EmitPass::runOnFunction(llvm::Function &F) {
         m_encoder->SetIsCodePatchCandidate(false);
       }
 
-      if (m_pCtx->platform.supportDualSimd8PS() && m_pCtx->platform.isCoreChildOf(IGFX_XE2_HPG_CORE) &&
-          m_currShader->GetShaderType() == ShaderType::PIXEL_SHADER) {
+      if (m_pCtx->platform.supportDualSimd8PS() &&
+          m_pCtx->platform.isCoreChildOf(IGFX_XE2_HPG_CORE) &&
+          m_currShader->GetShaderType() == ShaderType::PIXEL_SHADER ) {
         m_encoder->SetIsCodePatchCandidate(false);
       }
     } else {
@@ -3991,8 +3992,7 @@ void EmitPass::emitVideoAnalyticGRF(llvm::GenIntrinsicInst *inst, const DWORD re
 
 static bool isVectorTypeAllowed(Value *I) {
   IGCLLVM::FixedVectorType *VecType = llvm::dyn_cast<IGCLLVM::FixedVectorType>(I->getType());
-  if (!VecType)
-    return false;
+  if (!VecType) return false;
   auto ElType = VecType->getElementType();
   return ElType->isIntegerTy(32) || ElType->isFloatTy();
 }
@@ -4038,10 +4038,8 @@ void EmitPass::BinaryUnary(llvm::Instruction *inst, const SSource source[2], con
     break;
   case Instruction::FAdd:
   case Instruction::Add:
-    if (inst->getType()->isVectorTy())
-      Add(source, modifier);
-    else
-      EmitSimpleAlu(inst, source, modifier);
+    if (inst->getType()->isVectorTy()) Add(source, modifier);
+    else EmitSimpleAlu(inst, source, modifier);
     break;
   case Instruction::Call:
     EmitAluIntrinsic(cast<CallInst>(inst), source, modifier);
@@ -4240,6 +4238,7 @@ static unsigned getVectorSize(Value *I) {
   return NumElements;
 }
 
+
 void EmitPass::FPTrunc(const SSource sources[2], const DstModifier &modifier) {
 
   CVariable *src[2];
@@ -4345,18 +4344,13 @@ bool EmitPass::isVectorEmissionPossible(const SSource sources[2], CVariable *src
   // any non ordinary state of source modifiers
   // can be a sign of emission of a specific pattern,
   // emission can interfere with
-  if (sources[0].elementOffset != 0)
-    return false;
-  if (sources[1].elementOffset != 0)
-    return false;
-  if (sources[0].SIMDOffset != 0)
-    return false;
-  if (sources[1].SIMDOffset != 0)
-    return false;
+  if (sources[0].elementOffset != 0) return false;
+  if (sources[1].elementOffset != 0) return false;
+  if (sources[0].SIMDOffset != 0) return false;
+  if (sources[1].SIMDOffset != 0) return false;
 
   bool AllowedVectorTypes = isVectorTypeAllowed(sources[0].value) && isVectorTypeAllowed(sources[1].value);
-  if (!AllowedVectorTypes)
-    return false;
+  if (!AllowedVectorTypes) return false;
 
   bool DestSizeEquals = false;
   // it's possible have a case where two uniform vectors are
@@ -4731,8 +4725,7 @@ void EmitPass::VectorMad(const SSource sources[3], const DstModifier &modifier)
 void EmitPass::FDiv(const SSource sources[2], const DstModifier &modifier) {
 
   CVariable *src[2];
-  for (int i = 0; i < 2; ++i)
-    src[i] = GetSrcVariable(sources[i]);
+  for (int i = 0; i < 2; ++i) src[i] = GetSrcVariable(sources[i]);
   bool IsPossible = isVectorEmissionPossible(sources, src);
 
   if (IGC_IS_FLAG_ENABLED(EnableVectorEmitter) && IsPossible) {
@@ -5697,7 +5690,8 @@ void EmitPass::emitSimdShuffle(llvm::Instruction *inst) {
         CVariable *tempCopy = m_currShader->GetNewVariable(simdChannel, "SanitizedIndexShuffleTmp");
         m_encoder->And(tempCopy, simdChannel, m_currShader->ImmToVariable(maskOfValidLanes, ISA_TYPE_UW));
         simdChannelUW = m_currShader->BitCast(tempCopy, ISA_TYPE_UW);
-      } else {
+      }
+      else {
         m_encoder->SetSrcRegion(0, 2, 1, 0);
         m_encoder->SetDstRegion(2);
         m_encoder->And(simdChannelUW, simdChannelUW, m_currShader->ImmToVariable(maskOfValidLanes, ISA_TYPE_UW));
@@ -8746,13 +8740,12 @@ void EmitPass::EmitGenIntrinsicMessage(llvm::GenIntrinsicInst *inst) {
     break;
   case GenISAIntrinsic::GenISA_ldrawvector_indexed:
   case GenISAIntrinsic::GenISA_ldraw_indexed:
-    emitLoadRawIndexed(cast<LdRawIntrinsic>(inst), cast<LdRawIntrinsic>(inst)->getOffsetValue(), nullptr, nullptr,
-                       false /*flipVarOffsetSign*/);
+    emitLoadRawIndexed(cast<LdRawIntrinsic>(inst), cast<LdRawIntrinsic>(inst)->getOffsetValue(), nullptr, nullptr);
     break;
   case GenISAIntrinsic::GenISA_storerawvector_indexed:
   case GenISAIntrinsic::GenISA_storeraw_indexed:
     emitStoreRawIndexed(cast<StoreRawIntrinsic>(inst), cast<StoreRawIntrinsic>(inst)->getOffsetValue(), nullptr,
-                        nullptr, false /*flipVarOffsetSign*/);
+                        nullptr);
     break;
   case GenISAIntrinsic::GenISA_GetBufferPtr:
     emitGetBufferPtr(inst);
@@ -9218,7 +9211,6 @@ void EmitPass::EmitIntrinsicMessage(llvm::IntrinsicInst *inst) {
   case Intrinsic::fabs:
   case Intrinsic::trap:
   case Intrinsic::experimental_noalias_scope_decl:
-  case Intrinsic::assume:
     // do nothing
     break;
   case Intrinsic::stacksave:
@@ -10440,8 +10432,8 @@ void EmitPass::setRovCacheCtrl(GenIntrinsicInst *inst) {
   inst->setMetadata("lsc.cache.ctrl", node);
 }
 
-void EmitPass::emitLoadRawIndexed(LdRawIntrinsic *inst, Value *varOffset, ConstantInt *immScale, ConstantInt *immOffset,
-                                  bool flipVarOffsetSign) {
+void EmitPass::emitLoadRawIndexed(LdRawIntrinsic *inst, Value *varOffset, ConstantInt *immScale,
+                                  ConstantInt *immOffset) {
   Value *bufPtrv = inst->getResourceValue();
 
   LSC_DOC_ADDR_SPACE addrSpace = m_pCtx->getUserAddrSpaceMD().Get(inst);
@@ -10452,7 +10444,7 @@ void EmitPass::emitLoadRawIndexed(LdRawIntrinsic *inst, Value *varOffset, Consta
     }
     LSC_CACHE_OPTS cacheOpts = translateLSCCacheControlsFromMetadata(inst, true);
     emitLSCVectorLoad(inst, bufPtrv,
-                      varOffset, immOffset, immScale, flipVarOffsetSign, cacheOpts, addrSpace
+                      varOffset, immOffset, immScale, cacheOpts, addrSpace
     );
     return;
   }
@@ -10711,8 +10703,7 @@ void EmitPass::emitLoad3DInner(LdRawIntrinsic *inst, ResourceDescriptor &resourc
   }
 }
 
-void EmitPass::emitLoad(LoadInst *inst, Value *offset, ConstantInt *immOffset, ConstantInt *immScale,
-                        bool flipVarOffsetSign
+void EmitPass::emitLoad(LoadInst *inst, Value *offset, ConstantInt *immOffset, ConstantInt *immScale
 ) {
   if (m_pCtx->getModuleMetaData()->isHDCFastClearShader) {
     emitFastClear(inst);
@@ -10724,13 +10715,13 @@ void EmitPass::emitLoad(LoadInst *inst, Value *offset, ConstantInt *immOffset, C
     LSC_DOC_ADDR_SPACE addrSpace = m_pCtx->getUserAddrSpaceMD().Get(inst);
 
     emitLSCVectorLoad(inst, inst->getPointerOperand(),
-                      offset, immOffset, immScale, flipVarOffsetSign, cacheOpts, addrSpace
+                      offset, immOffset, immScale, cacheOpts, addrSpace
     );
     return;
   }
   IGC_ASSERT_MESSAGE(immScale ? immScale->getSExtValue() == 1 : true, "Immediate Scale not supported on non-LSC path!");
 
-  emitVectorLoad(inst, offset, immOffset, flipVarOffsetSign);
+  emitVectorLoad(inst, offset, immOffset);
 }
 
 void EmitPass::emitPredicatedLoad(Instruction *inst) {
@@ -10745,7 +10736,7 @@ void EmitPass::emitPredicatedLoad(Instruction *inst) {
   LSC_DOC_ADDR_SPACE addrSpace = m_pCtx->getUserAddrSpaceMD().Get(inst);
 
   emitLSCVectorLoad(inst, offset,
-                    offset, nullptr, nullptr, false, cacheOpts, addrSpace
+                    offset, nullptr, nullptr, cacheOpts, addrSpace
   );
 }
 
@@ -11782,7 +11773,7 @@ void EmitPass::emitSymbolRelocation(Function &F) {
 }
 
 void EmitPass::emitStoreRawIndexed(StoreRawIntrinsic *inst, Value *varOffset, ConstantInt *immScale,
-                                   ConstantInt *immOffset, bool flipVarOffsetSign) {
+                                   ConstantInt *immOffset) {
   Value *pBufPtr = inst->getResourceValue();
   Value *pValToStore = inst->getStoreValue();
 
@@ -11793,8 +11784,8 @@ void EmitPass::emitStoreRawIndexed(StoreRawIntrinsic *inst, Value *varOffset, Co
 
     LSC_CACHE_OPTS cacheOpts = translateLSCCacheControlsFromMetadata(inst, false);
     emitLSCVectorStore(pBufPtr,
-                       varOffset, immOffset, immScale, flipVarOffsetSign, pValToStore, inst->getParent(), cacheOpts,
-                       inst->getAlignment(), false, addrSpace
+                       varOffset, immOffset, immScale, pValToStore, inst->getParent(), cacheOpts, inst->getAlignment(),
+                       false, addrSpace
     );
     return;
   }
@@ -11919,21 +11910,20 @@ void EmitPass::emitStore3DInner(Value *pllValToStore, Value *pllDstPtr, Value *p
   }
 }
 
-void EmitPass::emitStore(StoreInst *inst, Value *varOffset, ConstantInt *immOffset, ConstantInt *immScale,
-                         bool flipVarOffsetSign
+void EmitPass::emitStore(StoreInst *inst, Value *varOffset, ConstantInt *immOffset, ConstantInt *immScale
 ) {
   if (shouldGenerateLSC(inst)) {
     LSC_DOC_ADDR_SPACE addrSpace = m_pCtx->getUserAddrSpaceMD().Get(inst);
 
     LSC_CACHE_OPTS cacheOpts = translateLSCCacheControlsFromMetadata(inst, false);
     emitLSCVectorStore(inst->getPointerOperand(),
-                       varOffset, immOffset, immScale, flipVarOffsetSign, inst->getValueOperand(), inst->getParent(),
-                       cacheOpts, IGCLLVM::getAlignmentValue(inst), inst->getMetadata("enable.vmask"), addrSpace
+                       varOffset, immOffset, immScale, inst->getValueOperand(), inst->getParent(), cacheOpts,
+                       IGCLLVM::getAlignmentValue(inst), inst->getMetadata("enable.vmask"), addrSpace
     );
     return;
   }
   IGC_ASSERT_MESSAGE(immScale ? immScale->getSExtValue() == 1 : true, "Immediate Scale not supported on non-LSC path!");
-  emitVectorStore(inst, varOffset, immOffset, flipVarOffsetSign);
+  emitVectorStore(inst, varOffset, immOffset);
 }
 
 void EmitPass::emitPredicatedStore(Instruction *inst) {
@@ -11946,8 +11936,7 @@ void EmitPass::emitPredicatedStore(Instruction *inst) {
   LSC_CACHE_OPTS cacheOpts = translateLSCCacheControlsFromMetadata(inst, false);
 
   emitLSCVectorStore(inst->getOperand(0),
-                     inst->getOperand(0), nullptr, nullptr, false /*flipVarOffsetSign*/, inst->getOperand(1),
-                     inst->getParent(), cacheOpts,
+                     inst->getOperand(0), nullptr, nullptr, inst->getOperand(1), inst->getParent(), cacheOpts,
                      cast<ConstantInt>(inst->getOperand(2))->getZExtValue(), // alignment
                      inst->getMetadata("enable.vmask"), addrSpace
                      ,
@@ -14640,7 +14629,7 @@ CVariable *EmitPass::UnpackOrBroadcastIfUniform(CVariable *pVar) {
 }
 
 void EmitPass::emitAtomicRaw(llvm::GenIntrinsicInst *pInst, Value *dstAddr, ConstantInt *immOffset,
-                             ConstantInt *immScale, bool flipVarOffsetSign
+                             ConstantInt *immScale
 ) {
   ForceDMask();
   // Currently, Dword Atomics can be called by matching 2 intrinsics. One is the
@@ -14714,13 +14703,6 @@ void EmitPass::emitAtomicRaw(llvm::GenIntrinsicInst *pInst, Value *dstAddr, Cons
 
   // Dst address in bytes.
   CVariable *pDstAddr = GetSymbol(dstAddr);
-  if (flipVarOffsetSign) {
-    CVariable *eNegBase = m_currShader->GetNewVariable(pDstAddr, CName(pDstAddr->getName(), "Neg"));
-    m_encoder->SetSrcModifier(0, EMOD_NEG);
-    m_encoder->Copy(eNegBase, pDstAddr); // MOV with -src modifier
-    m_encoder->Push();
-    pDstAddr = eNegBase;
-  }
 
 
   PointerType *PtrTy = dyn_cast<PointerType>(dstAddr->getType());
@@ -16642,7 +16624,7 @@ void EmitPass::emitFastClearSend(llvm::Instruction *pInst) {
   m_encoder->Push();
 }
 
-void EmitPass::emitVectorLoad(LoadInst *inst, Value *offset, ConstantInt *immOffset, bool flipVarOffsetSign) {
+void EmitPass::emitVectorLoad(LoadInst *inst, Value *offset, ConstantInt *immOffset) {
   int immOffsetInt = 0;
   if (immOffset)
     immOffsetInt = static_cast<int>(immOffset->getSExtValue());
@@ -16656,13 +16638,6 @@ void EmitPass::emitVectorLoad(LoadInst *inst, Value *offset, ConstantInt *immOff
   // eOffset is in bytes
   // offset corresponds to Int2Ptr operand obtained during pattern matching
   CVariable *eOffset = GetSymbol(immOffset ? offset : Ptr);
-  if (flipVarOffsetSign) {
-    CVariable *eNegOffset = m_currShader->GetNewVariable(eOffset, CName(eOffset->getName(), "Neg"));
-    m_encoder->SetSrcModifier(0, EMOD_NEG);
-    m_encoder->Copy(eNegOffset, eOffset); // MOV with -src modifier
-    m_encoder->Push();
-    eOffset = eNegOffset;
-  }
   if (useA32) {
     eOffset = TruncatePointer(eOffset);
   }
@@ -17101,7 +17076,7 @@ void EmitPass::emitVectorLoad(LoadInst *inst, Value *offset, ConstantInt *immOff
   }
 }
 
-void EmitPass::emitVectorStore(StoreInst *inst, Value *offset, ConstantInt *immOffset, bool flipVarOffsetSign) {
+void EmitPass::emitVectorStore(StoreInst *inst, Value *offset, ConstantInt *immOffset) {
   int immOffsetInt = 0;
   if (immOffset)
     immOffsetInt = static_cast<int>(immOffset->getSExtValue());
@@ -17118,13 +17093,6 @@ void EmitPass::emitVectorStore(StoreInst *inst, Value *offset, ConstantInt *immO
   // eOffset is in bytes
   // offset corresponds to Int2Ptr operand obtained during pattern matching
   CVariable *eOffset = GetSymbol(immOffset ? offset : Ptr);
-  if (flipVarOffsetSign) {
-    CVariable *eNegOffset = m_currShader->GetNewVariable(eOffset, CName(eOffset->getName(), "Neg"));
-    m_encoder->SetSrcModifier(0, EMOD_NEG);
-    m_encoder->Copy(eNegOffset, eOffset); // MOV with -src modifier
-    m_encoder->Push();
-    eOffset = eNegOffset;
-  }
   bool useA32 = !isA64Ptr(ptrType, m_currShader->GetContext());
   if (useA32) {
     eOffset = TruncatePointer(eOffset);
@@ -17799,7 +17767,7 @@ void EmitPass::emitLSCVectorLoad_uniform(LSC_CACHE_OPTS CacheOpts, bool UseA32,
 
 void EmitPass::emitLSCVectorLoad(Instruction *inst, Value *Ptr,
                                  Value *varOffset, ConstantInt *immOffset, ConstantInt *immScale,
-                                 bool flipVarOffsetSign, LSC_CACHE_OPTS cacheOpts, LSC_DOC_ADDR_SPACE addrSpace
+                                 LSC_CACHE_OPTS cacheOpts, LSC_DOC_ADDR_SPACE addrSpace
 ) {
 
   bool predicatedLoad = false;
@@ -17829,13 +17797,6 @@ void EmitPass::emitLSCVectorLoad(Instruction *inst, Value *Ptr,
   // eOffset is in bytes
   // offset corresponds to Int2Ptr operand obtained during pattern matching
   CVariable *eOffset = GetSymbol(varOffset);
-  if (flipVarOffsetSign) {
-    CVariable *eNegOffset = m_currShader->GetNewVariable(eOffset, CName(eOffset->getName(), "Neg"));
-    m_encoder->SetSrcModifier(0, EMOD_NEG);
-    m_encoder->Copy(eNegOffset, eOffset); // MOV with -src modifier
-    m_encoder->Push();
-    eOffset = eNegOffset;
-  }
   if (useA32) {
     eOffset = TruncatePointer(eOffset);
   }
@@ -18187,9 +18148,9 @@ void EmitPass::emitLSCVectorStore_uniform(LSC_CACHE_OPTS CacheOpts, bool UseA32,
 }
 
 void EmitPass::emitLSCVectorStore(Value *Ptr,
-                                  Value *varOffset, ConstantInt *immOffset, ConstantInt *immScale,
-                                  bool flipVarOffsetSign, Value *storedVal, BasicBlock *BB, LSC_CACHE_OPTS cacheOpts,
-                                  alignment_t align, bool dontForceDmask, LSC_DOC_ADDR_SPACE addrSpace
+                                  Value *varOffset, ConstantInt *immOffset, ConstantInt *immScale, Value *storedVal,
+                                  BasicBlock *BB, LSC_CACHE_OPTS cacheOpts, alignment_t align, bool dontForceDmask,
+                                  LSC_DOC_ADDR_SPACE addrSpace
                                   ,
                                   Value *predicate) {
 
@@ -18210,13 +18171,6 @@ void EmitPass::emitLSCVectorStore(Value *Ptr,
 
   // offset corresponds to Int2Ptr operand obtained during pattern matching
   CVariable *eOffset = GetSymbol(varOffset);
-  if (flipVarOffsetSign) {
-    CVariable *eNegOffset = m_currShader->GetNewVariable(eOffset, CName(eOffset->getName(), "Neg"));
-    m_encoder->SetSrcModifier(0, EMOD_NEG);
-    m_encoder->Copy(eNegOffset, eOffset); // MOV with -src modifier
-    m_encoder->Push();
-    eOffset = eNegOffset;
-  }
   bool useA32 = !isA64Ptr(ptrType, m_currShader->GetContext());
   LSC_ADDR_SIZE addrSize = useA32 ? LSC_ADDR_SIZE_32b : LSC_ADDR_SIZE_64b;
   if (useA32) {