Skip to content

Commit cd15c82

Browse files
Do not prefer the copy engine for local-to-local transfers.
Execution Units are faster.
Signed-off-by: Michal Mrozek <[email protected]>
1 parent 8f93f4f commit cd15c82

File tree

3 files changed

+10
-14
lines changed

3 files changed

+10
-14
lines changed

opencl/source/helpers/cl_hw_helper_pvc_and_later.inl

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (C) 2021 Intel Corporation
2+
* Copyright (C) 2021-2022 Intel Corporation
33
*
44
* SPDX-License-Identifier: MIT
55
*
@@ -9,7 +9,7 @@
99

1010
template <>
1111
inline bool ClHwHelperHw<Family>::preferBlitterForLocalToLocalTransfers() const {
12-
return true;
12+
return false;
1313
}
1414

1515
template <>

opencl/test/unit_test/command_queue/command_queue_tests_pvc_and_later.cpp

Lines changed: 6 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -285,8 +285,7 @@ HWTEST2_F(BcsCsrSelectionCommandQueueTests, givenBcsSelectedWithForceBcsEngineIn
285285
dstGraphicsAllocation.memoryPool = MemoryPool::LocalMemory;
286286
CsrSelectionArgs args{CL_COMMAND_COPY_BUFFER, &srcMemObj, &dstMemObj, 0u, nullptr};
287287
CommandStreamReceiver &selectedCsr = queue->selectCsrForBuiltinOperation(args);
288-
EXPECT_EQ(queue->getBcsCommandStreamReceiver(linkBcsType), &selectedCsr);
289-
EXPECT_EQ(linkBcsType, selectedCsr.getOsContext().getEngineType());
288+
EXPECT_EQ(&queue->getGpgpuCommandStreamReceiver(), &selectedCsr);
290289
}
291290
}
292291

@@ -383,12 +382,11 @@ HWTEST2_F(BcsCsrSelectionCommandQueueTests, givenOneBcsEngineInQueueWhenSelectin
383382
dstGraphicsAllocation.memoryPool = MemoryPool::LocalMemory;
384383
CsrSelectionArgs args{CL_COMMAND_COPY_BUFFER, &srcMemObj, &dstMemObj, 0u, nullptr};
385384
CommandStreamReceiver &selectedCsr = queue->selectCsrForBuiltinOperation(args);
386-
EXPECT_EQ(queue->getBcsCommandStreamReceiver(linkBcsType), &selectedCsr);
387-
EXPECT_EQ(linkBcsType, selectedCsr.getOsContext().getEngineType());
385+
EXPECT_EQ(&queue->getGpgpuCommandStreamReceiver(), &selectedCsr);
388386
}
389387
}
390388

391-
HWTEST2_F(BcsCsrSelectionCommandQueueTests, givenMultipleEnginesInQueueWhenSelectingCsrForLocalToLocalOperationThenSelectProperBcsCsr, IsAtLeastXeHpcCore) {
389+
HWTEST2_F(BcsCsrSelectionCommandQueueTests, givenMultipleEnginesInQueueWhenSelectingCsrForLocalToLocalOperationThenSelectProperGpGpuCsr, IsAtLeastXeHpcCore) {
392390
DebugManagerStateRestore restore{};
393391
DebugManager.flags.EnableBlitterForEnqueueOperations.set(1);
394392

@@ -416,8 +414,7 @@ HWTEST2_F(BcsCsrSelectionCommandQueueTests, givenMultipleEnginesInQueueWhenSelec
416414
aub_stream::ENGINE_BCS8,
417415
});
418416
CommandStreamReceiver &selectedCsr = queue->selectCsrForBuiltinOperation(args);
419-
EXPECT_EQ(queue->getBcsCommandStreamReceiver(aub_stream::ENGINE_BCS), &selectedCsr);
420-
EXPECT_EQ(aub_stream::ENGINE_BCS, selectedCsr.getOsContext().getEngineType());
417+
EXPECT_EQ(&queue->getGpgpuCommandStreamReceiver(), &selectedCsr);
421418
}
422419
{
423420
auto queue = createQueueWithEngines({
@@ -427,8 +424,7 @@ HWTEST2_F(BcsCsrSelectionCommandQueueTests, givenMultipleEnginesInQueueWhenSelec
427424
aub_stream::ENGINE_BCS8,
428425
});
429426
CommandStreamReceiver &selectedCsr = queue->selectCsrForBuiltinOperation(args);
430-
EXPECT_EQ(queue->getBcsCommandStreamReceiver(aub_stream::ENGINE_BCS5), &selectedCsr);
431-
EXPECT_EQ(aub_stream::ENGINE_BCS5, selectedCsr.getOsContext().getEngineType());
427+
EXPECT_EQ(&queue->getGpgpuCommandStreamReceiver(), &selectedCsr);
432428
}
433429
}
434430

@@ -503,4 +499,4 @@ HWTEST2_F(OoqCommandQueueHwBlitTest, givenBarrierBeforeFirstKernelWhenEnqueueNDR
503499
const auto memFenceItor = find<MI_MEM_FENCE *>(memFenceStateItor, ccsHwParser.cmdList.end());
504500
EXPECT_NE(ccsHwParser.cmdList.end(), memFenceItor);
505501
EXPECT_NE(ccsHwParser.cmdList.end(), memFenceStateItor);
506-
}
502+
}

opencl/test/unit_test/xe_hpc_core/hw_helper_tests_xe_hpc_core.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -919,8 +919,8 @@ XE_HPC_CORETEST_F(HwHelperTestsXeHpcCore, WhenCheckingSipWAThenFalseIsReturned)
919919
EXPECT_FALSE(HwHelper::get(renderCoreFamily).isSipWANeeded(*defaultHwInfo));
920920
}
921921

922-
XE_HPC_CORETEST_F(HwHelperTestsXeHpcCore, WhenCheckingPreferenceForBlitterForLocalToLocalTransfersThenReturnTrue) {
923-
EXPECT_TRUE(ClHwHelper::get(renderCoreFamily).preferBlitterForLocalToLocalTransfers());
922+
XE_HPC_CORETEST_F(HwHelperTestsXeHpcCore, WhenCheckingPreferenceForBlitterForLocalToLocalTransfersThenReturnFalse) {
923+
EXPECT_FALSE(ClHwHelper::get(renderCoreFamily).preferBlitterForLocalToLocalTransfers());
924924
}
925925

926926
XE_HPC_CORETEST_F(HwHelperTestsXeHpcCore, givenBdA0WhenBcsSubDeviceSupportIsCheckedThenReturnFalse) {

0 commit comments

Comments
 (0)