Skip to content

Commit 2508396

Browse files
Add requiredWorkgroupOrder parameter to setGpgpuWalkerThreadData.
Change-Id: I931f27ad3a21d3d151b19ac9226e245134295b98
Signed-off-by: Mrozek, Michal <[email protected]>
1 parent 711ba14 commit 2508396

File tree

4 files changed: 7 additions and 5 deletions.

runtime/command_queue/gpgpu_walker.h

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -130,7 +130,8 @@ class GpgpuWalkerHelper {
130130
uint32_t workDim,
131131
bool localIdsGenerationByRuntime,
132132
bool inlineDataProgrammingRequired,
133-
const iOpenCL::SPatchThreadPayload &threadPayload);
133+
const iOpenCL::SPatchThreadPayload &threadPayload,
134+
uint32_t requiredWorkgroupOrder);
134135

135136
static void dispatchProfilingCommandsStart(
136137
TagNode<HwTimeStamps> &hwTimeStamps,

runtime/command_queue/gpgpu_walker_bdw_plus.inl

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,8 @@ inline size_t GpgpuWalkerHelper<GfxFamily>::setGpgpuWalkerThreadData(
2121
uint32_t workDim,
2222
bool localIdsGenerationByRuntime,
2323
bool inlineDataProgrammingRequired,
24-
const iOpenCL::SPatchThreadPayload &threadPayload) {
24+
const iOpenCL::SPatchThreadPayload &threadPayload,
25+
uint32_t requiredWorkgroupOrder) {
2526
auto localWorkSize = localWorkSizesIn[0] * localWorkSizesIn[1] * localWorkSizesIn[2];
2627

2728
auto threadsPerWorkGroup = getThreadsPerWG(simd, localWorkSize);
@@ -146,7 +147,7 @@ void GpgpuWalkerHelper<GfxFamily>::dispatchScheduler(
146147
size_t workGroups[3] = {(scheduler.getGws() / scheduler.getLws()), 1, 1};
147148
GpgpuWalkerHelper<GfxFamily>::setGpgpuWalkerThreadData(pGpGpuWalkerCmd, globalOffsets, globalOffsets, workGroups, localWorkSizes,
148149
simd, 1, true, inlineDataProgrammingRequired,
149-
*scheduler.getKernelInfo().patchInfo.threadPayload);
150+
*scheduler.getKernelInfo().patchInfo.threadPayload, 0u);
150151

151152
// Implement disabling special WA DisableLSQCROPERFforOCL if needed
152153
GpgpuWalkerHelper<GfxFamily>::applyWADisableLSQCROPERFforOCL(&commandStream, scheduler, false);

runtime/command_queue/hardware_interface_bdw_plus.inl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -134,7 +134,7 @@ inline void HardwareInterface<GfxFamily>::programWalker(
134134
GpgpuWalkerHelper<GfxFamily>::setGpgpuWalkerThreadData(walkerCmd, globalOffsets, startWorkGroups,
135135
numWorkGroups, localWorkSizes, simd, dim,
136136
false, false,
137-
*kernel.getKernelInfo().patchInfo.threadPayload);
137+
*kernel.getKernelInfo().patchInfo.threadPayload, 0u);
138138
}
139139

140140
} // namespace NEO

unit_tests/command_queue/work_group_size_tests.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -88,7 +88,7 @@ struct WorkGroupSizeBase {
8888
(workItems[2] + workGroupSize[2] - 1) / workGroupSize[2]};
8989
const iOpenCL::SPatchThreadPayload threadPayload = {};
9090
GpgpuWalkerHelper<FamilyType>::setGpgpuWalkerThreadData(&pCmd, globalOffsets, workGroupsStart, workGroupsNum,
91-
workGroupSize, simdSize, dims, true, false, threadPayload);
91+
workGroupSize, simdSize, dims, true, false, threadPayload, 0u);
9292

9393
//And check if it is programmed correctly
9494
auto numWorkItems = computeWalkerWorkItems<FamilyType>(pCmd);

0 commit comments

Comments
 (0)