mirror of
https://github.com/intel/compute-runtime.git
synced 2025-09-15 13:01:45 +08:00
Add multi thread test for enqueue NDRange and WriteBuffer with queue per thread
Signed-off-by: Cencelewska, Katarzyna <katarzyna.cencelewska@intel.com>
This commit is contained in:

committed by
Compute-Runtime-Automation

parent
260a324a6f
commit
5bdf758049
@ -75,7 +75,7 @@ struct MockCommandQueueHw : public CommandQueueHw<GfxFamily> {
|
||||
using CommandQueue::bcsInitialized;
|
||||
};
|
||||
|
||||
HWTEST_F(EnqueueKernelTest, givenTwoThreadsAndBscEnabledWhenEnqueueWriteBufferAndEnqueueNDRangeKernelInLoopThenIsNoRace) {
|
||||
HWTEST_F(EnqueueKernelTest, givenTwoThreadsAndBcsEnabledWhenEnqueueWriteBufferAndEnqueueNDRangeKernelInLoopThenIsNoRace) {
|
||||
DebugManagerStateRestore debugRestorer;
|
||||
DebugManager.flags.ForceCsrLockInBcsEnqueueOnlyForGpgpuSubmission.set(1);
|
||||
HardwareInfo hwInfo = *defaultHwInfo.get();
|
||||
@ -196,7 +196,7 @@ HWTEST_F(EnqueueKernelTest, givenTwoThreadsAndBscEnabledWhenEnqueueWriteBufferAn
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
}
|
||||
|
||||
HWTEST_F(EnqueueKernelTest, givenBscEnabledWhenThread1EnqueueWriteBufferAndThread2EnqueueNDRangeKernelInLoopThenIsNoRace) {
|
||||
HWTEST_F(EnqueueKernelTest, givenBcsEnabledWhenThread1EnqueueWriteBufferAndThread2EnqueueNDRangeKernelInLoopThenIsNoRace) {
|
||||
DebugManagerStateRestore debugRestorer;
|
||||
DebugManager.flags.ForceCsrLockInBcsEnqueueOnlyForGpgpuSubmission.set(1);
|
||||
HardwareInfo hwInfo = *defaultHwInfo.get();
|
||||
@ -320,3 +320,121 @@ HWTEST_F(EnqueueKernelTest, givenBscEnabledWhenThread1EnqueueWriteBufferAndThrea
|
||||
retVal = clReleaseContext(context);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
}
|
||||
|
||||
HWTEST_F(EnqueueKernelTest, givenBcsEnabledAndQueuePerThreadWhenEnqueueWriteBufferAndEnqueueNDRangeKernelInLoopThenIsNoRace) {
|
||||
DebugManagerStateRestore debugRestorer;
|
||||
DebugManager.flags.ForceCsrLockInBcsEnqueueOnlyForGpgpuSubmission.set(1);
|
||||
DebugManager.flags.EnableCmdQRoundRobindEngineAssign.set(0);
|
||||
HardwareInfo hwInfo = *defaultHwInfo.get();
|
||||
hwInfo.capabilityTable.blitterOperationsSupported = true;
|
||||
REQUIRE_FULL_BLITTER_OR_SKIP(&hwInfo);
|
||||
|
||||
std::atomic<bool> startEnqueueProcess(false);
|
||||
|
||||
auto iterationCount = 40;
|
||||
const auto threadCount = 10;
|
||||
|
||||
constexpr size_t n = 256;
|
||||
unsigned int data[n] = {};
|
||||
constexpr size_t bufferSize = n * sizeof(unsigned int);
|
||||
|
||||
size_t gws[3] = {1, 0, 0};
|
||||
size_t gwsSize[3] = {n, 1, 1};
|
||||
size_t lws[3] = {1, 1, 1};
|
||||
cl_uint workDim = 1;
|
||||
|
||||
KernelBinaryHelper kbHelper("CopyBuffer_simd16", false);
|
||||
std::string testFile;
|
||||
testFile.append(clFiles);
|
||||
testFile.append("CopyBuffer_simd16.cl");
|
||||
size_t sourceSize = 0;
|
||||
auto pSource = loadDataFromFile(testFile.c_str(), sourceSize);
|
||||
EXPECT_NE(0u, sourceSize);
|
||||
EXPECT_NE(nullptr, pSource);
|
||||
|
||||
MockClDevice mockClDevice{MockDevice::createWithExecutionEnvironment<MockDevice>(&hwInfo, pDevice->executionEnvironment, 0)};
|
||||
|
||||
const cl_device_id deviceId = &mockClDevice;
|
||||
auto context = clCreateContext(nullptr, 1, &deviceId, nullptr, nullptr, &retVal);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
EXPECT_NE(nullptr, context);
|
||||
|
||||
const char *sources[1] = {pSource.get()};
|
||||
auto program = clCreateProgramWithSource(
|
||||
context,
|
||||
1,
|
||||
sources,
|
||||
&sourceSize,
|
||||
&retVal);
|
||||
ASSERT_NE(nullptr, program);
|
||||
|
||||
retVal = clBuildProgram(
|
||||
program,
|
||||
1,
|
||||
&deviceId,
|
||||
nullptr,
|
||||
nullptr,
|
||||
nullptr);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
auto kernel = clCreateKernel(program, "CopyBuffer", &retVal);
|
||||
ASSERT_NE(nullptr, kernel);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
cl_mem_flags flags = CL_MEM_READ_WRITE;
|
||||
auto buffer0 = clCreateBuffer(context, flags, bufferSize, nullptr, &retVal);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
auto buffer1 = clCreateBuffer(context, flags, bufferSize, nullptr, &retVal);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
retVal = clSetKernelArg(kernel, 0, sizeof(cl_mem), &buffer0);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
retVal = clSetKernelArg(kernel, 1, sizeof(cl_mem), &buffer1);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
auto function = [&]() {
|
||||
while (!startEnqueueProcess)
|
||||
;
|
||||
|
||||
auto queue = clCreateCommandQueue(context, deviceId, 0, &retVal);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
EXPECT_NE(nullptr, queue);
|
||||
for (int i = 0; i < iterationCount; i++) {
|
||||
|
||||
retVal = clEnqueueWriteBuffer(queue, buffer0, false, 0, bufferSize, data, 0, nullptr, nullptr);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
retVal = clEnqueueNDRangeKernel(queue, kernel, workDim, gws, gwsSize, lws, 0, nullptr, nullptr);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
}
|
||||
retVal = clFinish(queue);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
retVal = clReleaseCommandQueue(queue);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
};
|
||||
|
||||
std::vector<std::thread> threads;
|
||||
for (auto thread = 0; thread < threadCount; thread++) {
|
||||
threads.push_back(std::thread(function));
|
||||
}
|
||||
|
||||
startEnqueueProcess = true;
|
||||
|
||||
for (auto &thread : threads) {
|
||||
thread.join();
|
||||
}
|
||||
|
||||
retVal = clReleaseMemObject(buffer0);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
retVal = clReleaseMemObject(buffer1);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
retVal = clReleaseKernel(kernel);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
retVal = clReleaseProgram(program);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
|
||||
retVal = clReleaseContext(context);
|
||||
EXPECT_EQ(CL_SUCCESS, retVal);
|
||||
}
|
Reference in New Issue
Block a user