mirror of
https://github.com/intel/compute-runtime.git
synced 2026-01-11 08:07:19 +08:00
Adding zello_fence blackbox testcase
Signed-off-by: vinod krishna <vinod.krishna@intel.com>
This commit is contained in:
committed by
Compute-Runtime-Automation
parent
4191dfdb43
commit
22f40d9a8e
@@ -19,6 +19,7 @@ if("${CMAKE_BUILD_TYPE}" STREQUAL "Debug")
|
||||
zello_world_usm
|
||||
zello_world_global_work_offset
|
||||
zello_scratch
|
||||
zello_fence
|
||||
)
|
||||
|
||||
include_directories(common)
|
||||
@@ -53,6 +54,7 @@ if("${CMAKE_BUILD_TYPE}" STREQUAL "Debug")
|
||||
|
||||
target_link_libraries(zello_world_jitc_ocloc PUBLIC ocloc_lib)
|
||||
target_link_libraries(zello_scratch PUBLIC ocloc_lib)
|
||||
target_link_libraries(zello_fence PUBLIC ocloc_lib)
|
||||
if(UNIX)
|
||||
target_link_libraries(zello_world_global_work_offset PUBLIC ocloc_lib)
|
||||
endif()
|
||||
|
||||
210
level_zero/core/test/black_box_tests/zello_fence.cpp
Normal file
210
level_zero/core/test/black_box_tests/zello_fence.cpp
Normal file
@@ -0,0 +1,210 @@
|
||||
/*
|
||||
* Copyright (C) 2019-2021 Intel Corporation
|
||||
*
|
||||
* SPDX-License-Identifier: MIT
|
||||
*
|
||||
*/
|
||||
|
||||
#include <level_zero/ze_api.h>
|
||||
|
||||
#include "zello_common.h"
|
||||
#include "zello_compile.h"
|
||||
|
||||
#include <fstream>
|
||||
#include <iostream>
|
||||
#include <memory>
|
||||
|
||||
bool verbose = false;
|
||||
|
||||
const char *clProgram = R"==(
|
||||
__kernel void increment_by_one(__global uchar *dst, __global uchar *src) {
|
||||
unsigned int gid = get_global_id(0);
|
||||
dst[gid] = (uchar)(src[gid] + 1);
|
||||
}
|
||||
)==";
|
||||
|
||||
void createModule(ze_context_handle_t &context, ze_module_handle_t &module, ze_device_handle_t &device) {
|
||||
// Prepare spirV
|
||||
std::string buildLog;
|
||||
auto spirV = compileToSpirV(clProgram, "", buildLog);
|
||||
if (buildLog.size() > 0) {
|
||||
std::cout << "Build log " << buildLog;
|
||||
}
|
||||
SUCCESS_OR_TERMINATE((0 == spirV.size()));
|
||||
|
||||
ze_module_desc_t moduleDesc = {};
|
||||
ze_module_build_log_handle_t buildlog;
|
||||
moduleDesc.format = ZE_MODULE_FORMAT_IL_SPIRV;
|
||||
moduleDesc.pInputModule = spirV.data();
|
||||
moduleDesc.inputSize = spirV.size();
|
||||
moduleDesc.pBuildFlags = "";
|
||||
if (zeModuleCreate(context, device, &moduleDesc, &module, &buildlog) != ZE_RESULT_SUCCESS) {
|
||||
size_t szLog = 0;
|
||||
zeModuleBuildLogGetString(buildlog, &szLog, nullptr);
|
||||
|
||||
char *strLog = (char *)malloc(szLog);
|
||||
zeModuleBuildLogGetString(buildlog, &szLog, strLog);
|
||||
std::cout << "Build log:" << strLog << std::endl;
|
||||
|
||||
free(strLog);
|
||||
}
|
||||
SUCCESS_OR_TERMINATE(zeModuleBuildLogDestroy(buildlog));
|
||||
}
|
||||
|
||||
void createKernel(ze_module_handle_t &module, ze_kernel_handle_t &kernel,
|
||||
uint32_t numThreads, uint32_t sizex, uint32_t sizey,
|
||||
uint32_t sizez) {
|
||||
|
||||
ze_kernel_desc_t kernelDesc = {};
|
||||
kernelDesc.pKernelName = "increment_by_one";
|
||||
SUCCESS_OR_TERMINATE(zeKernelCreate(module, &kernelDesc, &kernel));
|
||||
ze_kernel_properties_t kernProps;
|
||||
SUCCESS_OR_TERMINATE(zeKernelGetProperties(kernel, &kernProps));
|
||||
std::cout << "Kernel : \n"
|
||||
<< " * name : " << kernelDesc.pKernelName << "\n"
|
||||
<< " * uuid.mid : " << kernProps.uuid.mid << "\n"
|
||||
<< " * uuid.kid : " << kernProps.uuid.kid << "\n"
|
||||
<< " * maxSubgroupSize : " << kernProps.maxSubgroupSize << "\n"
|
||||
<< " * localMemSize : " << kernProps.localMemSize << "\n"
|
||||
<< " * spillMemSize : " << kernProps.spillMemSize << "\n"
|
||||
<< " * privateMemSize : " << kernProps.privateMemSize << "\n"
|
||||
<< " * maxNumSubgroups : " << kernProps.maxNumSubgroups << "\n"
|
||||
<< " * numKernelArgs : " << kernProps.numKernelArgs << "\n"
|
||||
<< " * requiredSubgroupSize : " << kernProps.requiredSubgroupSize << "\n"
|
||||
<< " * requiredNumSubGroups : " << kernProps.requiredNumSubGroups << "\n"
|
||||
<< " * requiredGroupSizeX : " << kernProps.requiredGroupSizeX << "\n"
|
||||
<< " * requiredGroupSizeY : " << kernProps.requiredGroupSizeY << "\n"
|
||||
<< " * requiredGroupSizeZ : " << kernProps.requiredGroupSizeZ << "\n";
|
||||
|
||||
uint32_t groupSizeX = sizex;
|
||||
uint32_t groupSizeY = sizey;
|
||||
uint32_t groupSizeZ = sizey;
|
||||
SUCCESS_OR_TERMINATE(zeKernelSuggestGroupSize(kernel, numThreads, 1U, 1U, &groupSizeX, &groupSizeY, &groupSizeZ));
|
||||
SUCCESS_OR_TERMINATE_BOOL(numThreads % groupSizeX == 0);
|
||||
if (verbose) {
|
||||
std::cout << "Group size : (" << groupSizeX << ", " << groupSizeY << ", " << groupSizeZ
|
||||
<< ")" << std::endl;
|
||||
}
|
||||
SUCCESS_OR_TERMINATE(zeKernelSetGroupSize(kernel, groupSizeX, groupSizeY, groupSizeZ));
|
||||
}
|
||||
|
||||
bool testFence(ze_context_handle_t &context, ze_device_handle_t &device) {
|
||||
constexpr size_t allocSize = 4096;
|
||||
constexpr size_t bytesPerThread = sizeof(char);
|
||||
constexpr size_t numThreads = allocSize / bytesPerThread;
|
||||
ze_module_handle_t module;
|
||||
ze_kernel_handle_t kernel;
|
||||
ze_command_queue_handle_t cmdQueue;
|
||||
ze_command_list_handle_t cmdList;
|
||||
|
||||
void *srcBuffer;
|
||||
void *dstBuffer;
|
||||
uint32_t groupSizeX = 32u;
|
||||
uint32_t groupSizeY = 1u;
|
||||
uint32_t groupSizeZ = 1u;
|
||||
|
||||
// Create commandQueue and cmdList
|
||||
ze_command_queue_desc_t cmdQueueDesc = {};
|
||||
cmdQueueDesc.ordinal = getCommandQueueOrdinal(device);
|
||||
cmdQueueDesc.index = 0;
|
||||
cmdQueueDesc.mode = ZE_COMMAND_QUEUE_MODE_ASYNCHRONOUS;
|
||||
SUCCESS_OR_TERMINATE(zeCommandQueueCreate(context, device, &cmdQueueDesc, &cmdQueue));
|
||||
SUCCESS_OR_TERMINATE(createCommandList(context, device, cmdList));
|
||||
|
||||
// Create module and kernel
|
||||
createModule(context, module, device);
|
||||
createKernel(module, kernel, numThreads, groupSizeX, groupSizeY,
|
||||
groupSizeZ);
|
||||
|
||||
// Alloc buffers
|
||||
srcBuffer = nullptr;
|
||||
dstBuffer = nullptr;
|
||||
ze_device_mem_alloc_desc_t deviceDesc = {};
|
||||
deviceDesc.stype = ZE_STRUCTURE_TYPE_DEVICE_MEM_ALLOC_DESC;
|
||||
deviceDesc.ordinal = 0;
|
||||
deviceDesc.flags = 0;
|
||||
deviceDesc.pNext = nullptr;
|
||||
SUCCESS_OR_TERMINATE(zeMemAllocDevice(context, &deviceDesc, allocSize, 1, device, &srcBuffer));
|
||||
SUCCESS_OR_TERMINATE(zeMemAllocDevice(context, &deviceDesc, allocSize, 1, device, &dstBuffer));
|
||||
|
||||
// Init data and copy to device
|
||||
uint8_t initDataSrc[allocSize];
|
||||
memset(initDataSrc, 7, sizeof(initDataSrc));
|
||||
uint8_t initDataDst[allocSize];
|
||||
memset(initDataDst, 3, sizeof(initDataDst));
|
||||
SUCCESS_OR_TERMINATE(zeCommandListAppendMemoryCopy(
|
||||
cmdList, srcBuffer, initDataSrc, sizeof(initDataSrc), nullptr, 0, nullptr));
|
||||
SUCCESS_OR_TERMINATE(zeCommandListAppendMemoryCopy(
|
||||
cmdList, dstBuffer, initDataDst, sizeof(initDataDst), nullptr, 0, nullptr));
|
||||
|
||||
// copying of data must finish before running the user kernel
|
||||
SUCCESS_OR_TERMINATE(zeCommandListAppendBarrier(cmdList, nullptr, 0, nullptr));
|
||||
|
||||
// Set kernel args and get ready to dispatch
|
||||
SUCCESS_OR_TERMINATE(zeKernelSetArgumentValue(kernel, 0, sizeof(dstBuffer), &dstBuffer));
|
||||
SUCCESS_OR_TERMINATE(zeKernelSetArgumentValue(kernel, 1, sizeof(srcBuffer), &srcBuffer));
|
||||
ze_group_count_t dispatchTraits;
|
||||
dispatchTraits.groupCountX = numThreads / groupSizeX;
|
||||
dispatchTraits.groupCountY = 1u;
|
||||
dispatchTraits.groupCountZ = 1u;
|
||||
if (verbose) {
|
||||
std::cerr << "Number of groups : (" << dispatchTraits.groupCountX << ", "
|
||||
<< dispatchTraits.groupCountY << ", " << dispatchTraits.groupCountZ << ")"
|
||||
<< std::endl;
|
||||
}
|
||||
|
||||
SUCCESS_OR_TERMINATE_BOOL(dispatchTraits.groupCountX * groupSizeX == allocSize);
|
||||
SUCCESS_OR_TERMINATE(zeCommandListAppendLaunchKernel(
|
||||
cmdList, kernel, &dispatchTraits, nullptr, 0, nullptr));
|
||||
|
||||
// Create Fence
|
||||
ze_fence_handle_t fence;
|
||||
ze_fence_desc_t fenceDesc = {};
|
||||
fenceDesc.stype = ZE_STRUCTURE_TYPE_FENCE_DESC;
|
||||
fenceDesc.pNext = nullptr;
|
||||
fenceDesc.flags = 0;
|
||||
SUCCESS_OR_TERMINATE(zeFenceCreate(cmdQueue, &fenceDesc, &fence));
|
||||
|
||||
// Execute CommandList
|
||||
SUCCESS_OR_TERMINATE(zeCommandListClose(cmdList));
|
||||
SUCCESS_OR_TERMINATE(zeCommandQueueExecuteCommandLists(cmdQueue, 1, &cmdList, fence));
|
||||
|
||||
// Wait for fence to be signaled
|
||||
SUCCESS_OR_TERMINATE(zeFenceHostSynchronize(fence, std::numeric_limits<uint32_t>::max()));
|
||||
if (verbose)
|
||||
std::cout << "zeFenceHostSynchronize success" << std::endl;
|
||||
|
||||
//Tear down
|
||||
SUCCESS_OR_TERMINATE(zeFenceReset(fence));
|
||||
SUCCESS_OR_TERMINATE(zeCommandListReset(cmdList));
|
||||
SUCCESS_OR_TERMINATE(zeMemFree(context, dstBuffer));
|
||||
SUCCESS_OR_TERMINATE(zeMemFree(context, srcBuffer));
|
||||
SUCCESS_OR_TERMINATE(zeFenceDestroy(fence));
|
||||
SUCCESS_OR_TERMINATE(zeCommandListDestroy(cmdList));
|
||||
SUCCESS_OR_TERMINATE(zeCommandQueueDestroy(cmdQueue));
|
||||
SUCCESS_OR_TERMINATE(zeKernelDestroy(kernel));
|
||||
SUCCESS_OR_TERMINATE(zeModuleDestroy(module));
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
int main(int argc, char *argv[]) {
|
||||
bool outputValidationSuccessful;
|
||||
verbose = isVerbose(argc, argv);
|
||||
|
||||
ze_context_handle_t context = nullptr;
|
||||
ze_driver_handle_t driverHandle = nullptr;
|
||||
auto device = zelloInitContextAndGetDevices(context, driverHandle);
|
||||
|
||||
ze_device_properties_t deviceProperties = {};
|
||||
SUCCESS_OR_TERMINATE(zeDeviceGetProperties(device, &deviceProperties));
|
||||
std::cout << "Device : \n"
|
||||
<< " * name : " << deviceProperties.name << "\n"
|
||||
<< " * vendorId : " << std::hex << deviceProperties.vendorId << "\n";
|
||||
|
||||
outputValidationSuccessful = testFence(context, device);
|
||||
|
||||
SUCCESS_OR_TERMINATE(zeContextDestroy(context));
|
||||
std::cout << "\nZello Fence Results validation " << (outputValidationSuccessful ? "PASSED" : "FAILED") << "\n";
|
||||
return 0;
|
||||
}
|
||||
Reference in New Issue
Block a user