compute-runtime/runtime/event/event.h

/*
* Copyright (c) 2017, Intel Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included
* in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE.
*/
#pragma once
#include "runtime/api/cl_types.h"
#include "runtime/helpers/base_object.h"
#include <cstdint>
#include <atomic>
#include <vector>
#include "runtime/helpers/task_information.h"
#include "runtime/utilities/idlist.h"
#include "runtime/utilities/iflist.h"
#include "runtime/event/hw_timestamps.h"
#include "runtime/os_interface/os_time.h"
#include "runtime/os_interface/performance_counters.h"
#include "runtime/helpers/completion_stamp.h"
#include "runtime/helpers/flush_stamp.h"
#include "runtime/utilities/arrayref.h"
#define OCLRT_NUM_TIMESTAMP_BITS (32)
namespace OCLRT {
template <typename TagType>
struct TagNode;
class CommandQueue;
class Context;
class Device;
template <>
struct OpenCLObjectMapper<_cl_event> {
typedef class Event DerivedType;
};
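// maps the _cl_event API handle type to the Event class so that the BaseObject
// helpers (see runtime/helpers/base_object.h) can resolve cl_event handles to Event objects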
class Event : public BaseObject<_cl_event>, public IDNode<Event> {
public:
enum class ECallbackTarget : uint32_t {
Queued = 0,
Submitted,
Running,
Completed,
MAX,
Invalid
};
struct Callback : public IFNode<Callback> {
typedef void(CL_CALLBACK *ClbFuncT)(cl_event, cl_int, void *);
Callback(cl_event event, ClbFuncT clb, cl_int type, void *data)
: event(event), callbackFunction(clb), callbackExecutionStatusTarget(type), userData(data) {
}
void execute() {
callbackFunction(event, callbackExecutionStatusTarget, userData);
}
int32_t getCallbackExecutionStatusTarget() const {
return callbackExecutionStatusTarget;
}
// From the OCL spec:
// "If the callback is called as the result of the command associated with
// event being abnormally terminated, an appropriate error code for the error that caused
// the termination will be passed to event_command_exec_status instead."
// This function allows that value to be overridden.
void overrideCallbackExecutionStatusTarget(int32_t newCallbackExecutionStatusTarget) {
DEBUG_BREAK_IF(newCallbackExecutionStatusTarget >= 0);
callbackExecutionStatusTarget = newCallbackExecutionStatusTarget;
}
private:
cl_event event;
ClbFuncT callbackFunction;
int32_t callbackExecutionStatusTarget; // minimum event execution status that will trigger this callback
void *userData;
};
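// Illustrative sketch of how a callback flows through this struct ("notifyWhenComplete"
// and "userPtr" are hypothetical names, not part of this header):
//   void CL_CALLBACK notifyWhenComplete(cl_event ev, cl_int execStatus, void *userData) { /* ... */ }
//   event->addCallback(notifyWhenComplete, CL_COMPLETE, userPtr);
// executeCallbacks() later walks the matching list in callbacks[] and invokes
// Callback::execute() on each registered node.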
static const cl_ulong objectMagic = 0x80134213A43C981ALL;
static const cl_uint eventNotReady;
Event(CommandQueue *cmdQueue, cl_command_type cmdType,
uint32_t taskLevel, uint32_t taskCount);
Event(const Event &) = delete;
Event &operator=(const Event &) = delete;
~Event() override;
uint32_t getCompletionStamp(void) const;
void updateCompletionStamp(uint32_t taskCount, uint32_t tasklevel, FlushStamp flushStamp);
cl_ulong getDelta(cl_ulong startTime,
cl_ulong endTime);
bool calcProfilingData();
void setCPUProfilingPath(bool isCPUPath) { profilingCpuPath = isCPUPath ? CL_TRUE : CL_FALSE; }
cl_bool isCPUProfilingPath() {
return profilingCpuPath;
}
cl_int getEventProfilingInfo(cl_profiling_info paramName,
size_t paramValueSize,
void *paramValue,
size_t *paramValueSizeRet);
cl_bool isProfilingEnabled() { return profilingEnabled; }
void setProfilingEnabled(cl_bool profilingEnabled) {
this->profilingEnabled = profilingEnabled;
}
HwTimeStamps *getHwTimeStamp();
GraphicsAllocation *getHwTimeStampAllocation();
bool isPerfCountersEnabled() {
return perfCountersEnabled;
}
void setPerfCountersEnabled(bool perfCountersEnabled) {
this->perfCountersEnabled = perfCountersEnabled;
}
void copyPerfCounters(InstrPmRegsCfg *config);
HwPerfCounter *getHwPerfCounter();
GraphicsAllocation *getHwPerfCounterAllocation();
std::unique_ptr<FlushStampTracker> flushStamp;
std::atomic<uint32_t> taskLevel;
void addChild(Event &e);
virtual bool setStatus(cl_int status);
static cl_int waitForEvents(cl_uint numEvents,
const cl_event *eventList);
std::unique_ptr<Command> setCommand(std::unique_ptr<Command> newCmd) {
std::unique_ptr<Command> prevCmd;
prevCmd.reset(cmdToSubmit.exchange(newCmd.release()));
eventWithoutCommand = false;
return prevCmd;
}
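// Illustrative use of the exchange above (sketch; "newCommand" is a hypothetical name):
//   std::unique_ptr<Command> previous = event->setCommand(std::move(newCommand));
//   // 'previous' (possibly empty) now owns whatever command was attached before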
Command *peekCommand() {
return cmdToSubmit;
}
IFNodeRef<Event> *peekChildEvents() {
return childEventsToNotify.peekHead();
}
bool peekHasChildEvents() {
return (peekChildEvents() != nullptr);
}
bool peekHasCallbacks(ECallbackTarget target) {
if (target >= ECallbackTarget::MAX) {
DEBUG_BREAK_IF(true);
return false;
}
return (callbacks[(uint32_t)target].peekHead() != nullptr);
}
bool peekHasCallbacks() {
for (uint32_t i = 0; i < (uint32_t)ECallbackTarget::MAX; ++i) {
if (peekHasCallbacks((ECallbackTarget)i)) {
return true;
}
}
return false;
}
// returns the number of events that are blocking this event
uint32_t peekNumEventsBlockingThis() const {
return parentCount;
}
// returns true if the event is completed (in terms of the definition provided by the OCL spec)
bool peekIsCompleted(const int32_t *executionStatusSnapshot = nullptr) {
// Note from the OCL spec:
// "A command is considered complete if its execution status
// is CL_COMPLETE or a negative value."
int32_t statusSnapshot = 0;
if (executionStatusSnapshot != nullptr) {
statusSnapshot = *executionStatusSnapshot;
} else {
statusSnapshot = updateEventAndReturnCurrentStatus();
}
return (statusSnapshot == CL_COMPLETE) || (statusSnapshot < 0);
}
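// Example of the rule above (CL_INVALID_VALUE and other error codes are negative):
//   int32_t done = CL_COMPLETE;      // peekIsCompleted(&done) -> true
//   int32_t err = CL_INVALID_VALUE;  // peekIsCompleted(&err)  -> true (abnormal termination)
//   int32_t run = CL_RUNNING;        // peekIsCompleted(&run)  -> false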
// Note from the OCL spec:
// "A negative integer value causes all enqueued commands that wait on this user event
// to be terminated."
bool peekIsCompletedByTermination(const int32_t *executionStatusSnapshot = nullptr) {
if (executionStatusSnapshot == nullptr) {
return (peekExecutionStatus() < 0);
} else {
return (*executionStatusSnapshot < 0);
}
}
bool peekIsSubmitted(const int32_t *executionStatusSnapshot = nullptr) {
if (executionStatusSnapshot == nullptr) {
return (peekExecutionStatus() == CL_SUBMITTED);
} else {
return (*executionStatusSnapshot == CL_SUBMITTED);
}
}
// commands blocked by user event dependencies
bool isReadyForSubmission();
// adds a callback (execution state change listener) to this event's list of callbacks
void addCallback(Callback::ClbFuncT fn, cl_int type, void *data);
// returns true on success
// if (blocking == false), returns false instead of blocking while waiting for completion
virtual bool wait(bool blocking);
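// Usage sketch (assumed semantics, per the comment above):
//   if (event->wait(false) == false) {
//       // not complete yet - the caller can poll again later or call wait(true) to block
//   }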
bool isUserEvent() const {
return (CL_COMMAND_USER == cmdType);
}
Context *getContext() {
return ctx;
}
CommandQueue *getCommandQueue() {
return cmdQueue;
}
cl_command_type getCommandType() {
return cmdType;
}
virtual uint32_t getTaskLevel();
cl_int peekExecutionStatus() {
return executionStatus;
}
cl_int updateEventAndReturnCurrentStatus() {
updateExecutionStatus();
return executionStatus;
}
bool peekIsBlocked() const {
return (peekNumEventsBlockingThis() > 0);
}
void unblockEventBy(Event &event, uint32_t taskLevel, int32_t transitionStatus);
void updateTaskCount(uint32_t taskCount) {
if (taskCount == Event::eventNotReady) {
DEBUG_BREAK_IF(true);
return;
}
uint32_t prevTaskCount = this->taskCount.exchange(taskCount);
if ((prevTaskCount != Event::eventNotReady) && (prevTaskCount > taskCount)) {
this->taskCount = prevTaskCount;
DEBUG_BREAK_IF(true);
}
}
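// Behavior sketch of the guard above: the stored task count never moves backwards, e.g.
//   event->updateTaskCount(5);
//   event->updateTaskCount(3); // rejected - the previous value (5) is restored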
bool isCurrentCmdQVirtualEvent() {
return currentCmdQVirtualEvent;
}
void setCurrentCmdQVirtualEvent(bool isCurrentVirtualEvent) {
currentCmdQVirtualEvent = isCurrentVirtualEvent;
}
virtual void updateExecutionStatus();
void tryFlushEvent();
uint32_t peekTaskCount() const {
return this->taskCount;
}
void setQueueTimeStamp(TimeStampData *queueTimeStamp) {
this->queueTimeStamp = *queueTimeStamp;
};
void setSubmitTimeStamp(TimeStampData *submitTimeStamp) {
this->submitTimeStamp = *submitTimeStamp;
};
void setQueueTimeStamp();
void setSubmitTimeStamp();
void setStartTimeStamp();
void setEndTimeStamp();
void setCmdType(uint32_t cmdType) {
this->cmdType = cmdType;
}
std::vector<Event *> &getParentEvents() { return this->parentEvents; }
protected:
Event(Context *ctx, CommandQueue *cmdQueue, cl_command_type cmdType,
uint32_t taskLevel, uint32_t taskCount);
ECallbackTarget translateToCallbackTarget(cl_int execStatus) {
switch (execStatus) {
default: {
DEBUG_BREAK_IF(true);
return ECallbackTarget::Invalid;
}
case CL_QUEUED:
return ECallbackTarget::Queued;
case CL_SUBMITTED:
return ECallbackTarget::Submitted;
case CL_RUNNING:
return ECallbackTarget::Running;
case CL_COMPLETE:
return ECallbackTarget::Completed;
}
}
// executes all callbacks associated with this event
void executeCallbacks(int32_t executionStatus);
// transitions event to new execution state
// guarantees that newStatus <= oldStatus
void transitionExecutionStatus(int32_t newExecutionStatus) const {
int32_t prevStatus = executionStatus;
DBG_LOG(EventsDebugEnable, "transitionExecutionStatus event", this, " new status", newExecutionStatus, "previousStatus", prevStatus);
while (prevStatus > newExecutionStatus) {
executionStatus.compare_exchange_weak(prevStatus, newExecutionStatus);
}
}
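// Example of the monotonic rule enforced above (the OpenCL status values satisfy
// CL_QUEUED > CL_SUBMITTED > CL_RUNNING > CL_COMPLETE > negative error codes):
//   transitionExecutionStatus(CL_RUNNING); // e.g. CL_SUBMITTED -> CL_RUNNING : applied
//   transitionExecutionStatus(CL_QUEUED);  // CL_RUNNING -> CL_QUEUED : ignored, would move backwards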
// list storing events that need to be notified when this event is ready to go
IFRefList<Event, true, true> childEventsToNotify;
void unblockEventsBlockedByThis(int32_t transitionStatus);
void submitCommand(bool abortBlockedTasks);
bool currentCmdQVirtualEvent;
std::atomic<Command *> cmdToSubmit;
std::atomic<Command *> submittedCmd;
bool eventWithoutCommand = true;
Context *ctx;
CommandQueue *cmdQueue;
cl_command_type cmdType;
// callbacks to be executed when this event changes its execution state
IFList<Callback, true, true> callbacks[(uint32_t)ECallbackTarget::MAX];
// can be modified only via transitionExecutionStatus
// this is to ensure state consistency even when doing lock-free multithreading
// e.g. CL_COMPLETE -> CL_SUBMITTED or CL_SUBMITTED -> CL_QUEUED becomes forbidden
mutable std::atomic<int32_t> executionStatus;
// Timestamps
cl_bool profilingEnabled;
cl_bool profilingCpuPath;
bool dataCalculated;
TimeStampData queueTimeStamp;
TimeStampData submitTimeStamp;
uint64_t startTimeStamp;
uint64_t endTimeStamp;
uint64_t completeTimeStamp;
TagNode<HwTimeStamps> *timeStampNode;
bool perfCountersEnabled;
TagNode<HwPerfCounter> *perfCounterNode;
InstrPmRegsCfg *perfConfigurationData;
//number of events this event depends on
std::atomic<int> parentCount;
//event parents
std::vector<Event *> parentEvents;
private:
// can be modified only via updateTaskCount
std::atomic<uint32_t> taskCount;
};
} // namespace OCLRT