86 lignes
3.3 KiB
C
86 lignes
3.3 KiB
C
/*************************************************************************
|
|
* Copyright (c) 2024, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* See LICENSE.txt for license information
|
|
************************************************************************/
|
|
|
|
#ifndef PROFILER_H_
|
|
#define PROFILER_H_
|
|
|
|
#include <stdint.h>
|
|
#include <stdlib.h>
|
|
|
|
#include "common.h"
|
|
|
|
enum {
|
|
ncclProfileGroup = (1 << 0), // group event type
|
|
ncclProfileColl = (1 << 1), // host collective call event type
|
|
ncclProfileP2p = (1 << 2), // host point-to-point call event type
|
|
ncclProfileProxyOp = (1 << 3), // proxy operation event type
|
|
ncclProfileProxyStep = (1 << 4), // proxy step event type
|
|
ncclProfileProxyCtrl = (1 << 5), // proxy control event type
|
|
ncclProfileKernelCh = (1 << 6), // kernel channel event type
|
|
ncclProfileNetPlugin = (1 << 7), // network plugin-defined, events
|
|
ncclProfileGroupApi = (1 << 8), // Group API events
|
|
ncclProfileCollApi = (1 << 9), // Collective API events
|
|
ncclProfileP2pApi = (1 << 10), // Point-to-Point API events
|
|
ncclProfileKernelLaunch = (1 << 11), // Kernel launch events
|
|
};
|
|
|
|
typedef enum {
|
|
ncclProfilerProxyOpSendPosted = 0, // deprecated in v4
|
|
ncclProfilerProxyOpSendRemFifoWait = 1, // deprecated in v4
|
|
ncclProfilerProxyOpSendTransmitted = 2, // deprecated in v4
|
|
ncclProfilerProxyOpSendDone = 3, // deprecated in v4
|
|
ncclProfilerProxyOpRecvPosted = 4, // deprecated in v4
|
|
ncclProfilerProxyOpRecvReceived = 5, // deprecated in v4
|
|
ncclProfilerProxyOpRecvTransmitted = 6, // deprecated in v4
|
|
ncclProfilerProxyOpRecvDone = 7, // deprecated in v4
|
|
ncclProfilerProxyOpInProgress_v4 = 19,
|
|
|
|
/* Legacy proxy profiler states */
|
|
ncclProfilerProxyStepSendGPUWait = 8,
|
|
ncclProfilerProxyStepSendPeerWait_v4 = 20,
|
|
ncclProfilerProxyStepSendWait = 9,
|
|
ncclProfilerProxyStepRecvWait = 10,
|
|
ncclProfilerProxyStepRecvFlushWait = 11,
|
|
ncclProfilerProxyStepRecvGPUWait = 12,
|
|
|
|
/* Legacy proxy control states */
|
|
ncclProfilerProxyCtrlIdle = 13,
|
|
ncclProfilerProxyCtrlActive = 14,
|
|
ncclProfilerProxyCtrlSleep = 15,
|
|
ncclProfilerProxyCtrlWakeup = 16,
|
|
ncclProfilerProxyCtrlAppend = 17,
|
|
ncclProfilerProxyCtrlAppendEnd = 18,
|
|
|
|
/* Network defined events states */
|
|
ncclProfilerNetPluginUpdate = 21,
|
|
|
|
/* Kernel event states */
|
|
ncclProfilerKernelChStop = 22,
|
|
|
|
/* Group API States */
|
|
ncclProfilerEndGroupApiStart = 23,
|
|
ncclProfilerBeginGroupApiEnd = 24
|
|
} ncclProfilerEventState_t;
|
|
|
|
typedef ncclProfilerEventState_t ncclProfilerEventState_v1_t;
|
|
typedef ncclProfilerEventState_t ncclProfilerEventState_v2_t;
|
|
typedef ncclProfilerEventState_t ncclProfilerEventState_v3_t;
|
|
typedef ncclProfilerEventState_t ncclProfilerEventState_v4_t;
|
|
typedef ncclProfilerEventState_t ncclProfilerEventState_v5_t;
|
|
|
|
#include "profiler_v5.h"
|
|
#include "profiler_v4.h"
|
|
#include "profiler_v3.h"
|
|
#include "profiler_v2.h"
|
|
#include "profiler_v1.h"
|
|
#include "profiler_net.h"
|
|
|
|
typedef ncclProfiler_v5_t ncclProfiler_t;
|
|
typedef ncclProfilerEventDescr_v5_t ncclProfilerEventDescr_t;
|
|
typedef ncclProfilerEventStateArgs_v5_t ncclProfilerEventStateArgs_t;
|
|
|
|
#endif // end include guard
|