docs/hdk/gpu__profiler__common_8h_source.html

 #pragma once


 #include "core/common/profiler_common.h"
 #include "core/common/inlined_containers.h"

 #include <cstring>
 #include <map>
 #include <memory>
 #include <mutex>
 #include <sstream>
 #include <string>
 #include <utility>
 #include <vector>


 namespace onnxruntime {

 namespace profiling {


 // The classes in this header are implemented as template/inline classes

 // to avoid having to export symbols from the main onnxruntime shared library

 // to ExecutionProvider (EP) shared libraries.

 // More context: The main onnxruntime shared library is optimized for size

 // using --gc-sections during link time to ensure that any unreferenced code

 // is not retained. This poses a problem in using a design pattern where the

 // (abstract) base class is implemented in the main onnxruntime shared library,

 // but (concrete) subclasses are implemented in EP shared libraries. Now, because

 // EP shared libraries are loaded at runtime (as of 11/2022), there will be no

 // references to the base class symbols when the main onnxruntime shared library

 // is compiled. Thus, the base class symbols will not be included in the

 // main onnxruntime shared library. This manifests in being unable to load

 // EP shared libs (because the base class symbols referenced by derived

 // classes are missing).

 // We solve this by implementing base classes that are common to all GPU profilers

 // inline in this header.


 // Owning byte buffer that holds raw activity records.
 //
 // The bytes live in a heap array owned through a std::unique_ptr, so copies
 // are deep copies and moves transfer the allocation, leaving the source empty
 // (null data, size 0).
 class ProfilerActivityBuffer {
  public:
   // Creates an empty buffer: GetData() == nullptr, GetSize() == 0.
   ProfilerActivityBuffer() noexcept
       : data_(nullptr), size_(0) {}

   // Allocates `size` bytes and fills them with a copy of data[0, size).
   // NOTE: this constructor is noexcept although it allocates, so an
   // allocation failure terminates the process instead of throwing.
   ProfilerActivityBuffer(const char* data, size_t size) noexcept
       : data_(std::make_unique<char[]>(size)), size_(size) {
     // Skip the copy for zero-length buffers: `data` is null when copying a
     // default-constructed buffer, and handing memcpy a null pointer is
     // undefined behavior even when the length is 0.
     if (size_ != 0) {
       std::memcpy(data_.get(), data, size_);
     }
   }

   // Deep copy.
   ProfilerActivityBuffer(const ProfilerActivityBuffer& other) noexcept
       : ProfilerActivityBuffer(other.GetData(), other.GetSize()) {}

   // Takes over other's allocation; `other` is left empty.
   ProfilerActivityBuffer(ProfilerActivityBuffer&& other) noexcept
       : data_(std::move(other.data_)),
         size_(std::exchange(other.size_, size_t{0})) {}

   // Deep-copy assignment. The previous allocation of *this is released.
   ProfilerActivityBuffer& operator=(const ProfilerActivityBuffer& other) noexcept {
     if (&other != this) {
       // Build the copy first, then adopt it. Assigning to data_ frees the old
       // array (constructing a new object in place over *this would skip the
       // destructor and leak it).
       ProfilerActivityBuffer copy{other};
       data_ = std::move(copy.data_);
       size_ = copy.size_;
     }
     return *this;
   }

   // Move assignment. The previous allocation of *this is released and
   // `other` is left empty.
   ProfilerActivityBuffer& operator=(ProfilerActivityBuffer&& other) noexcept {
     if (&other != this) {
       data_ = std::move(other.data_);
       size_ = std::exchange(other.size_, size_t{0});
     }
     return *this;
   }

   // Wraps an already allocated array without copying it. `size` is recorded
   // as given; it is not checked against the real length of `buffer_ptr`.
   static ProfilerActivityBuffer CreateFromPreallocatedBuffer(std::unique_ptr<char[]>&& buffer_ptr, size_t size) {
     ProfilerActivityBuffer res{};
     res.data_ = std::move(buffer_ptr);
     res.size_ = size;
     return res;
   }

   // accessors
   char* GetData() { return data_.get(); }
   const char* GetData() const { return data_.get(); }
   size_t GetSize() const { return size_; }

  private:
   std::unique_ptr<char[]> data_;  // owned bytes, null for an empty buffer
   size_t size_;                   // number of bytes recorded for data_
 }; /* end class ProfilerActivityBuffer */


 template <typename TDerived>

 class GPUTracerManager {

  public:

   ORT_DISALLOW_COPY_ASSIGNMENT_AND_MOVE(GPUTracerManager);

   virtual ~GPUTracerManager() {}


   uint64_t RegisterClient() {

     std::lock_guard<std::mutex> lock(manager_instance_mutex_);

     auto res = next_client_id_++;

     per_client_events_by_ext_correlation_.insert({res, {}});

     ++num_active_clients_;

     return res;

   }


   void DeregisterClient(uint64_t client_handle) {

     std::lock_guard<std::mutex> lock(manager_instance_mutex_);

     auto it = per_client_events_by_ext_correlation_.find(client_handle);

     if (it == per_client_events_by_ext_correlation_.end()) {

       return;

     }

     per_client_events_by_ext_correlation_.erase(it);

     --num_active_clients_;

     if (num_active_clients_ == 0 && tracing_enabled_) {

       StopLogging();

     }

   }


   void StartLogging() {

     std::lock_guard<std::mutex> lock(manager_instance_mutex_);

     if (tracing_enabled_) {

       return;

     }


     auto this_as_derived = static_cast<TDerived*>(this);

     tracing_enabled_ = this_as_derived->OnStartLogging();

   }


   void Consume(uint64_t client_handle, const TimePoint& start_time, std::map<uint64_t, Events>& events) {

     auto this_as_derived = static_cast<TDerived*>(this);

     events.clear();

     {

       // Flush any pending activity records before starting

       // to process the accumulated activity records.

       std::lock_guard<std::mutex> lock_manager(manager_instance_mutex_);

       if (!tracing_enabled_) {

         return;

       }


       this_as_derived->FlushActivities();

     }


     std::vector<ProfilerActivityBuffer> activity_buffers;

     {

       std::lock_guard<std::mutex> lock(unprocessed_activity_buffers_mutex_);

       std::swap(unprocessed_activity_buffers_, activity_buffers);

       unprocessed_activity_buffers_.clear();

     }


     {

       // Ensure that at most one thread is working through the activity buffers at any time.

       std::lock_guard<std::mutex> lock_two(activity_buffer_processor_mutex_);

       this_as_derived->ProcessActivityBuffers(activity_buffers, start_time);

       auto it = per_client_events_by_ext_correlation_.find(client_handle);

       if (it == per_client_events_by_ext_correlation_.end()) {

         return;

       }

       std::swap(events, it->second);

     }

   }


   void PushCorrelation(uint64_t client_handle,

                        uint64_t external_correlation_id,

                        TimePoint profiling_start_time) {

     auto this_as_derived = static_cast<TDerived*>(this);

     std::lock_guard<std::mutex> lock(manager_instance_mutex_);

     if (!tracing_enabled_) {

       return;

     }


     auto it = per_client_events_by_ext_correlation_.find(client_handle);

     if (it == per_client_events_by_ext_correlation_.end()) {

       // not a registered client, do nothing

       return;

     }


     // external_correlation_id is simply the timestamp of this event,

     // relative to profiling_start_time. i.e., it was computed as:

     // external_correlation_id =

     //      std::chrono::duration_cast<std::chrono::microseconds>(event_start_time - profiling_start_time).count()

     //

     // Because of the relative nature of the external_correlation_id, the same

     // external_correlation_id can be reused across different clients, which then makes it

     // impossible to recover the client from the external_correlation_id, which in turn

     // makes it impossible to map events (which are tagged with external_correlation_id) to clients.

     //

     // To address these difficulties, we construct a new correlation_id (let's call it unique_cid)

     // as follows:

     // unique_cid =

     //    external_correlation_id +

     //    std::chrono::duration_cast<std::chrono::microseconds>(profiling_start_time.time_since_epoch()).count()

     // now, unique_cid is monotonically increasing with time, so it can be used to reliably map events to clients.

     //

     // Of course, clients expect lists of events to be returned (on a call to Consume()), that are

     // still keyed on the external_correlation_id that they've specified here, so we need to remember the

     // offset to be subtracted

     uint64_t offset = std::chrono::duration_cast<std::chrono::microseconds>(profiling_start_time.time_since_epoch()).count();

     auto unique_cid = external_correlation_id + offset;

     unique_correlation_id_to_client_offset_[unique_cid] = std::make_pair(client_handle, offset);

     this_as_derived->PushUniqueCorrelation(unique_cid);

   }


   void PopCorrelation(uint64_t& popped_external_correlation_id) {

     auto this_as_derived = static_cast<TDerived*>(this);

     std::lock_guard<std::mutex> lock(manager_instance_mutex_);

     if (!tracing_enabled_) {

       return;

     }

     uint64_t unique_cid;

     this_as_derived->PopUniqueCorrelation(unique_cid);

     // lookup the offset and subtract it before returning popped_external_correlation_id to the client

     auto client_it = unique_correlation_id_to_client_offset_.find(unique_cid);

     if (client_it == unique_correlation_id_to_client_offset_.end()) {

       popped_external_correlation_id = 0;

       return;

     }

     popped_external_correlation_id = unique_cid - client_it->second.second;

   }


   void PopCorrelation() {

     uint64_t unused;

     PopCorrelation(unused);

   }


  protected:

   GPUTracerManager() {

     auto this_as_derived = static_cast<TDerived*>(this);

     uint64_t gpu_ts1, gpu_ts2, cpu_ts;


     // Get the CPU and GPU timestamps to warm up

     gpu_ts1 = this_as_derived->GetGPUTimestampInNanoseconds();

     cpu_ts = this->GetCPUTimestampInNanoseconds();


     // Estimate the skew/offset between the CPU and GPU timestamps.

     gpu_ts1 = this_as_derived->GetGPUTimestampInNanoseconds();

     cpu_ts = this->GetCPUTimestampInNanoseconds();

     gpu_ts2 = this_as_derived->GetGPUTimestampInNanoseconds();


     auto gpu_ts = (gpu_ts1 + gpu_ts2) / 2;

     offset_to_add_to_gpu_timestamps_ = cpu_ts - gpu_ts;

   }


 #if 0

   // Functional API to be implemented by subclasses

   // Included here only for documentation purposes

 protected:

   bool OnStartLogging();

   void OnStopLogging();

   void ProcessActivityBuffers(const std::vector<ProfilerActivityBuffer>& buffers,

                               const TimePoint& start_time);

   bool PushUniqueCorrelation(uint64_t unique_cid);

   void PopUniqueCorrelation(uint64_t& popped_unique_cid);

   void FlushActivities();

   uint64_t GetGPUTimestampInNanoseconds();

 #endif


   void EnqueueActivityBuffer(ProfilerActivityBuffer&& buffer) {

     std::lock_guard<std::mutex> lock(unprocessed_activity_buffers_mutex_);

     unprocessed_activity_buffers_.emplace_back(std::move(buffer));

   }


   // To be called by subclasses only from ProcessActivityBuffers

   void MapEventToClient(uint64_t tracer_correlation_id, EventRecord&& event) {

     auto it = tracer_correlation_to_unique_correlation_.find(tracer_correlation_id);

     if (it == tracer_correlation_to_unique_correlation_.end()) {

       // We're yet to receive a mapping to unique_correlation_id for this tracer_correlation_id

       DeferEventMapping(std::move(event), tracer_correlation_id);

       return;

     }

     auto unique_correlation_id = it->second;

     auto p_event_list = GetEventListForUniqueCorrelationId(unique_correlation_id);

     if (p_event_list != nullptr) {

       p_event_list->emplace_back(std::move(event));

     }

   }


   // To be called by subclasses only from ProcessActivityBuffers

   void NotifyNewCorrelation(uint64_t tracer_correlation_id, uint64_t unique_correlation_id) {

     tracer_correlation_to_unique_correlation_[tracer_correlation_id] = unique_correlation_id;

     auto pending_it = events_pending_client_mapping_.find(tracer_correlation_id);

     if (pending_it == events_pending_client_mapping_.end()) {

       return;

     }

     // Map the pending events to the right client

     MapEventsToClient(unique_correlation_id, std::move(pending_it->second));

     events_pending_client_mapping_.erase(pending_it);

   }


   uint64_t NormalizeGPUTimestampToCPUEpoch(uint64_t gpu_timestamp_in_nanoseconds) {

     return gpu_timestamp_in_nanoseconds + this->offset_to_add_to_gpu_timestamps_;

   }


  private:

   // Requires: manager_instance_mutex_ should be held

   void StopLogging() {

     auto this_as_derived = static_cast<TDerived*>(this);

     if (!tracing_enabled_) {

       return;

     }

     this_as_derived->OnStopLogging();

     tracing_enabled_ = false;

     Clear();

   }


   // Requires: manager_instance_mutex_ should be held

   void Clear() {

     unprocessed_activity_buffers_.clear();

     unique_correlation_id_to_client_offset_.clear();

     per_client_events_by_ext_correlation_.clear();

     tracer_correlation_to_unique_correlation_.clear();

     events_pending_client_mapping_.clear();

   }


   Events* GetEventListForUniqueCorrelationId(uint64_t unique_correlation_id) {

     auto client_it = unique_correlation_id_to_client_offset_.find(unique_correlation_id);

     if (client_it == unique_correlation_id_to_client_offset_.end()) {

       return nullptr;

     }


     // See the comments on the GetUniqueCorrelationId method for an explanation of

     // of this offset computation and why it's required.

     auto const& client_handle_offset = client_it->second;

     auto external_correlation = unique_correlation_id - client_handle_offset.second;

     auto& event_list = per_client_events_by_ext_correlation_[client_handle_offset.first][external_correlation];

     return &event_list;

   }


   void MapEventsToClient(uint64_t unique_correlation_id, std::vector<EventRecord>&& events) {

     auto p_event_list = GetEventListForUniqueCorrelationId(unique_correlation_id);

     if (p_event_list != nullptr) {

       p_event_list->insert(p_event_list->end(),

                            std::make_move_iterator(events.begin()),

                            std::make_move_iterator(events.end()));

     }

   }


   void DeferEventMapping(EventRecord&& event, uint64_t tracer_correlation_id) {

     events_pending_client_mapping_[tracer_correlation_id].emplace_back(std::move(event));

   }


   uint64_t GetCPUTimestampInNanoseconds() {

     return std::chrono::duration_cast<std::chrono::nanoseconds>(

                std::chrono::high_resolution_clock::now().time_since_epoch())

         .count();

   }


   std::mutex manager_instance_mutex_;

   uint64_t next_client_id_ = 1;

   uint64_t num_active_clients_ = 0;

   bool tracing_enabled_ = false;

   std::mutex unprocessed_activity_buffers_mutex_;

   std::mutex activity_buffer_processor_mutex_;


   // Unprocessed activity buffers

   std::vector<ProfilerActivityBuffer> unprocessed_activity_buffers_;


   // Keyed on unique_correlation_id -> (client_id/client_handle, offset)

   // unique_correlation_id - offset == external_correlation_id

   InlinedHashMap<uint64_t, std::pair<uint64_t, uint64_t>> unique_correlation_id_to_client_offset_;


   // Keyed on tracer_correlation_id -> unique_correlation_id

   InlinedHashMap<uint64_t, uint64_t> tracer_correlation_to_unique_correlation_;


   // client_id/client_handle -> external_correlation_id -> events

   InlinedHashMap<uint64_t, std::map<uint64_t, Events>> per_client_events_by_ext_correlation_;


   // Keyed on tracer correlation_id, keeps track of activity records

   // for which we haven't established the external_correlation_id yet.

   InlinedHashMap<uint64_t, std::vector<EventRecord>> events_pending_client_mapping_;


   // An offset to add to (the possibly skewed) GPU timestamps

   // to normalize GPU timestamps with CPU timestamps

   int64_t offset_to_add_to_gpu_timestamps_;

 }; /* class GPUTracerManager */


 // Base class for a GPU profiler
 //
 // Implements the EpProfiler entry points on top of a tracer manager.
 // TManager must provide a static GetInstance() whose result offers
 // StartLogging(), Consume(), PushCorrelation() and PopCorrelation().
 template <typename TManager>
 class GPUProfilerBase : public EpProfiler {
  protected:
   GPUProfilerBase() = default;
   virtual ~GPUProfilerBase() = default;

   // Merges the GPU events in `events_to_merge` (keyed by the timestamp of
   // their parent event) into `events`. Each group of GPU events is placed
   // directly after the last event whose `ts` equals the group's key; when
   // such a parent exists, the GPU events inherit its "op_name" argument and
   // get its name as "parent_name". Both inputs are moved from; the merged
   // list is returned through `events`.
   // NOTE(review): the single forward pass assumes `events` is ordered by
   // ascending `ts` -- confirm with the callers.
   void MergeEvents(std::map<uint64_t, Events>& events_to_merge, Events& events) {
     Events merged_events;

     // Plain iterators plus explicit std::move are used here rather than
     // std::move_iterator, whose operator-> is deprecated since C++20.
     auto event_iter = events.begin();
     const auto event_end = events.end();
     for (auto& map_iter : events_to_merge) {
       auto& gpu_events = map_iter.second;
       if (gpu_events.empty()) {
         continue;
       }

       auto ts = static_cast<long long>(map_iter.first);

       // find the last occurrence of a matching timestamp,
       // if one exists
       while (event_iter != event_end &&
              (event_iter->ts < ts ||
               (event_iter->ts == ts &&
                (event_iter + 1) != event_end &&
                (event_iter + 1)->ts == ts))) {
         merged_events.emplace_back(std::move(*event_iter));
         ++event_iter;
       }

       if (event_iter != event_end && event_iter->ts == ts) {
         // We've located a parent event, copy the op_name and set
         // each GPU event's parent_name property to the name of the parent.
         // The names are read before the parent itself is moved away.
         std::string op_name = event_iter->args["op_name"];
         std::string parent_name = event_iter->name;
         merged_events.emplace_back(std::move(*event_iter));
         ++event_iter;

         for (auto& evt : gpu_events) {
           evt.args["op_name"] = op_name;
           evt.args["parent_name"] = parent_name;
         }
       }

       merged_events.insert(merged_events.end(),
                            std::make_move_iterator(gpu_events.begin()),
                            std::make_move_iterator(gpu_events.end()));
     }

     // move any remaining events
     merged_events.insert(merged_events.end(),
                          std::make_move_iterator(event_iter),
                          std::make_move_iterator(event_end));
     std::swap(events, merged_events);
   }

   // Handle identifying this profiler towards the manager. This class never
   // assigns it; it defaults to 0 so that it is not left indeterminate.
   // NOTE(review): presumably subclasses set it from the manager's
   // RegisterClient() -- confirm.
   uint64_t client_handle_ = 0;

   // Start time passed to the most recent StartProfiling() call.
   TimePoint profiling_start_time_;

  public:
   // Asks the manager to start logging and remembers the start time.
   // Always returns true.
   bool StartProfiling(TimePoint profiling_start_time) override {
     auto& manager = TManager::GetInstance();
     manager.StartLogging();
     profiling_start_time_ = profiling_start_time;
     return true;
   }

   // Collects the GPU events recorded for this client and merges them into
   // `events`.
   void EndProfiling(TimePoint start_time, Events& events) override {
     auto& manager = TManager::GetInstance();
     std::map<uint64_t, Events> event_map;
     manager.Consume(client_handle_, start_time, event_map);
     MergeEvents(event_map, events);
   }

   // Marks `id` as the active correlation id for this client.
   void Start(uint64_t id) override {
     auto& manager = TManager::GetInstance();
     manager.PushCorrelation(client_handle_, id, profiling_start_time_);
   }

   // Ends the most recently started correlation; the argument is ignored.
   void Stop(uint64_t) override {
     auto& manager = TManager::GetInstance();
     manager.PopCorrelation();
   }
 }; /* class GPUProfilerBase */


 // Formats the address held by `ptr` as text, using a string stream that has
 // been switched to hexadecimal output.
 static inline std::string PointerToHexString(const void* ptr) {
   std::ostringstream hex_stream;
   hex_stream << std::hex;
   hex_stream << ptr;
   std::string formatted = hex_stream.str();
   return formatted;
 }


 } /* end namespace profiling */

 } /* end namespace onnxruntime */

onnxruntime::profiling::ProfilerActivityBuffer::CreateFromPreallocatedBuffer
static ProfilerActivityBuffer CreateFromPreallocatedBuffer(std::unique_ptr< char[]> &&buffer_ptr, size_t size)
Definition: gpu_profiler_common.h:71

onnxruntime::profiling::GPUTracerManager::ORT_DISALLOW_COPY_ASSIGNMENT_AND_MOVE
ORT_DISALLOW_COPY_ASSIGNMENT_AND_MOVE(GPUTracerManager)

onnxruntime::profiling::ProfilerActivityBuffer::ProfilerActivityBuffer
ProfilerActivityBuffer(ProfilerActivityBuffer &&other) noexcept
Definition: gpu_profiler_common.h:47

onnxruntime::profiling::GPUProfilerBase::GPUProfilerBase
GPUProfilerBase()=default

data
GLboolean * data
Definition: glcorearb.h:131

std::swap
void swap(UT::ArraySet< Key, MULTI, MAX_LOAD_FACTOR_256, Clearer, Hash, KeyEqual > &a, UT::ArraySet< Key, MULTI, MAX_LOAD_FACTOR_256, Clearer, Hash, KeyEqual > &b)
Definition: UT_ArraySet.h:1631

string
GLsizei const GLchar *const * string
Definition: glcorearb.h:814

onnxruntime::profiling::GPUTracerManager::RegisterClient
uint64_t RegisterClient()
Definition: gpu_profiler_common.h:94

onnxruntime::profiling::EpProfiler
Definition: profiler_common.h:79

onnxruntime::profiling::ProfilerActivityBuffer::GetData
char * GetData()
Definition: gpu_profiler_common.h:79

onnxruntime::profiling::GPUProfilerBase::MergeEvents
void MergeEvents(std::map< uint64_t, Events > &events_to_merge, Events &events)
Definition: gpu_profiler_common.h:379

onnxruntime::profiling::GPUTracerManager::EnqueueActivityBuffer
void EnqueueActivityBuffer(ProfilerActivityBuffer &&buffer)
Definition: gpu_profiler_common.h:253

onnxruntime::profiling::GPUProfilerBase::Start
virtual void Start(uint64_t id) override
Definition: gpu_profiler_common.h:453

event
struct _cl_event * event
Definition: glcorearb.h:2961

onnxruntime::profiling::GPUTracerManager::DeregisterClient
void DeregisterClient(uint64_t client_handle)
Definition: gpu_profiler_common.h:102

offset
GLintptr offset
Definition: glcorearb.h:665

buffer
Definition: core.h:760

onnxruntime::profiling::ProfilerActivityBuffer::ProfilerActivityBuffer
ProfilerActivityBuffer() noexcept
Definition: gpu_profiler_common.h:36

onnxruntime::profiling::GPUTracerManager::~GPUTracerManager
virtual ~GPUTracerManager()
Definition: gpu_profiler_common.h:92

onnxruntime::profiling::GPUTracerManager::Consume
void Consume(uint64_t client_handle, const TimePoint &start_time, std::map< uint64_t, Events > &events)
Definition: gpu_profiler_common.h:125

onnxruntime::profiling::GPUProfilerBase::EndProfiling
virtual void EndProfiling(TimePoint start_time, Events &events) override
Definition: gpu_profiler_common.h:446

onnxruntime::TimePoint
std::chrono::high_resolution_clock::time_point TimePoint
Definition: common.h:43

onnxruntime::profiling::ProfilerActivityBuffer
Definition: gpu_profiler_common.h:34

buffers
const GLuint * buffers
Definition: glcorearb.h:661

onnxruntime::profiling::GPUTracerManager::MapEventToClient
void MapEventToClient(uint64_t tracer_correlation_id, EventRecord &&event)
Definition: gpu_profiler_common.h:259

onnxruntime::profiling::GPUProfilerBase::client_handle_
uint64_t client_handle_
Definition: gpu_profiler_common.h:435

onnxruntime::profiling::Events
std::vector< EventRecord > Events
Definition: profiler_common.h:76

onnxruntime::profiling::ProfilerActivityBuffer::ProfilerActivityBuffer
ProfilerActivityBuffer(const char *data, size_t size) noexcept
Definition: gpu_profiler_common.h:39

onnxruntime::profiling::GPUTracerManager::StartLogging
void StartLogging()
Definition: gpu_profiler_common.h:115

profiler_common.h

onnxruntime::profiling::GPUTracerManager::PushCorrelation
void PushCorrelation(uint64_t client_handle, uint64_t external_correlation_id, TimePoint profiling_start_time)
Definition: gpu_profiler_common.h:158

onnxruntime::profiling::GPUTracerManager::PopCorrelation
void PopCorrelation()
Definition: gpu_profiler_common.h:216

onnxruntime::profiling::GPUTracerManager
Definition: gpu_profiler_common.h:89

onnxruntime::profiling::ProfilerActivityBuffer::operator=
ProfilerActivityBuffer & operator=(ProfilerActivityBuffer &&other) noexcept
Definition: gpu_profiler_common.h:62

inlined_containers.h

size
GLsizeiptr size
Definition: glcorearb.h:664

onnxruntime::profiling::ProfilerActivityBuffer::GetData
const char * GetData() const
Definition: gpu_profiler_common.h:80

onnxruntime::profiling::GPUProfilerBase
Definition: gpu_profiler_common.h:374

onnxruntime::profiling::GPUTracerManager::PopCorrelation
void PopCorrelation(uint64_t &popped_external_correlation_id)
Definition: gpu_profiler_common.h:199

onnxruntime::profiling::GPUProfilerBase::Stop
virtual void Stop(uint64_t) override
Definition: gpu_profiler_common.h:458

onnxruntime::profiling::EventRecord
Definition: profiler_common.h:30

ptr
auto ptr(T p) -> const void *
Definition: format.h:2448

onnxruntime::profiling::ProfilerActivityBuffer::GetSize
size_t GetSize() const
Definition: gpu_profiler_common.h:81

onnxruntime::profiling::ProfilerActivityBuffer::ProfilerActivityBuffer
ProfilerActivityBuffer(const ProfilerActivityBuffer &other) noexcept
Definition: gpu_profiler_common.h:44

onnxruntime::profiling::ProfilerActivityBuffer::operator=
ProfilerActivityBuffer & operator=(const ProfilerActivityBuffer &other) noexcept
Definition: gpu_profiler_common.h:53

onnxruntime::profiling::GPUTracerManager::NotifyNewCorrelation
void NotifyNewCorrelation(uint64_t tracer_correlation_id, uint64_t unique_correlation_id)
Definition: gpu_profiler_common.h:274

onnxruntime::profiling::GPUProfilerBase::~GPUProfilerBase
virtual ~GPUProfilerBase()
Definition: gpu_profiler_common.h:377

onnxruntime::profiling::GPUTracerManager::GPUTracerManager
GPUTracerManager()
Definition: gpu_profiler_common.h:222

onnxruntime::profiling::GPUProfilerBase::profiling_start_time_
TimePoint profiling_start_time_
Definition: gpu_profiler_common.h:436

onnxruntime::profiling::GPUProfilerBase::StartProfiling
virtual bool StartProfiling(TimePoint profiling_start_time) override
Definition: gpu_profiler_common.h:439

onnxruntime::profiling::GPUTracerManager::NormalizeGPUTimestampToCPUEpoch
uint64_t NormalizeGPUTimestampToCPUEpoch(uint64_t gpu_timestamp_in_nanoseconds)
Definition: gpu_profiler_common.h:285

count
GLint GLsizei count
Definition: glcorearb.h:405

data
Definition: format.h:895