OClCollMeshEngn: perf profile and print kernel exec durations

This commit is contained in:
2025-11-12 13:03:39 -04:00
parent 33b534355a
commit d87c71b794
3 changed files with 49 additions and 0 deletions
@@ -164,6 +164,12 @@ public:
std::cout << __func__ << ": Successfully compacted and collated frame" << std::endl;
}
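// Print the compact and collate kernel execution durations (values are labelled "ms"; assumes both getters return millisecond-based durations -- TODO confirm)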
auto compactDuration = stimBuff.openClCollatingAndMeshingEngine.getCompactKernelDuration();
auto collateDuration = stimBuff.openClCollatingAndMeshingEngine.getCollateKernelDuration();
std::cout << __func__ << ": compactKernelDuration=" << compactDuration.count()
<< "ms, collateKernelDuration=" << collateDuration.count() << "ms" << std::endl;
callOriginalCallback();
}
};