mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-17 11:30:02 +00:00
Modularize ckProfiler operations (#514)
* Re-structure ckProfiler source files
* Rename profiler.cpp to main.cpp
* Modularize ckProfiler operations
* Add description for profiler operations
* Use longer name to avoid name collision
* Use macro to delay expansion
* Use std::move() to avoid object copying
* Prohibit users from calling dtor
* Use macro to eliminate redundant code
* Make friend function hidden
* Add missing include directive <iostream>
* Fix wrong include directives
* Remove int8 from batchnorm-forward instances, since it is not needed for forward training and could cause tests to fail
Co-authored-by: Qianfeng Zhang <Qianfeng.Zhang@amd.com>
[ROCm/composable_kernel commit: 8784a72e23]
This commit is contained in:
@@ -13,8 +13,9 @@
|
||||
|
||||
#include "ck/library/utility/host_common_util.hpp"
|
||||
|
||||
#include "profiler/include/profile_reduce_impl.hpp"
|
||||
#include "profiler/include/data_type_enum.hpp"
|
||||
#include "profiler/profile_reduce_impl.hpp"
|
||||
#include "profiler/data_type_enum.hpp"
|
||||
#include "profiler_operation_registry.hpp"
|
||||
|
||||
using namespace std;
|
||||
|
||||
@@ -429,3 +430,5 @@ int profile_reduce(int argc, char* argv[])
|
||||
|
||||
return (0);
|
||||
};
|
||||
|
||||
// Hooks profile_reduce into the profiler via the registration macro.
// NOTE(review): the arguments look like (operation name, description, entry
// function) -- confirm against profiler_operation_registry.hpp.
REGISTER_PROFILER_OPERATION("reduce", "Reduce", profile_reduce);
|
||||
|
||||
Reference in New Issue
Block a user