Add host API (#220)

* Add host API

* manually rebase on develop

* clean

* manually rebase on develop

* exclude tests from all target

* address review comments

* update client app name

* fix missing lib name

* clang-format update

* refactor

* refactor

* refactor

* refactor

* refactor

* fix test issue

* refactor

* refactor

* refactor

* upate cmake and readme

Co-authored-by: Chao Liu <chao.liu2@amd.com>
This commit is contained in:
JD
2022-05-12 09:21:01 -05:00
committed by GitHub
parent 0f912e205e
commit cec69bc3bc
131 changed files with 1666 additions and 1089 deletions

View File

@@ -44,7 +44,7 @@ int profile_conv_bwd_data(int argc, char* argv[])
printf("arg6: verification (0: no; 1: yes)\n");
printf("arg7: initialization (0: no init; 1: integer value; 2: decimal value)\n");
printf("arg8: print tensor value (0: no; 1: yes)\n");
printf("arg9: run kernel # of times (>1)\n");
printf("arg9: time kernel (0=n0, 1=yes)\n");
printf("arg10 to 24: N, K, C, Y, X, Hi, Wi, Sy, Sx, Dy, Dx, LeftPy, LeftPx, RightPy, "
"RightPx\n");
exit(1);
@@ -57,7 +57,7 @@ int profile_conv_bwd_data(int argc, char* argv[])
const bool do_verification = std::stoi(argv[6]);
const int init_method = std::stoi(argv[7]);
const bool do_log = std::stoi(argv[8]);
const int nrepeat = std::stoi(argv[9]);
const bool time_kernel = std::stoi(argv[9]);
const ck::index_t N = std::stoi(argv[10]);
const ck::index_t K = std::stoi(argv[11]);
@@ -96,7 +96,7 @@ int profile_conv_bwd_data(int argc, char* argv[])
do_verification,
init_method,
do_log,
nrepeat,
StreamControl{nullptr, time_kernel},
N,
K,
C,
@@ -122,7 +122,7 @@ int profile_conv_bwd_data(int argc, char* argv[])
do_verification,
init_method,
do_log,
nrepeat,
StreamControl{nullptr, time_kernel},
N,
K,
C,
@@ -148,7 +148,7 @@ int profile_conv_bwd_data(int argc, char* argv[])
do_verification,
init_method,
do_log,
nrepeat,
StreamControl{nullptr, time_kernel},
N,
K,
C,
@@ -174,7 +174,7 @@ int profile_conv_bwd_data(int argc, char* argv[])
do_verification,
init_method,
do_log,
nrepeat,
StreamControl{nullptr, time_kernel},
N,
K,
C,