mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 22:39:03 +00:00
* fix compile error * fix typo of padding * Add smoothquant op * Add smoothquant instance library * refine type * add test script * Re-generate smoothquant.hpp * Always use 'current year' in copyright * use Generic2dBlockShape instead * Add vector = 8 instance back * Find exe path automatically * Simplify the api condition * Remove debugging code * update year * Add blank line between function declaration * explicitly cast return value to dim3 * refine return value * Fix default warmup and repeat value * Add comment * refactor sommthquant cmake * Add README * Fix typo --------- Co-authored-by: Po Yen, Chen <PoYen.Chen@amd.com>
90 lines
2.8 KiB
Python
90 lines
2.8 KiB
Python
from datetime import datetime
|
|
import pathlib
|
|
from pathlib import Path
|
|
import subprocess
|
|
import os
|
|
import copy
|
|
|
|
NS = 'ck_tile'
|
|
OPS = 'ops'
|
|
OPS_COMMON = 'common' # common header will be duplicated into ops/* other module
|
|
|
|
HEADER_COMMON = f"""// SPDX-License-Identifier: MIT
|
|
// Copyright (c) 2018-{datetime.now().year}, Advanced Micro Devices, Inc. All rights reserved.\n
|
|
"""
|
|
|
|
# aa/bb/cc/file.hpp -> (aa, bb, cc, file.hpp)
|
|
def get_module(f, level = 0):
|
|
all_parts = f.parts
|
|
return str(all_parts[level])
|
|
|
|
all_files = []
|
|
for p in sorted(Path("./").rglob("*")):
|
|
if p.suffix == '.hpp':
|
|
all_files.append(pathlib.PurePath(p))
|
|
|
|
class submodule_t:
|
|
def __init__(self):
|
|
self.m = dict()
|
|
def push(self, f):
|
|
if len(f.parents) != 1: # ignore ./xxx.hpp
|
|
mod = get_module(f)
|
|
if mod == OPS:
|
|
if mod not in self.m.keys():
|
|
self.m[mod] = dict()
|
|
mod2 = get_module(f, 1)
|
|
if Path(mod2).suffix != '.hpp':
|
|
# ignore ops/xxx.hpp
|
|
if mod2 not in self.m[mod].keys():
|
|
self.m[mod][mod2] = list()
|
|
self.m[mod][mod2].append(f)
|
|
else:
|
|
if mod not in self.m.keys():
|
|
self.m[mod] = list()
|
|
self.m[mod].append(f)
|
|
|
|
def gen(self):
|
|
def gen_header(hpath, include_list):
|
|
# print(hpath)
|
|
if os.path.exists(str(hpath)):
|
|
os.remove(str(hpath))
|
|
with hpath.open('w') as f:
|
|
f.write(HEADER_COMMON)
|
|
f.write('#pragma once\n')
|
|
f.write('\n')
|
|
for individual_header in include_list:
|
|
header_path = NS + '/' + str(individual_header)
|
|
f.write(f'#include \"{header_path}\"\n')
|
|
# f.write('\n') # otherwise clang-format will complain
|
|
# print(self.m)
|
|
# restructure common
|
|
for k, v in self.m.items():
|
|
if k == OPS and OPS_COMMON in v.keys():
|
|
common_list = copy.deepcopy(v[OPS_COMMON])
|
|
# v.pop(OPS_COMMON)
|
|
for km in v.keys():
|
|
if km != OPS_COMMON:
|
|
v[km].extend(common_list)
|
|
|
|
for k, v in self.m.items():
|
|
if k == OPS:
|
|
for km, kv in v.items():
|
|
gen_header(Path(k) / (f'{km}.hpp'), kv)
|
|
else:
|
|
gen_header(Path(f'{k}.hpp'), v)
|
|
|
|
|
|
submodule = submodule_t()
|
|
# formatting
|
|
for x in all_files:
|
|
subprocess.Popen(f'dos2unix {str(x)}', shell=True)
|
|
cmd = f'clang-format-12 -style=file -i {str(x)}'
|
|
#for xp in x.parents:
|
|
#print(get_file_base(x))
|
|
subprocess.Popen(cmd, shell=True)
|
|
submodule.push(x)
|
|
|
|
submodule.gen()
|
|
|
|
#print(all_files)
|