mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-02 04:31:25 +00:00
* [CK TILE STREAMK] Introduce initial support for tile engine in streamk GEMM. - This commit lays the groundwork for integrating the tile engine into streamk GEMM. It focuses on creating benchmark executables for streamk GEMM. - Additional scripts like test_benchmark.sh and gemm_benchmark.py will be added once the streamk implementation reaches stability. * [CK TILE STREAMK] Enable CI to execute tile engine benchmarks for StreamK GEMM * [CK TILE STREAMK] Refactor: Extract common utility functions. * [CK TILE STREAMK] Revise tile engine of streamk to align with the updated implementation * Add pre-commit * [CK TILE STREAMK] Add 'dp_persistent' and 'reduction_strategy' in output of CK TILE STREAMK * [CK TILE STREAMK] Fix a bug about value of 'dp_persistent' of CK TILE STREAMK * [CK TILE STREAMK] Update Jenkinsfile * [CK TILE Engine] Update StreamK tile engine help message Remove default value messages as they are automatically printed * [CK TILE Engine] Update StreamK tile engine - Remove namespace reboot * [CK TILE Engine] Update StreamK tile engine - Fix merge error
106 lines
1.9 KiB
JSON
106 lines
1.9 KiB
JSON
{
    "problem": {
    },
    "tile_config": {
        "tile_m": {
            "max": 256,
            "min": 64,
            "step": 64
        },
        "tile_n": {
            "max": 256,
            "min": 64,
            "step": 64
        },
        "tile_k": {
            "max": 256,
            "min": 64,
            "step": 64
        },
        "warp_m": {
            "values": [
                4,
                2,
                1
            ]
        },
        "warp_n": {
            "values": [
                4,
                2,
                1
            ]
        },
        "warp_k": {
            "values": [
                1
            ]
        },
        "warp_tile_m": {
            "values": [
                4,
                16,
                32
            ]
        },
        "warp_tile_n": {
            "values": [
                16,
                32,
                64
            ]
        },
        "warp_tile_k": {
            "values": [
                8,
                16,
                32,
                64,
                128
            ]
        }
    },
    "trait_config": {
        "pipeline": {
            "values": [
                "compv3"
            ]
        },
        "scheduler": {
            "values": [
                "intrawave"
            ]
        },
        "epilogue": {
            "values": [
                "cshuffle"
            ]
        },
        "pad_m": {
            "values": [
                false
            ]
        },
        "pad_n": {
            "values": [
                false
            ]
        },
        "pad_k": {
            "values": [
                false
            ]
        },
        "persistent": {
            "values": [
                false, true
            ]
        },
        "reduction_strategy": {
            "values": [
                "reduction", "atomic"
            ]
        }
    }
}