From 3c6aae58f78a5486c01da2ab7f822bf09fdcdcd8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ville=20Pietil=C3=A4?= <> Date: Wed, 5 Nov 2025 04:08:53 -0600 Subject: [PATCH] Refactor JSON scripts. --- ...nvert_instantiations_to_structured_json.py | 21 +- ...orward_conv_structured_instantiations.json | 2849 +++++++++-------- .../move_elementwise_to_signature.py | 67 + .../instances/refactor_json_structure.py | 82 + 4 files changed, 1585 insertions(+), 1434 deletions(-) create mode 100644 experimental/builder/instances/move_elementwise_to_signature.py create mode 100644 experimental/builder/instances/refactor_json_structure.py diff --git a/experimental/builder/instances/convert_instantiations_to_structured_json.py b/experimental/builder/instances/convert_instantiations_to_structured_json.py index efa7d069f9..9671fb37f0 100644 --- a/experimental/builder/instances/convert_instantiations_to_structured_json.py +++ b/experimental/builder/instances/convert_instantiations_to_structured_json.py @@ -63,10 +63,10 @@ def parse_xdl_cshuffle_params(params: List[str]) -> Dict[str, Any]: "shuffle": map_data_type(params[8]) if len(params) > 8 else "FP32", "output": map_data_type(params[10]) if len(params) > 10 else "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": int(params[17]) if len(params) > 17 else 256, @@ -183,10 +183,10 @@ def parse_xdl_cshuffle_v3_params(params: List[str]) -> Dict[str, Any]: "shuffle": map_data_type(params[8]) if len(params) > 8 else "FP32", "output": map_data_type(params[10]) if len(params) > 10 else "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": int(params[16]) if len(params) > 16 else 256, @@ -311,10 +311,10 @@ def parse_xdl_cshuffle_params_with_lds_extra(params: List[str]) -> Dict[str, Any "shuffle": map_data_type(params[8]) if len(params) > 8 else "FP32", "output": map_data_type(params[10]) if len(params) > 10 else "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": int(params[17]) if len(params) > 17 else 256, @@ -427,10 +427,10 @@ def parse_wmma_cshuffle_params(params: List[str]) -> Dict[str, Any]: "shuffle": map_data_type(params[8]) if len(params) > 8 else "FP16", "output": map_data_type(params[10]) if len(params) > 10 else "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleD_Wmma_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleD_Wmma_CShuffle", "algorithm_type": "WMMA", "thread_block": { "block_size": int(params[17]) if len(params) > 17 else 128, @@ -648,11 +648,11 @@ def convert_instantiations(input_file: str, output_file: str): "shuffle": "enum (FP32, FP16, BF16, FP8, I8, I32, U8)", "output": "enum (FP32, FP16, BF16, FP8, I8, I32, U8)" }, - "elementwise_operation": "enum (BIAS, BIAS_CLAMP, BIAS_BNORM_CLAMP, BILINEAR, CLAMP, SCALE, PASS_THROUGH)", - "device_operation": "string (DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle, DeviceGroupedConvFwdMultipleD_Wmma_CShuffle, etc.)" + "elementwise_operation": "enum (BIAS, BIAS_CLAMP, BIAS_BNORM_CLAMP, BILINEAR, CLAMP, SCALE, PASS_THROUGH)" }, "algorithm_xdl": { "description": "Algorithm schema for XDL-based operations (algorithm_type = 'XDL')", + "device_operation": "string (DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle, DeviceGroupedConvFwdMultipleD_Wmma_CShuffle, etc.)", "algorithm_type": "string literal 'XDL'", "gridwise_xdl_gemm": { "ak1": "integer - A matrix K dimension vectorization", @@ -666,6 +666,7 @@ def convert_instantiations(input_file: str, output_file: str): }, "algorithm_wmma": { "description": "Algorithm schema for WMMA-based operations (algorithm_type = 'WMMA')", + "device_operation": "string (DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle, DeviceGroupedConvFwdMultipleD_Wmma_CShuffle, etc.)", "algorithm_type": "string literal 'WMMA'", "gridwise_wmma_gemm": { "k1": "integer - K dimension vectorization", diff --git a/experimental/builder/instances/forward_conv_structured_instantiations.json b/experimental/builder/instances/forward_conv_structured_instantiations.json index 4c4ca07f68..b47524404d 100644 --- a/experimental/builder/instances/forward_conv_structured_instantiations.json +++ b/experimental/builder/instances/forward_conv_structured_instantiations.json @@ -22,10 +22,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -142,10 +142,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -262,10 +262,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -382,10 +382,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -502,10 +502,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -622,10 +622,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -742,10 +742,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -862,10 +862,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -982,10 +982,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -1102,10 +1102,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -1222,10 +1222,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -1342,10 +1342,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -1462,10 +1462,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -1582,10 +1582,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -1702,10 +1702,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -1822,10 +1822,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -1942,10 +1942,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -2062,10 +2062,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -2182,10 +2182,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -2302,10 +2302,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -2422,10 +2422,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -2542,10 +2542,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -2662,10 +2662,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -2782,10 +2782,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -2902,10 +2902,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -3022,10 +3022,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -3142,10 +3142,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -3262,10 +3262,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -3382,10 +3382,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -3502,10 +3502,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -3622,10 +3622,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -3742,10 +3742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -3862,10 +3862,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -3982,10 +3982,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -4102,10 +4102,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -4222,10 +4222,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -4342,10 +4342,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -4462,10 +4462,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -4582,10 +4582,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -4702,10 +4702,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -4822,10 +4822,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -4942,10 +4942,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -5062,10 +5062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -5182,10 +5182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -5302,10 +5302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -5422,10 +5422,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -5542,10 +5542,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -5662,10 +5662,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -5782,10 +5782,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -5902,10 +5902,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -6022,10 +6022,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -6142,10 +6142,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -6262,10 +6262,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -6382,10 +6382,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -6502,10 +6502,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -6622,10 +6622,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -6742,10 +6742,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -6862,10 +6862,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -6982,10 +6982,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -7102,10 +7102,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -7222,10 +7222,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -7342,10 +7342,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -7462,10 +7462,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -7582,10 +7582,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -7702,10 +7702,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -7822,10 +7822,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -7942,10 +7942,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8062,10 +8062,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8182,10 +8182,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8302,10 +8302,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8422,10 +8422,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8542,10 +8542,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8662,10 +8662,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8782,10 +8782,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -8902,10 +8902,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9022,10 +9022,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9142,10 +9142,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9262,10 +9262,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9382,10 +9382,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9502,10 +9502,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9622,10 +9622,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9742,10 +9742,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9862,10 +9862,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -9982,10 +9982,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -10102,10 +10102,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -10222,10 +10222,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -10342,10 +10342,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -10462,10 +10462,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -10582,10 +10582,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -10702,10 +10702,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -10822,10 +10822,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -10942,10 +10942,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -11062,10 +11062,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -11182,10 +11182,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -11302,10 +11302,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -11422,10 +11422,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -11542,10 +11542,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -11662,10 +11662,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -11782,10 +11782,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -11902,10 +11902,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -12022,10 +12022,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -12142,10 +12142,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -12262,10 +12262,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -12382,10 +12382,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -12502,10 +12502,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -12622,10 +12622,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -12742,10 +12742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -12862,10 +12862,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -12982,10 +12982,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -13102,10 +13102,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -13222,10 +13222,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -13342,10 +13342,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -13462,10 +13462,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -13582,10 +13582,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -13702,10 +13702,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -13822,10 +13822,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -13942,10 +13942,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -14062,10 +14062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -14182,10 +14182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -14302,10 +14302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -14422,10 +14422,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -14542,10 +14542,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -14662,10 +14662,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -14782,10 +14782,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -14902,10 +14902,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -15022,10 +15022,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -15142,10 +15142,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -15262,10 +15262,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -15382,10 +15382,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -15502,10 +15502,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -15622,10 +15622,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -15742,10 +15742,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -15862,10 +15862,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -15982,10 +15982,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -16102,10 +16102,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -16222,10 +16222,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -16342,10 +16342,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -16462,10 +16462,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -16582,10 +16582,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -16702,10 +16702,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -16822,10 +16822,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -16942,10 +16942,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -17062,10 +17062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -17182,10 +17182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -17302,10 +17302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -17422,10 +17422,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -17542,10 +17542,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -17662,10 +17662,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -17782,10 +17782,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -17902,10 +17902,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -18022,10 +18022,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -18142,10 +18142,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -18262,10 +18262,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -18382,10 +18382,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -18502,10 +18502,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -18622,10 +18622,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -18742,10 +18742,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -18862,10 +18862,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -18982,10 +18982,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -19102,10 +19102,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -19222,10 +19222,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -19342,10 +19342,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -19462,10 +19462,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -19582,10 +19582,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -19702,10 +19702,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -19822,10 +19822,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -19942,10 +19942,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -20062,10 +20062,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -20182,10 +20182,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -20302,10 +20302,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -20422,10 +20422,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -20542,10 +20542,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -20662,10 +20662,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -20782,10 +20782,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -20902,10 +20902,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -21022,10 +21022,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -21142,10 +21142,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -21262,10 +21262,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -21382,10 +21382,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -21502,10 +21502,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -21622,10 +21622,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -21742,10 +21742,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -21862,10 +21862,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -21982,10 +21982,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -22102,10 +22102,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -22222,10 +22222,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -22342,10 +22342,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -22462,10 +22462,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -22582,10 +22582,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -22702,10 +22702,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -22822,10 +22822,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -22942,10 +22942,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -23062,10 +23062,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -23182,10 +23182,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -23302,10 +23302,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -23422,10 +23422,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -23542,10 +23542,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -23662,10 +23662,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -23782,10 +23782,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -23902,10 +23902,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -24022,10 +24022,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -24142,10 +24142,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -24262,10 +24262,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -24382,10 +24382,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -24502,10 +24502,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -24622,10 +24622,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -24742,10 +24742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -24862,10 +24862,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -24982,10 +24982,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -25102,10 +25102,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -25222,10 +25222,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -25342,10 +25342,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -25462,10 +25462,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -25582,10 +25582,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -25702,10 +25702,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -25822,10 +25822,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -25942,10 +25942,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -26062,10 +26062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -26182,10 +26182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -26302,10 +26302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -26422,10 +26422,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -26542,10 +26542,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -26662,10 +26662,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -26782,10 +26782,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -26902,10 +26902,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -27022,10 +27022,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -27142,10 +27142,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -27262,10 +27262,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -27382,10 +27382,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -27502,10 +27502,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -27622,10 +27622,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -27742,10 +27742,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -27862,10 +27862,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -27982,10 +27982,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -28102,10 +28102,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -28222,10 +28222,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -28342,10 +28342,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -28462,10 +28462,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -28582,10 +28582,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -28702,10 +28702,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -28822,10 +28822,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -28942,10 +28942,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -29062,10 +29062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -29182,10 +29182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -29302,10 +29302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -29422,10 +29422,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -29542,10 +29542,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -29662,10 +29662,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -29782,10 +29782,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -29902,10 +29902,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -30022,10 +30022,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -30142,10 +30142,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -30262,10 +30262,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -30382,10 +30382,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -30502,10 +30502,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -30622,10 +30622,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -30742,10 +30742,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -30862,10 +30862,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -30982,10 +30982,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -31102,10 +31102,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -31222,10 +31222,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -31342,10 +31342,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -31462,10 +31462,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -31582,10 +31582,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -31702,10 +31702,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -31822,10 +31822,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -31942,10 +31942,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -32062,10 +32062,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -32182,10 +32182,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -32302,10 +32302,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -32422,10 +32422,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -32542,10 +32542,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -32662,10 +32662,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -32782,10 +32782,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -32902,10 +32902,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -33022,10 +33022,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -33142,10 +33142,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -33262,10 +33262,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -33382,10 +33382,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -33502,10 +33502,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -33622,10 +33622,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -33742,10 +33742,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -33862,10 +33862,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -33982,10 +33982,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -34102,10 +34102,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -34222,10 +34222,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -34342,10 +34342,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -34462,10 +34462,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -34582,10 +34582,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -34702,10 +34702,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -34822,10 +34822,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -34942,10 +34942,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -35062,10 +35062,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -35182,10 +35182,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -35302,10 +35302,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -35422,10 +35422,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -35542,10 +35542,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -35662,10 +35662,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -35782,10 +35782,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -35902,10 +35902,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -36022,10 +36022,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -36142,10 +36142,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -36262,10 +36262,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -36382,10 +36382,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -36502,10 +36502,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -36622,10 +36622,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -36742,10 +36742,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -36862,10 +36862,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -36982,10 +36982,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -37102,10 +37102,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -37222,10 +37222,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -37342,10 +37342,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -37462,10 +37462,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -37582,10 +37582,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -37702,10 +37702,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -37822,10 +37822,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -37942,10 +37942,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -38062,10 +38062,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -38182,10 +38182,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -38302,10 +38302,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -38422,10 +38422,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -38542,10 +38542,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -38662,10 +38662,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -38782,10 +38782,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -38902,10 +38902,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -39022,10 +39022,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -39142,10 +39142,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -39262,10 +39262,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -39382,10 +39382,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -39502,10 +39502,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -39622,10 +39622,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -39742,10 +39742,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -39862,10 +39862,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -39982,10 +39982,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -40102,10 +40102,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -40222,10 +40222,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -40342,10 +40342,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -40462,10 +40462,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -40582,10 +40582,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -40702,10 +40702,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -40822,10 +40822,10 @@ "shuffle": "FP32", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -40942,10 +40942,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -41062,10 +41062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -41182,10 +41182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -41302,10 +41302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -41422,10 +41422,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -41542,10 +41542,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -41662,10 +41662,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -41782,10 +41782,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -41902,10 +41902,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -42022,10 +42022,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -42142,10 +42142,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -42262,10 +42262,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -42382,10 +42382,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -42502,10 +42502,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -42622,10 +42622,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -42742,10 +42742,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -42862,10 +42862,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -42982,10 +42982,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -43102,10 +43102,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -43222,10 +43222,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -43342,10 +43342,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -43462,10 +43462,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -43582,10 +43582,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -43702,10 +43702,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -43822,10 +43822,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -43942,10 +43942,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -44062,10 +44062,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -44182,10 +44182,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -44302,10 +44302,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -44422,10 +44422,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -44542,10 +44542,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -44662,10 +44662,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -44782,10 +44782,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -44902,10 +44902,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -45022,10 +45022,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -45142,10 +45142,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -45262,10 +45262,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -45382,10 +45382,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -45502,10 +45502,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -45622,10 +45622,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -45742,10 +45742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -45862,10 +45862,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -45982,10 +45982,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -46102,10 +46102,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -46222,10 +46222,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -46342,10 +46342,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -46462,10 +46462,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -46582,10 +46582,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -46702,10 +46702,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -46822,10 +46822,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -46942,10 +46942,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -47062,10 +47062,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -47182,10 +47182,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -47302,10 +47302,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -47422,10 +47422,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -47542,10 +47542,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -47662,10 +47662,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -47782,10 +47782,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -47902,10 +47902,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -48022,10 +48022,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -48142,10 +48142,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -48262,10 +48262,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -48382,10 +48382,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -48502,10 +48502,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -48622,10 +48622,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -48742,10 +48742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -48862,10 +48862,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -48982,10 +48982,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -49102,10 +49102,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -49222,10 +49222,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -49342,10 +49342,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -49462,10 +49462,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -49582,10 +49582,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -49702,10 +49702,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -49822,10 +49822,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -49942,10 +49942,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -50062,10 +50062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -50182,10 +50182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -50302,10 +50302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -50422,10 +50422,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -50542,10 +50542,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -50662,10 +50662,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -50782,10 +50782,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -50902,10 +50902,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -51022,10 +51022,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -51142,10 +51142,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -51262,10 +51262,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -51382,10 +51382,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -51502,10 +51502,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -51622,10 +51622,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -51742,10 +51742,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -51862,10 +51862,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -51982,10 +51982,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -52102,10 +52102,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -52222,10 +52222,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -52342,10 +52342,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -52462,10 +52462,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -52582,10 +52582,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -52702,10 +52702,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -52822,10 +52822,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -52942,10 +52942,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -53062,10 +53062,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -53182,10 +53182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -53302,10 +53302,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -53422,10 +53422,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -53542,10 +53542,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -53662,10 +53662,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -53782,10 +53782,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -53902,10 +53902,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -54022,10 +54022,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -54142,10 +54142,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -54262,10 +54262,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -54382,10 +54382,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -54502,10 +54502,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -54622,10 +54622,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -54742,10 +54742,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -54862,10 +54862,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -54982,10 +54982,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -55102,10 +55102,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -55222,10 +55222,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -55342,10 +55342,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -55462,10 +55462,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -55582,10 +55582,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -55702,10 +55702,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -55822,10 +55822,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -55942,10 +55942,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -56062,10 +56062,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -56182,10 +56182,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -56302,10 +56302,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -56422,10 +56422,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -56542,10 +56542,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -56662,10 +56662,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -56782,10 +56782,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -56902,10 +56902,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -57022,10 +57022,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -57142,10 +57142,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -57262,10 +57262,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -57382,10 +57382,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -57502,10 +57502,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -57622,10 +57622,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -57742,10 +57742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -57862,10 +57862,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -57982,10 +57982,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -58102,10 +58102,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -58222,10 +58222,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -58342,10 +58342,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -58462,10 +58462,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -58582,10 +58582,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -58702,10 +58702,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -58822,10 +58822,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -58942,10 +58942,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -59062,10 +59062,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -59182,10 +59182,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -59302,10 +59302,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -59422,10 +59422,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -59542,10 +59542,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -59662,10 +59662,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -59782,10 +59782,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -59902,10 +59902,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -60022,10 +60022,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -60142,10 +60142,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -60262,10 +60262,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -60382,10 +60382,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -60502,10 +60502,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -60622,10 +60622,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -60742,10 +60742,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -60862,10 +60862,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -60982,10 +60982,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -61102,10 +61102,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -61222,10 +61222,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -61342,10 +61342,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -61462,10 +61462,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -61582,10 +61582,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -61702,10 +61702,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -61822,10 +61822,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -61942,10 +61942,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -62062,10 +62062,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -62182,10 +62182,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -62302,10 +62302,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -62422,10 +62422,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -62542,10 +62542,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -62662,10 +62662,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -62782,10 +62782,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -62902,10 +62902,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -63022,10 +63022,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -63142,10 +63142,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -63262,10 +63262,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -63382,10 +63382,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -63502,10 +63502,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -63622,10 +63622,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -63742,10 +63742,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -63862,10 +63862,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -63982,10 +63982,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -64102,10 +64102,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -64222,10 +64222,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -64342,10 +64342,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -64462,10 +64462,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -64582,10 +64582,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -64702,10 +64702,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -64822,10 +64822,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -64942,10 +64942,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -65062,10 +65062,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -65182,10 +65182,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -65302,10 +65302,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -65422,10 +65422,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -65542,10 +65542,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -65662,10 +65662,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -65782,10 +65782,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -65902,10 +65902,10 @@ "shuffle": "FP8", "output": "FP8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -66022,10 +66022,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -66142,10 +66142,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -66262,10 +66262,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -66382,10 +66382,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -66502,10 +66502,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -66622,10 +66622,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -66742,10 +66742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -66862,10 +66862,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -66982,10 +66982,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -67102,10 +67102,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -67222,10 +67222,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -67342,10 +67342,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -67462,10 +67462,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -67582,10 +67582,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -67702,10 +67702,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -67822,10 +67822,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -67942,10 +67942,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -68062,10 +68062,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -68182,10 +68182,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -68302,10 +68302,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -68422,10 +68422,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -68538,10 +68538,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -68654,10 +68654,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -68770,10 +68770,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -68886,10 +68886,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69002,10 +69002,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69118,10 +69118,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69234,10 +69234,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69350,10 +69350,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69466,10 +69466,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69582,10 +69582,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69698,10 +69698,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69814,10 +69814,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -69930,10 +69930,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70046,10 +70046,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70162,10 +70162,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70278,10 +70278,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70394,10 +70394,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70510,10 +70510,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70626,10 +70626,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70742,10 +70742,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70858,10 +70858,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -70974,10 +70974,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71090,10 +71090,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71206,10 +71206,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71322,10 +71322,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71438,10 +71438,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71554,10 +71554,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71670,10 +71670,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71786,10 +71786,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -71902,10 +71902,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72018,10 +72018,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72134,10 +72134,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72250,10 +72250,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72366,10 +72366,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72482,10 +72482,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72598,10 +72598,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72714,10 +72714,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72830,10 +72830,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -72946,10 +72946,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73062,10 +73062,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73178,10 +73178,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73294,10 +73294,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73410,10 +73410,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73526,10 +73526,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73642,10 +73642,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73758,10 +73758,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73874,10 +73874,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -73990,10 +73990,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -74106,10 +74106,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -74222,10 +74222,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -74338,10 +74338,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -74454,10 +74454,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -74570,10 +74570,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -74686,10 +74686,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -74802,10 +74802,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -74918,10 +74918,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -75034,10 +75034,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -75150,10 +75150,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -75266,10 +75266,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -75382,10 +75382,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -75498,10 +75498,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -75614,10 +75614,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -75730,10 +75730,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -75846,10 +75846,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -75962,10 +75962,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -76078,10 +76078,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -76194,10 +76194,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -76310,10 +76310,10 @@ "shuffle": "BF16", "output": "BF16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -76426,10 +76426,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -76542,10 +76542,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -76658,10 +76658,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -76774,10 +76774,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -76890,10 +76890,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -77006,10 +77006,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -77122,10 +77122,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -77238,10 +77238,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -77354,10 +77354,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -77470,10 +77470,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -77586,10 +77586,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -77702,10 +77702,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -77818,10 +77818,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -77934,10 +77934,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -78050,10 +78050,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -78166,10 +78166,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -78282,10 +78282,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -78398,10 +78398,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -78514,10 +78514,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -78630,10 +78630,10 @@ "shuffle": "FP16", "output": "FP16" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -78746,10 +78746,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -78862,10 +78862,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -78978,10 +78978,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -79094,10 +79094,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -79210,10 +79210,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -79326,10 +79326,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -79442,10 +79442,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -79558,10 +79558,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -79674,10 +79674,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -79790,10 +79790,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -79906,10 +79906,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -80022,10 +80022,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -80138,10 +80138,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -80254,10 +80254,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -80370,10 +80370,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -80486,10 +80486,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -80602,10 +80602,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -80718,10 +80718,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -80834,10 +80834,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -80950,10 +80950,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -81066,10 +81066,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -81182,10 +81182,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -81298,10 +81298,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -81414,10 +81414,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -81530,10 +81530,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -81646,10 +81646,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -81762,10 +81762,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -81878,10 +81878,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -81994,10 +81994,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -82110,10 +82110,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -82226,10 +82226,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -82342,10 +82342,10 @@ "shuffle": "FP32", "output": "FP32" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -82458,10 +82458,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -82574,10 +82574,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -82690,10 +82690,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -82806,10 +82806,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -82922,10 +82922,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -83038,10 +83038,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -83154,10 +83154,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -83270,10 +83270,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -83386,10 +83386,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -83502,10 +83502,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -83618,10 +83618,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -83734,10 +83734,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -83850,10 +83850,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 64, @@ -83966,10 +83966,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -84082,10 +84082,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -84198,10 +84198,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -84314,10 +84314,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -84430,10 +84430,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 128, @@ -84546,10 +84546,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -84662,10 +84662,10 @@ "shuffle": "I8", "output": "I8" }, - "elementwise_operation": "PASS_THROUGH", - "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3" + "elementwise_operation": "PASS_THROUGH" }, "algorithm": { + "device_operation": "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3", "algorithm_type": "XDL", "thread_block": { "block_size": 256, @@ -84780,10 +84780,10 @@ "shuffle": "enum (FP32, FP16, BF16, FP8, I8, I32, U8)", "output": "enum (FP32, FP16, BF16, FP8, I8, I32, U8)" }, - "elementwise_operation": "enum (BIAS, BIAS_CLAMP, BIAS_BNORM_CLAMP, BILINEAR, CLAMP, SCALE, PASS_THROUGH)", - "device_operation": "string (DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle, DeviceGroupedConvFwdMultipleD_Wmma_CShuffle, etc.)" + "elementwise_operation": "enum (BIAS, BIAS_CLAMP, BIAS_BNORM_CLAMP, BILINEAR, CLAMP, SCALE, PASS_THROUGH)" }, "algorithm_xdl": { + "device_operation": "string (DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle, DeviceGroupedConvFwdMultipleD_Wmma_CShuffle, etc.)", "description": "Algorithm schema for XDL-based operations (algorithm_type = 'XDL')", "algorithm_type": "string literal 'XDL'", "gridwise_xdl_gemm": { @@ -84797,6 +84797,7 @@ "note": "Use gridwise_xdl_gemm for XDL-based convolution operations" }, "algorithm_wmma": { + "device_operation": "string (DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle, DeviceGroupedConvFwdMultipleD_Wmma_CShuffle, etc.)", "description": "Algorithm schema for WMMA-based operations (algorithm_type = 'WMMA')", "algorithm_type": "string literal 'WMMA'", "gridwise_wmma_gemm": { diff --git a/experimental/builder/instances/move_elementwise_to_signature.py b/experimental/builder/instances/move_elementwise_to_signature.py new file mode 100644 index 0000000000..b26c541757 --- /dev/null +++ b/experimental/builder/instances/move_elementwise_to_signature.py @@ -0,0 +1,67 @@ +#!/usr/bin/env python3 +""" +Script to move elementwise_operation back to signature section +while keeping device_operation in algorithm section. +""" + +import json +import sys + +def refactor_instantiation(inst: dict) -> dict: + """Move elementwise_operation back to signature, keep device_operation in algorithm""" + + # Extract elementwise_operation from algorithm + elementwise_op = inst["algorithm"].pop("elementwise_operation", "PASS_THROUGH") + + # Add to signature + inst["signature"]["elementwise_operation"] = elementwise_op + + return inst + +def refactor_json(input_file: str, output_file: str): + """Main refactoring function""" + + print(f"Loading {input_file}...") + with open(input_file, 'r') as f: + data = json.load(f) + + print(f"Refactoring {len(data['instantiations'])} instantiations...") + + # Refactor each instantiation + for inst in data["instantiations"]: + refactor_instantiation(inst) + + # Update schema documentation + if "schemas" in data: + # Add elementwise_operation back to signature schema + if "signature" in data["schemas"]: + sig_schema = data["schemas"]["signature"] + # Add after data_type + new_sig_schema = {} + for key, value in sig_schema.items(): + new_sig_schema[key] = value + if key == "data_type": + new_sig_schema["elementwise_operation"] = "enum (BIAS, BIAS_CLAMP, BIAS_BNORM_CLAMP, BILINEAR, CLAMP, SCALE, PASS_THROUGH)" + data["schemas"]["signature"] = new_sig_schema + + # Remove elementwise_operation from algorithm schemas (keep device_operation) + for algo_schema_key in ["algorithm_xdl", "algorithm_wmma"]: + if algo_schema_key in data["schemas"]: + data["schemas"][algo_schema_key].pop("elementwise_operation", None) + + print(f"Writing to {output_file}...") + with open(output_file, 'w') as f: + json.dump(data, f, indent=2) + + print("Done!") + +if __name__ == "__main__": + input_file = "experimental/builder/instances/forward_conv_structured_instantiations.json" + output_file = "experimental/builder/instances/forward_conv_structured_instantiations.json" + + if len(sys.argv) > 1: + input_file = sys.argv[1] + if len(sys.argv) > 2: + output_file = sys.argv[2] + + refactor_json(input_file, output_file) diff --git a/experimental/builder/instances/refactor_json_structure.py b/experimental/builder/instances/refactor_json_structure.py new file mode 100644 index 0000000000..c84d9f4c89 --- /dev/null +++ b/experimental/builder/instances/refactor_json_structure.py @@ -0,0 +1,82 @@ +#!/usr/bin/env python3 +""" +Script to refactor forward_conv_structured_instantiations.json +to move elementwise_operation and device_operation from signature to algorithm. +""" + +import json +import sys + +def refactor_instantiation(inst: dict) -> dict: + """Move elementwise_operation and device_operation from signature to algorithm""" + + # Extract fields from signature + elementwise_op = inst["signature"].pop("elementwise_operation", "PASS_THROUGH") + device_op = inst["signature"].pop("device_operation", "DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle") + + # Add to algorithm at the beginning for better readability + algorithm = inst["algorithm"] + new_algorithm = { + "elementwise_operation": elementwise_op, + "device_operation": device_op + } + + # Copy rest of algorithm fields + for key, value in algorithm.items(): + new_algorithm[key] = value + + inst["algorithm"] = new_algorithm + + return inst + +def refactor_json(input_file: str, output_file: str): + """Main refactoring function""" + + print(f"Loading {input_file}...") + with open(input_file, 'r') as f: + data = json.load(f) + + print(f"Refactoring {len(data['instantiations'])} instantiations...") + + # Refactor each instantiation + for inst in data["instantiations"]: + refactor_instantiation(inst) + + # Update schema documentation + if "schemas" in data: + # Update signature schema - remove elementwise_operation and device_operation + if "signature" in data["schemas"]: + sig_schema = data["schemas"]["signature"] + sig_schema.pop("elementwise_operation", None) + sig_schema.pop("device_operation", None) + + # Add these fields to algorithm schemas + for algo_schema_key in ["algorithm_xdl", "algorithm_wmma"]: + if algo_schema_key in data["schemas"]: + algo_schema = data["schemas"][algo_schema_key] + # Add at the beginning of the description + if "elementwise_operation" not in algo_schema: + # Insert before other fields + new_schema = { + "elementwise_operation": "enum (BIAS, BIAS_CLAMP, BIAS_BNORM_CLAMP, BILINEAR, CLAMP, SCALE, PASS_THROUGH)", + "device_operation": "string (DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle, DeviceGroupedConvFwdMultipleD_Wmma_CShuffle, etc.)" + } + new_schema.update(algo_schema) + data["schemas"][algo_schema_key] = new_schema + + print(f"Writing to {output_file}...") + with open(output_file, 'w') as f: + json.dump(data, f, indent=2) + + print("Done!") + +if __name__ == "__main__": + input_file = "experimental/builder/instances/forward_conv_structured_instantiations.json" + output_file = "experimental/builder/instances/forward_conv_structured_instantiations.json" + + if len(sys.argv) > 1: + input_file = sys.argv[1] + if len(sys.argv) > 2: + output_file = sys.argv[2] + + refactor_json(input_file, output_file)