mirror of
https://github.com/amd/blis.git
synced 2026-05-11 09:39:59 +00:00
Added experimental bli_gemm_ker_var5().
Details: - Added support for an experimental gemm macro-kernel that incrementally packs one micro-panel of B at a time. This is useful for certain special cases of gemm where m is small. - Minor changes to default values of the clarksville configuration. - Defined BLIS_PACKED_BLOCKS as part of the pack_t type, even though we do not yet have any use (or implementation support) for block storage. - Comment update to bli_packm_init.c.
This commit is contained in:
@@ -243,6 +243,12 @@
|
||||
#define bli_cndup BLIS_DEFAULT_NUM_DUPL_C
|
||||
#define bli_zndup BLIS_DEFAULT_NUM_DUPL_Z
|
||||
|
||||
// Incremental packing factors
|
||||
|
||||
#define bli_snifac BLIS_DEFAULT_NI_FAC
|
||||
#define bli_dnifac BLIS_DEFAULT_NI_FAC
|
||||
#define bli_cnifac BLIS_DEFAULT_NI_FAC
|
||||
#define bli_znifac BLIS_DEFAULT_NI_FAC
|
||||
|
||||
|
||||
#endif
|
||||
|
||||
@@ -89,6 +89,7 @@
|
||||
#define BLIS_BITVAL_PACKED_COLUMNS 0x40000
|
||||
#define BLIS_BITVAL_PACKED_ROW_PANELS 0x50000
|
||||
#define BLIS_BITVAL_PACKED_COL_PANELS 0x60000
|
||||
#define BLIS_BITVAL_PACKED_BLOCKS 0x70000
|
||||
#define BLIS_BITVAL_PACK_FWD_IF_UPPER 0x0
|
||||
#define BLIS_BITVAL_PACK_REV_IF_UPPER 0x80000
|
||||
#define BLIS_BITVAL_PACK_FWD_IF_LOWER 0x0
|
||||
@@ -195,7 +196,8 @@ typedef enum
|
||||
BLIS_PACKED_ROWS = BLIS_BITVAL_PACKED_ROWS,
|
||||
BLIS_PACKED_COLUMNS = BLIS_BITVAL_PACKED_COLUMNS,
|
||||
BLIS_PACKED_ROW_PANELS = BLIS_BITVAL_PACKED_ROW_PANELS,
|
||||
BLIS_PACKED_COL_PANELS = BLIS_BITVAL_PACKED_COL_PANELS
|
||||
BLIS_PACKED_COL_PANELS = BLIS_BITVAL_PACKED_COL_PANELS,
|
||||
BLIS_PACKED_BLOCKS = BLIS_BITVAL_PACKED_BLOCKS
|
||||
} pack_t;
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user