mirror of
https://github.com/amd/blis.git
synced 2026-04-19 23:28:52 +00:00
Tuned decision logic for DGEMV multithreading for skinny sizes. (#301)
AMD-Internal: [CPUPL-7769]
This commit is contained in:
@@ -4,7 +4,7 @@
 An object-based framework for developing high-performance BLAS-like
 libraries.

-Copyright (C) 2025, Advanced Micro Devices, Inc. All rights reserved.
+Copyright (C) 2025-26, Advanced Micro Devices, Inc. All rights reserved.

 Redistribution and use in source and binary forms, with or without
 modification, are permitted provided that the following conditions are
@@ -1511,7 +1511,7 @@ void bli_dgemv_n_zen4_int (

 {
 #ifdef BLIS_ENABLE_OPENMP
-if ( m < 1250 || size >= (700000 * 128))
+if (( m < 1250 ) || ( size >= (700000 * 128) && ( m / n ) < 10000 ))
 {
 ker_ft = bli_dgemv_m_zen4_int_40x8_mt_Ndiv;
 }
Reference in New Issue
Block a user