mirror of
https://github.com/amd/blis.git
synced 2026-05-11 17:50:00 +00:00
Fix for sblat3.x failure in make check
Details: ymm registers, which store 8 float values, were used instead of xmm registers, which store 4 float values. Changed the registers from ymm to xmm in the required places. The failure can be observed only when the leading dimension is greater than the actual dimension. Change-Id: I39f04eac18c4fa3a8c93048c977d6a83aa92b800
This commit is contained in:
@@ -290,9 +290,9 @@ void bli_sgemmsup_rd_zen_asm_2x16
|
||||
label(.SBETAZERO)
|
||||
|
||||
label(.SROWSTORBZ)
|
||||
vmovups(ymm4, mem(rcx))
|
||||
vmovups(xmm4, mem(rcx))
|
||||
add(rdi, rcx)
|
||||
vmovups(ymm5, mem(rcx))
|
||||
vmovups(xmm5, mem(rcx))
|
||||
|
||||
label(.SDONE)
|
||||
add(imm(4), r15) // jj += 4;
|
||||
@@ -817,9 +817,9 @@ void bli_sgemmsup_rd_zen_asm_2x8
|
||||
label(.SBETAZERO)
|
||||
|
||||
label(.SROWSTORBZ)
|
||||
vmovups(ymm4, mem(rcx))
|
||||
vmovups(xmm4, mem(rcx))
|
||||
add(rdi, rcx)
|
||||
vmovups(ymm5, mem(rcx))
|
||||
vmovups(xmm5, mem(rcx))
|
||||
|
||||
label(.SDONE)
|
||||
|
||||
@@ -1051,7 +1051,7 @@ void bli_sgemmsup_rd_zen_asm_1x8
|
||||
label(.SBETAZERO)
|
||||
|
||||
label(.SROWSTORBZ)
|
||||
vmovups(ymm4, mem(rcx))
|
||||
vmovups(xmm4, mem(rcx))
|
||||
|
||||
label(.SDONE)
|
||||
add(imm(4), r15) // jj += 4;
|
||||
@@ -1323,9 +1323,9 @@ void bli_sgemmsup_rd_zen_asm_2x4
|
||||
label(.SBETAZERO)
|
||||
|
||||
label(.SROWSTORBZ)
|
||||
vmovups(ymm4, mem(rcx))
|
||||
vmovups(xmm4, mem(rcx))
|
||||
add(rdi, rcx)
|
||||
vmovups(ymm5, mem(rcx))
|
||||
vmovups(xmm5, mem(rcx))
|
||||
label(.SDONE)
|
||||
end_asm(
|
||||
: // output operands (none)
|
||||
@@ -1536,7 +1536,7 @@ void bli_sgemmsup_rd_zen_asm_1x4
|
||||
|
||||
label(.SBETAZERO)
|
||||
label(.SROWSTORBZ)
|
||||
vmovups(ymm4, mem(rcx))
|
||||
vmovups(xmm4, mem(rcx))
|
||||
|
||||
label(.SDONE)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user