Files
blis/frame/0/bli_l0_tapi.c
Field G. Van Zee 86969873b5 Reclassified amaxv operation as a level-1v kernel.
Details:
- Moved amaxv from being a utility operation to being a level-1v operation.
  This includes the establishment of a new amaxv kernel to live beside all
  of the other level-1v kernels.
- Added two new functions to bli_part.c:
    bli_acquire_mij()
    bli_acquire_vi()
  The first acquires a scalar object for the (i,j) element of a matrix,
  and the second acquires a scalar object for the ith element of a vector.
- Added integer support to bli_getsc level-0 operation. This involved
  adding integer support to the bli_*gets level-0 scalar macros.
- Added a new test module to test amaxv as a level-1v operation. The test
  module works by comparing the value identified by bli_amaxv() to the
  value found from reference-like code local to the test module
  source file. In other words, it (intentionally) does not guarantee the
  same index is found; only the same value. This allows for different
  implementations in the case where a vector contains two or more elements
  containing exactly the same floating point value (or values, in the case
  of the complex domain).
- Removed the directory frame/include/old/.
2016-10-04 14:24:59 -05:00

252 lines
5.5 KiB
C

/*
BLIS
An object-based framework for developing high-performance BLAS-like
libraries.
Copyright (C) 2014, The University of Texas at Austin
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are
met:
- Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.
- Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in the
documentation and/or other materials provided with the distribution.
- Neither the name of The University of Texas at Austin nor the names
of its contributors may be used to endorse or promote products
derived from this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "blis.h"
//
// Define BLAS-like interfaces with typed operands.
//
// Template for typed two-operand scalar operations that read chi and
// update psi in place. The template is instantiated below as:
//   addsc  using the adds     scalar kernel
//   divsc  using the invscals scalar kernel
//   subsc  using the subs     scalar kernel
// Parameters of each generated function:
//   conjchi - conjugation selector handed to the copycjs macro
//   chi     - pointer to the input scalar; never written through here
//   psi     - pointer to the scalar handed to the kernel as its second
//             operand (presumably the in/out operand -- confirm against
//             the scalar macro definitions)
#undef  GENTFUNC
#define GENTFUNC( ctype, ch, opname, kername ) \
\
void PASTEMAC(ch,opname)( conj_t conjchi, ctype* chi, ctype* psi ) \
{ \
    ctype chi_local; \
\
    /* Stage *chi in a local via copycjs (which receives conjchi), so that \
       the kernel below never operates on the caller's chi directly. */ \
    PASTEMAC(ch,copycjs)( conjchi, *chi, chi_local ); \
\
    /* Hand the staged value and *psi to the selected scalar kernel. */ \
    PASTEMAC(ch,kername)( chi_local, *psi ); \
}

INSERT_GENTFUNC_BASIC( addsc, adds )
INSERT_GENTFUNC_BASIC( divsc, invscals )
INSERT_GENTFUNC_BASIC( subsc, subs )
// Template for typed one-operand scalar operations that update chi in
// place. Instantiated below as invertsc using the inverts scalar kernel.
// Parameters of each generated function:
//   conjchi - conjugation selector handed to the copycjs macro
//   chi     - pointer to the scalar; read first, then overwritten with
//             the result
#undef  GENTFUNC
#define GENTFUNC( ctype, ch, opname, kername ) \
\
void PASTEMAC(ch,opname)( conj_t conjchi, ctype* chi ) \
{ \
    ctype chi_local; \
\
    /* Stage *chi in a local via copycjs (which receives conjchi). */ \
    PASTEMAC(ch,copycjs)( conjchi, *chi, chi_local ); \
\
    /* Run the kernel on the local copy only. */ \
    PASTEMAC(ch,kername)( chi_local ); \
\
    /* Store the local back into the caller's scalar. */ \
    PASTEMAC(ch,copys)( chi_local, *chi ); \
}

INSERT_GENTFUNC_BASIC( invertsc, inverts )
// Template for typed scalar multiplication. Instantiated below as mulsc
// using the scals scalar kernel.
// Parameters of each generated function:
//   conjchi - conjugation selector handed to the copycjs macro
//   chi     - pointer to the input scalar; never written through here
//   psi     - pointer to the scalar that is updated in place
// The eq0 test is applied to *chi before any conjugation is requested.
#undef  GENTFUNC
#define GENTFUNC( ctype, ch, opname, kername ) \
\
void PASTEMAC(ch,opname)( conj_t conjchi, ctype* chi, ctype* psi ) \
{ \
    ctype chi_local; \
\
    if ( PASTEMAC(ch,eq0)( *chi ) ) \
    { \
        /* Special case: when the eq0 test on chi succeeds, psi is reset \
           with set0s instead of being passed through the kernel, so any \
           Infs or NaNs already stored in psi are overwritten. */ \
        PASTEMAC(ch,set0s)( *psi ); \
        return; \
    } \
\
    /* General case: stage chi via copycjs, then invoke the kernel. */ \
    PASTEMAC(ch,copycjs)( conjchi, *chi, chi_local ); \
    PASTEMAC(ch,kername)( chi_local, *psi ); \
}

INSERT_GENTFUNC_BASIC( mulsc, scals )
// Template for the typed "absolute value squared" operation, instantiated
// below as absqsc.
// Parameters of each generated function:
//   chi  - pointer to the input scalar (type ctype)
//   absq - pointer to the output, stored in the real projection type
//          ctype_r
#undef  GENTFUNCR
#define GENTFUNCR( ctype, ctype_r, ch, chr, opname ) \
\
void PASTEMAC(ch,opname)( ctype* chi, ctype_r* absq ) \
{ \
    ctype_r chi_re; \
    ctype_r chi_im; \
    ctype_r absq_im; \
\
    /* Split chi into its two components. */ \
    PASTEMAC2(ch,chr,gets)( *chi, chi_re, chi_im ); \
\
    /* absq    = chi_re * chi_re + chi_im * chi_im; \
       absq_im = 0.0; (thrown away) */ \
    PASTEMAC(ch,absq2ris)( chi_re, chi_im, *absq, absq_im ); \
\
    /* Void-cast the locals that are otherwise not read in this function \
       (presumably to silence unused-variable warnings for some \
       datatypes -- confirm against the macro definitions). */ \
    ( void )absq_im; \
    ( void )chi_im; \
}

INSERT_GENTFUNCR_BASIC0( absqsc )
// Template for the typed scalar norm operation, instantiated below as
// normfsc.
// Parameters of each generated function:
//   chi  - pointer to the input scalar (type ctype)
//   norm - pointer to the output, stored in the real projection type
//          ctype_r
#undef  GENTFUNCR
#define GENTFUNCR( ctype, ctype_r, ch, chr, opname ) \
\
void PASTEMAC(ch,opname)( ctype* chi, ctype_r* norm ) \
{ \
    /* Delegates entirely to abval2s: \
       norm = sqrt( chi_r * chi_r + chi_i * chi_i ); */ \
    PASTEMAC2(ch,chr,abval2s)( *chi, *norm ); \
}

INSERT_GENTFUNCR_BASIC0( normfsc )
// Template for the typed scalar square root operation, instantiated
// below as sqrtsc.
// Parameters of each generated function:
//   chi - pointer to the input scalar
//   psi - pointer to the output scalar (same type as chi)
#undef  GENTFUNC
#define GENTFUNC( ctype, ch, opname ) \
\
void PASTEMAC(ch,opname)( ctype* chi, ctype* psi ) \
{ \
    /* NOTE: in the complex domain, sqrtsc/sqrt2s is not the same \
       operation as normfsc/abval2s. */ \
    PASTEMAC(ch,sqrt2s)( *chi, *psi ); \
}

INSERT_GENTFUNC_BASIC0( sqrtsc )
// Template for extracting a typed scalar into a pair of doubles,
// instantiated below as getsc.
// Parameters of each generated function:
//   chi    - pointer to the input scalar (type ctype)
//   zeta_r - pointer to a double receiving the first output of gets
//   zeta_i - pointer to a double receiving the second output of gets
// Judging by the parameter names, the two outputs are the real and
// imaginary components of chi -- confirm against the gets macros.
#undef  GENTFUNC
#define GENTFUNC( ctype, ch, opname ) \
\
void PASTEMAC(ch,opname)( ctype* chi, double* zeta_r, double* zeta_i ) \
{ \
    /* Use the (ch,d) flavor of gets: source type ch, destinations d. */ \
    PASTEMAC2(ch,d,gets)( *chi, *zeta_r, *zeta_i ); \
}

INSERT_GENTFUNC_BASIC0( getsc )
// Template for assigning a typed scalar from a pair of doubles,
// instantiated below as setsc.
// Parameters of each generated function:
//   zeta_r - first double input handed to sets
//   zeta_i - second double input handed to sets
//   chi    - pointer to the scalar that is overwritten (type ctype)
// Judging by the parameter names, the two inputs are the real and
// imaginary components to store -- confirm against the sets macros.
#undef  GENTFUNC
#define GENTFUNC( ctype, ch, opname ) \
\
void PASTEMAC(ch,opname)( double zeta_r, double zeta_i, ctype* chi ) \
{ \
    /* Use the (d,ch) flavor of sets: sources d, destination type ch. */ \
    PASTEMAC2(d,ch,sets)( zeta_r, zeta_i, *chi ); \
}

INSERT_GENTFUNC_BASIC0( setsc )
// Template for splitting a typed scalar into two scalars of its real
// projection type, instantiated below as unzipsc.
// Parameters of each generated function:
//   chi    - pointer to the input scalar (type ctype)
//   zeta_r - pointer to a ctype_r receiving the first output of gets
//   zeta_i - pointer to a ctype_r receiving the second output of gets
// Unlike getsc, the outputs use ctype_r rather than a fixed double.
#undef  GENTFUNCR
#define GENTFUNCR( ctype, ctype_r, ch, chr, opname ) \
\
void PASTEMAC(ch,opname)( ctype* chi, ctype_r* zeta_r, ctype_r* zeta_i ) \
{ \
    /* Use the (ch,chr) flavor of gets: source ch, destinations chr. */ \
    PASTEMAC2(ch,chr,gets)( *chi, *zeta_r, *zeta_i ); \
}

INSERT_GENTFUNCR_BASIC0( unzipsc )
// Template for assembling a typed scalar from two scalars of its real
// projection type, instantiated below as zipsc.
// Parameters of each generated function:
//   zeta_r - pointer to the first ctype_r input handed to sets
//   zeta_i - pointer to the second ctype_r input handed to sets
//   chi    - pointer to the scalar that is overwritten (type ctype)
// Unlike setsc, the inputs are passed by pointer and use ctype_r rather
// than a fixed double.
#undef  GENTFUNCR
#define GENTFUNCR( ctype, ctype_r, ch, chr, opname ) \
\
void PASTEMAC(ch,opname)( ctype_r* zeta_r, ctype_r* zeta_i, ctype* chi ) \
{ \
    /* Use the (chr,ch) flavor of sets: sources chr, destination ch. */ \
    PASTEMAC2(chr,ch,sets)( *zeta_r, *zeta_i, *chi ); \
}

INSERT_GENTFUNCR_BASIC0( zipsc )
// -----------------------------------------------------------------------------
// Integer counterpart of the templated getsc functions: extracts the
// dim_t scalar at chi into a pair of doubles.
//   chi    - pointer to the integer input scalar
//   zeta_r - pointer to a double receiving the first output of gets
//   zeta_i - pointer to a double receiving the second output of gets
// What the integer gets macro stores in *zeta_i is not visible from this
// file -- confirm against the macro definition.
void bli_igetsc( dim_t* chi, double* zeta_r, double* zeta_i )
{
    // Use the (i,d) flavor of gets: integer source, double destinations.
    PASTEMAC2(i,d,gets)( *chi, *zeta_r, *zeta_i );
}
// Integer counterpart of the templated setsc functions: assigns the
// dim_t scalar at chi from a pair of doubles.
//   zeta_r - first double input handed to sets
//   zeta_i - second double input handed to sets
//   chi    - pointer to the integer scalar that is overwritten
// How the integer sets macro treats zeta_i is not visible from this
// file -- confirm against the macro definition.
void bli_isetsc( double zeta_r, double zeta_i, dim_t* chi )
{
    // Use the (d,i) flavor of sets: double sources, integer destination.
    PASTEMAC2(d,i,sets)( zeta_r, zeta_i, *chi );
}