diff options
Diffstat (limited to 'kaldi_io/src/tools/ATLAS/include/atlas_kernel2.h')
-rw-r--r-- | kaldi_io/src/tools/ATLAS/include/atlas_kernel2.h | 5408 |
1 files changed, 5408 insertions, 0 deletions
diff --git a/kaldi_io/src/tools/ATLAS/include/atlas_kernel2.h b/kaldi_io/src/tools/ATLAS/include/atlas_kernel2.h new file mode 100644 index 0000000..4663def --- /dev/null +++ b/kaldi_io/src/tools/ATLAS/include/atlas_kernel2.h @@ -0,0 +1,5408 @@ +/* --------------------------------------------------------------------- + * + * -- Automatically Tuned Linear Algebra Software (ATLAS) + * (C) Copyright 2000 All Rights Reserved + * + * -- ATLAS routine -- Version 3.2 -- December 25, 2000 + * + * Author : Antoine P. Petitet + * Contributor(s) : R. Clint Whaley + * Originally developed at the University of Tennessee, + * Innovative Computing Laboratory, Knoxville TN, 37996-1301, USA. + * + * --------------------------------------------------------------------- + * + * -- Copyright notice and Licensing terms: + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions + * are met: + * + * 1. Redistributions of source code must retain the above copyright + * notice, this list of conditions and the following disclaimer. + * 2. Redistributions in binary form must reproduce the above copyright + * notice, this list of conditions, and the following disclaimer in + * the documentation and/or other materials provided with the distri- + * bution. + * 3. The name of the University, the ATLAS group, or the names of its + * contributors may not be used to endorse or promote products deri- + * ved from this software without specific written permission. + * + * -- Disclaimer: + * + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS + * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT + * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR + * A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE UNIVERSITY
+ * OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPE-
+ * CIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
+ * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,
+ * OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEO-
+ * RY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (IN-
+ * CLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ *
+ * ---------------------------------------------------------------------
+ */
+#ifndef ATLAS_KERNEL2_H
+#define ATLAS_KERNEL2_H
+/*
+ * =====================================================================
+ * Macro function definitions
+ * =====================================================================
+ *
+ * Alias macros: ATL_GetPartSBMV and ATL_GetPartSPMV both expand to
+ * ATL_GetPartSYMV, and ATL_GetPartP1 expands to ATL_GetPartR1.  None of
+ * the target names is defined in the visible part of this header.
+ *
+ * The M{L,U}{p,r}{prev,next}( n_, a_, lda_ ) macros are statement-like.
+ * Each expands to a bare { ... } block that assigns to its arguments, so
+ * a_ (and lda_ for the "p" forms) must be modifiable lvalues.  n_ is
+ * expanded more than once and should therefore be free of side effects.
+ * Because the expansion is a brace block and not do { } while (0), an
+ * unbraced "if (c) MLpnext(n, a, lda); else ..." does not parse; put
+ * braces around the invocation in that position.
+ *
+ * SHIFT is not defined in the visible part of this header.  It is pasted
+ * directly after the computed element offset, so it presumably expands
+ * either to nothing or to a trailing operator -- confirm against the
+ * headers that are included before this one.
+ */
+#define ATL_GetPartSBMV ATL_GetPartSYMV
+#define ATL_GetPartSPMV ATL_GetPartSYMV
+#define ATL_GetPartP1 ATL_GetPartR1
+/*
+ * "p" forms: a_ is moved and lda_ is changed in the same step.  The
+ * offset is computed from the value lda_ has before it is updated.
+ *
+ *   MLpprev:  a_ -= n_*lda_ + n_*(n_+1)/2 ;  lda_ += n_
+ *   MUpprev:  a_ -= n_*lda_ - n_*(n_-1)/2 ;  lda_ -= n_
+ *   MLpnext:  a_ += n_*lda_ - n_*(n_-1)/2 ;  lda_ -= n_
+ *   MUpnext:  a_ += n_*lda_ + n_*(n_+1)/2 ;  lda_ += n_
+ *
+ * (each offset is followed by SHIFT; the division by two is written as
+ * ">> 1").  For the same n_, MLpprev exactly undoes MLpnext and MUpprev
+ * exactly undoes MUpnext, for both a_ and lda_.
+ *
+ * NOTE(review): presumably these walk packed triangular storage in which
+ * the column length shrinks (L) or grows (U) by one per column -- this
+ * is inferred from the names and the arithmetic, confirm with callers.
+ */
+#define MLpprev( n_, a_, lda_ ) \
+   { a_ -= ( (((n_) * (lda_)) + (((n_)*((n_)+1)) >> 1)) SHIFT ); lda_ += (n_); }
+#define MUpprev( n_, a_, lda_ ) \
+   { a_ -= ( (((n_) * (lda_)) - (((n_)*((n_)-1)) >> 1)) SHIFT ); lda_ -= (n_); }
+#define MLpnext( n_, a_, lda_ ) \
+   { a_ += ( (((n_) * (lda_)) - (((n_)*((n_)-1)) >> 1)) SHIFT ); lda_ -= (n_); }
+#define MUpnext( n_, a_, lda_ ) \
+   { a_ += ( (((n_) * (lda_)) + (((n_)*((n_)+1)) >> 1)) SHIFT ); lda_ += (n_); }
+/*
+ * "r" forms: a_ is moved by n_*(lda_+1) elements (followed by SHIFT),
+ * backwards for the prev macros and forwards for the next macros.  lda_
+ * is read but never modified.  The L and U variants have identical
+ * bodies.
+ *
+ * NOTE(review): n_*(lda_+1) looks like n_ steps along the diagonal of a
+ * column-major array with leading dimension lda_ -- confirm with callers.
+ */
+#define MLrprev( n_, a_, lda_ ) \
+   { a_ -= ( ((n_) * ((lda_)+1)) SHIFT ); }
+#define MUrprev( n_, a_, lda_ ) \
+   { a_ -= ( ((n_) * ((lda_)+1)) SHIFT ); }
+#define MLrnext( n_, a_, lda_ ) \
+   { a_ += ( ((n_) * ((lda_)+1)) SHIFT ); }
+#define MUrnext( n_, a_, lda_ ) \
+   { a_ += ( ((n_) * ((lda_)+1)) SHIFT ); }
+/*
+ * =====================================================================
+ * Recursive Level 2 BLAS function prototypes
+ * =====================================================================
+ *
+ * All prototypes omit parameter names.  Several of them use
+ * enum ATLAS_DIAG, enum ATLAS_UPLO or enum ATLAS_TRANS; no #include
+ * appears between the include guard and this point, so those enums must
+ * be declared by a header included before this one.
+ */
+void ATL_strsvLTU
+(
+   const int, +
const float *, const int, + float * +);
+/*
+ * Naming pattern visible in the declarations that follow:
+ * ATL_<p><op><suffix>, with p = s for the float set and p = d for the
+ * double set.  In the tr / tp / tb families the three-letter suffixes
+ * (LTU ... UNN) take no enum argument, while the two-letter suffixes
+ * (LT, LN, UT, UN) take a leading enum ATLAS_DIAG.
+ *
+ * NOTE(review): presumably L/U = lower/upper, T/N = transpose or not,
+ * and the trailing U/N = unit or non-unit diagonal, as in the reference
+ * BLAS -- this is inferred from the names only, confirm.
+ */
+void ATL_strsvLNU +( + const int, + const float *, const int, + float * +); +
+void ATL_strsvLTN +( + const int, + const float *, const int, + float * +); +
+void ATL_strsvLNN +( + const int, + const float *, const int, + float * +); +
+void ATL_strsvUTU +( + const int, + const float *, const int, + float * +); +
+void ATL_strsvUNU +( + const int, + const float *, const int, + float * +); +
+void ATL_strsvUTN +( + const int, + const float *, const int, + float * +); +
+void ATL_strsvUNN +( + const int, + const float *, const int, + float * +); +
+void ATL_strsvLT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_strsvLN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_strsvUT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_strsvUN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +);
+/* ATL_stpsv*: same two signature shapes as ATL_strsv*. */
+void ATL_stpsvLTU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvLNU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvLTN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvLNN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvUTU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvUNU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvUTN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvUNN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpsvLT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_stpsvLN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_stpsvUT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_stpsvUN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +);
+/* ATL_stbsv*: as ATL_strsv* but with two leading ints instead of one (presumably size and bandwidth -- confirm). */
+void ATL_stbsvLTU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvLNU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvLTN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvLNN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvUTU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvUNU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvUTN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvUNN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvLT +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvLN +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvUT +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbsvUN +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +);
+/* ATL_strmv*: same two signature shapes as ATL_strsv*. */
+void ATL_strmvLTU +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvLNU +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvLTN +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvLNN +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvUTU +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvUNU +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvUTN +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvUNN +( + const int, + const float *, const int, + float * +); +
+void ATL_strmvLT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_strmvLN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_strmvUT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_strmvUN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +);
+/* ATL_stpmv*: same two signature shapes as ATL_strsv*. */
+void ATL_stpmvLTU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvLNU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvLTN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvLNN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvUTU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvUNU +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvUTN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvUNN +( + const int, + const float *, const int, + float * +); +
+void ATL_stpmvLT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_stpmvLN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_stpmvUT +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +); +
+void ATL_stpmvUN +( + const enum ATLAS_DIAG, + const int, + const float *, const int, + float * +);
+/* ATL_stbmv*: same two signature shapes as ATL_stbsv* (two leading ints). */
+void ATL_stbmvLTU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvLNU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvLTN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvLNN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvUTU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvUNU +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvUTN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvUNN +( + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvLT +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvLN +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvUT +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +); +
+void ATL_stbmvUN +( + const enum ATLAS_DIAG, + const int, const int, + const float *, const int, + float * +);
+/*
+ * ATL_ssyr2 / ATL_sspr2 / ATL_ssyr / ATL_sspr, U and L variants.  In each
+ * of them the only non-const pointer is the second-to-last argument, and
+ * the second argument is a const float * (not a float by value).
+ * NOTE(review): presumably rank-1 / rank-2 update kernels -- name-based.
+ */
+void ATL_ssyr2U +( + const int, + const float *, + const float *, + float *, const int +); +
+void ATL_ssyr2L +( + const int, + const float *, + const float *, + float *, const int +); +
+void ATL_sspr2U +( + const int, + const float *, + const float *, + float *, const int +); +
+void ATL_sspr2L +( + const int, + const float *, + const float *, + float *, const int +); +
+void ATL_ssyrU +( + const int, + const float *, + const float *, const int, + float *, const int +); +
+void ATL_ssyrL +( + const int, + const float *, + const float *, const int, + float *, const int +); +
+void ATL_ssprU +( + const int, + const float *, + const float *, const int, + float *, const int +); +
+void ATL_ssprL +( + const int, + const float *, + const float *, const int, + float *, const int +);
+/*
+ * ATL_ssymv / ATL_sspmv / ATL_ssbmv, U and L variants.  The last argument
+ * is the only non-const pointer and is preceded by a const float passed
+ * by value; the sbmv forms take two leading ints instead of one.
+ */
+void ATL_ssymvU +( + const int, + const float *, const int, + const float *, + const float, + float * +); +
+void ATL_ssymvL +( + const int, + const float *, const int, + const float *, + const float, + float * +); +
+void ATL_sspmvU +( + const int, + const float *, const int, + const float *, + const float, + float * +); +
+void ATL_sspmvL +( + const int, + const float *, const int, + const float *, + const float, + float * +); +
+void ATL_ssbmvU +( + const int, const int, + const float *, const int, + const float *, + const float, + float * +); +
+void ATL_ssbmvL +( + const int, const int, + const float *, const int, + const float *, + const float, + float * +);
+/*
+ * ATL_sgpmv and ATL_sgpr take enum selectors (ATLAS_UPLO, plus
+ * ATLAS_TRANS for gpmv).  ATL_sgprU, ATL_sgprL and the two
+ * ATL_sgpr1?_a1_x1_yX variants have the argument list of ATL_sgpr
+ * without the enum.
+ */
+void ATL_sgpmv +( + const enum ATLAS_UPLO, const enum ATLAS_TRANS, + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgprU +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + float *, const int +); +
+void ATL_sgprL +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + float *, const int +); +
+void ATL_sgpr +( + const enum ATLAS_UPLO, + const int, const int, + const float, + const float *, const int, + const float *, const int, + float *, const int +); +
+void ATL_sgpr1U_a1_x1_yX +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + float *, const int +); +
+void ATL_sgpr1L_a1_x1_yX +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + float *, const int +);
+/*
+ * ATL_sgpmv{U,L}{T,N}_a1_x1_b{X,1,0}_y1: twelve declarations sharing one
+ * signature, which is that of ATL_sgpmv without its two enum arguments.
+ * NOTE(review): the suffix presumably encodes alpha = 1, incX = 1,
+ * beta = X / 1 / 0 and incY = 1 -- name-based, confirm.
+ */
+void ATL_sgpmvUT_a1_x1_bX_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvUN_a1_x1_bX_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvUT_a1_x1_b1_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvUN_a1_x1_b1_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvUT_a1_x1_b0_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvUN_a1_x1_b0_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvLT_a1_x1_bX_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvLN_a1_x1_bX_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvLT_a1_x1_b1_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvLN_a1_x1_b1_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvLT_a1_x1_b0_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgpmvLN_a1_x1_b0_y1 +( + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +);
+/* ATL_sgbmv{T,N}_a1_x1_b{X,1,0}_y1: as the gpmv variants above, but with four leading ints instead of two. */
+void ATL_sgbmvT_a1_x1_bX_y1 +( + const int, const int, + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgbmvN_a1_x1_bX_y1 +( + const int, const int, + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgbmvT_a1_x1_b1_y1 +( + const int, const int, + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgbmvN_a1_x1_b1_y1 +( + const int, const int, + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgbmvT_a1_x1_b0_y1 +( + const int, const int, + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +); +
+void ATL_sgbmvN_a1_x1_b0_y1 +( + const int, const int, + const int, const int, + const float, + const float *, const int, + const float *, const int, + const float, + float *, const int +);
+/*
+ * Double set.  The declarations from here on repeat the float tr / tp / tb
+ * families with float replaced by double, as far as this listing goes:
+ * it is cut off inside ATL_dtpmvUN.
+ */
+void ATL_dtrsvLTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvLNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvLTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvLNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvUTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvUNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvUTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvUNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvLT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvLN +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvUT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtrsvUN +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +);
+/* ATL_dtpsv*: same two signature shapes as ATL_dtrsv*. */
+void ATL_dtpsvLTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvLNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvLTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvLNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvUTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvUNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvUTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvUNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvLT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvLN +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvUT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtpsvUN +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +);
+/* ATL_dtbsv*: as ATL_dtrsv* but with two leading ints instead of one. */
+void ATL_dtbsvLTU +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvLNU +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvLTN +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvLNN +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvUTU +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvUNU +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvUTN +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvUNN +( + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvLT +( + const enum ATLAS_DIAG, + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvLN +( + const enum ATLAS_DIAG, + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvUT +( + const enum ATLAS_DIAG, + const int, const int, + const double *, const int, + double * +); +
+void ATL_dtbsvUN +( + const enum ATLAS_DIAG, + const int, const int, + const double *, const int, + double * +);
+/* ATL_dtrmv*: same two signature shapes as ATL_dtrsv*. */
+void ATL_dtrmvLTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvLNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvLTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvLNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvUTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvUNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvUTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvUNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvLT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvLN +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvUT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtrmvUN +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +);
+/* ATL_dtpmv*: same two signature shapes as ATL_dtrsv*; the last declaration below is truncated in this listing. */
+void ATL_dtpmvLTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvLNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvLTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvLNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvUTU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvUNU +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvUTN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvUNN +( + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvLT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvLN +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvUT +( + const enum ATLAS_DIAG, + const int, + const double *, const int, + double * +); +
+void ATL_dtpmvUN +( + const enum ATLAS_DIAG, + const int, |