cavis/libnd4j/include/cblas.h

665 lines
29 KiB
C
Raw Normal View History

2019-06-06 14:21:15 +02:00
/*******************************************************************************
* Copyright (c) 2015-2018 Skymind, Inc.
*
* This program and the accompanying materials are made available under the
* terms of the Apache License, Version 2.0 which is available at
* https://www.apache.org/licenses/LICENSE-2.0.
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations
* under the License.
*
* SPDX-License-Identifier: Apache-2.0
******************************************************************************/
//
// Created by agibsonccc on 1/26/16.
//
#ifndef NATIVEOPERATIONS_CBLAS_H
#define NATIVEOPERATIONS_CBLAS_H
#ifndef __STANDALONE_BUILD__
#include "config.h"
#endif
#ifdef __MKL_CBLAS_H__
// CBLAS from MKL is already included
#define CBLAS_H
#endif
#ifdef HAVE_MKLDNN
Platform helpers (#8216) * platform helpers draft Signed-off-by: raver119 <raver119@gmail.com> * typo Signed-off-by: raver119 <raver119@gmail.com> * disable platform cmake Signed-off-by: raver119 <raver119@gmail.com> * another draft Signed-off-by: raver119 <raver119@gmail.com> * mkldnn convolution refactored Signed-off-by: raver119 <raver119@gmail.com> * minor tweaks Signed-off-by: raver119 <raver119@gmail.com> * one more safety check Signed-off-by: raver119 <raver119@gmail.com> * prototype works Signed-off-by: raver119 <raver119@gmail.com> * meh Signed-off-by: raver119 <raver119@gmail.com> * force static library mode for mkldnn Signed-off-by: raver119 <raver119@gmail.com> * - ismax fix - experimental arg fix - don't enforce openblas on Apple hardware Signed-off-by: raver119 <raver119@gmail.com> * bunch of small fixes Signed-off-by: raver119@gmail.com <raver119@gmail.com> * declare concurrent Signed-off-by: raver119@gmail.com <raver119@gmail.com> * - MKLDNN version upgrade to 1.0.2 - avgpool2d/maxpool2d APIs update Signed-off-by: raver119 <raver119@gmail.com> * - avgpool2d_bp/maxpool2d_bp APIs update Signed-off-by: raver119 <raver119@gmail.com> * - conv2d/batchnorm APIs update Signed-off-by: raver119 <raver119@gmail.com> * - lrn/conv2d_bp/conv3d/conv3d_bp APIs update Signed-off-by: raver119 <raver119@gmail.com> * all ops converted to MKLDNN 1.x Signed-off-by: raver119 <raver119@gmail.com> * bunch of tweaks Signed-off-by: raver119 <raver119@gmail.com> * namespace for platform helpers Signed-off-by: raver119 <raver119@gmail.com> * make sure platform helpers aren't opimized out Signed-off-by: raver119 <raver119@gmail.com> * build cpu_features on x86 systems Signed-off-by: raver119 <raver119@gmail.com> * build cpu_features on x86 systems Signed-off-by: raver119 <raver119@gmail.com> * more of cpu_features Signed-off-by: raver119 <raver119@gmail.com> * - mkldnn removed from java - cpu_features checks in CpuNDArrayFactory Signed-off-by: raver119 <raver119@gmail.com> * F16C definition renamed Signed-off-by: raver119 <raver119@gmail.com> * some mkldnn rearrangements Signed-off-by: raver119 <raver119@gmail.com> * check supported instructions before doing anything Signed-off-by: raver119 <raver119@gmail.com> * typo Signed-off-by: raver119 <raver119@gmail.com> * missied impl Signed-off-by: raver119 <raver119@gmail.com> * BUILD_PIC option Signed-off-by: raver119 <raver119@gmail.com> * conv2d fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool3d fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool3d_bp fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool2d_bp leak fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool3d_bp leak fix Signed-off-by: raver119 <raver119@gmail.com> * maxpool bp leaks fixed Signed-off-by: raver119 <raver119@gmail.com> * printf removed Signed-off-by: raver119 <raver119@gmail.com> * batchnorm fix Signed-off-by: raver119 <raver119@gmail.com> * AVX warning/error polishing Signed-off-by: AlexDBlack <blacka101@gmail.com> * Fix Signed-off-by: AlexDBlack <blacka101@gmail.com> * More polish Signed-off-by: AlexDBlack <blacka101@gmail.com> * Polish Signed-off-by: AlexDBlack <blacka101@gmail.com> * remove previous MKL-DNN support layer Signed-off-by: raver119 <raver119@gmail.com> * avx2 tweak Signed-off-by: raver119 <raver119@gmail.com> * allow static for apple Signed-off-by: raver119@gmail.com <raver119@gmail.com> * exclude mkldnn in one more place Signed-off-by: raver119 <raver119@gmail.com> * exclude mkldnn in one more place Signed-off-by: raver119 <raver119@gmail.com> * restore OPENBLAS_PATH use Signed-off-by: raver119 <raver119@gmail.com> * add runtime check for avx/avx2 support Signed-off-by: raver119 <raver119@gmail.com> * convolution_auto Signed-off-by: raver119 <raver119@gmail.com> * Add logic for helper argument * minor test fix Signed-off-by: raver119 <raver119@gmail.com> * few tweaks Signed-off-by: raver119 <raver119@gmail.com> * few tweaks Signed-off-by: raver119 <raver119@gmail.com> * skip OpTracker props for non-x86 builds Signed-off-by: raver119 <raver119@gmail.com> * linux arm isn't x86 :) Signed-off-by: raver119 <raver119@gmail.com> * avx-512 Signed-off-by: raver119 <raver119@gmail.com> * CUDA presets fix Signed-off-by: raver119 <raver119@gmail.com> * BUILD_PIC Signed-off-by: raver119 <raver119@gmail.com> * prefetchw for avx2 Signed-off-by: raver119 <raver119@gmail.com> * BUILD_PIC again Signed-off-by: raver119 <raver119@gmail.com>
2019-09-11 20:50:28 +02:00
// FIXME: latest mkldnn doesn't ship mklml anymore?
2019-06-06 14:21:15 +02:00
// include CBLAS from MKL-DNN
Platform helpers (#8216) * platform helpers draft Signed-off-by: raver119 <raver119@gmail.com> * typo Signed-off-by: raver119 <raver119@gmail.com> * disable platform cmake Signed-off-by: raver119 <raver119@gmail.com> * another draft Signed-off-by: raver119 <raver119@gmail.com> * mkldnn convolution refactored Signed-off-by: raver119 <raver119@gmail.com> * minor tweaks Signed-off-by: raver119 <raver119@gmail.com> * one more safety check Signed-off-by: raver119 <raver119@gmail.com> * prototype works Signed-off-by: raver119 <raver119@gmail.com> * meh Signed-off-by: raver119 <raver119@gmail.com> * force static library mode for mkldnn Signed-off-by: raver119 <raver119@gmail.com> * - ismax fix - experimental arg fix - don't enforce openblas on Apple hardware Signed-off-by: raver119 <raver119@gmail.com> * bunch of small fixes Signed-off-by: raver119@gmail.com <raver119@gmail.com> * declare concurrent Signed-off-by: raver119@gmail.com <raver119@gmail.com> * - MKLDNN version upgrade to 1.0.2 - avgpool2d/maxpool2d APIs update Signed-off-by: raver119 <raver119@gmail.com> * - avgpool2d_bp/maxpool2d_bp APIs update Signed-off-by: raver119 <raver119@gmail.com> * - conv2d/batchnorm APIs update Signed-off-by: raver119 <raver119@gmail.com> * - lrn/conv2d_bp/conv3d/conv3d_bp APIs update Signed-off-by: raver119 <raver119@gmail.com> * all ops converted to MKLDNN 1.x Signed-off-by: raver119 <raver119@gmail.com> * bunch of tweaks Signed-off-by: raver119 <raver119@gmail.com> * namespace for platform helpers Signed-off-by: raver119 <raver119@gmail.com> * make sure platform helpers aren't opimized out Signed-off-by: raver119 <raver119@gmail.com> * build cpu_features on x86 systems Signed-off-by: raver119 <raver119@gmail.com> * build cpu_features on x86 systems Signed-off-by: raver119 <raver119@gmail.com> * more of cpu_features Signed-off-by: raver119 <raver119@gmail.com> * - mkldnn removed from java - cpu_features checks in CpuNDArrayFactory Signed-off-by: raver119 <raver119@gmail.com> * F16C definition renamed Signed-off-by: raver119 <raver119@gmail.com> * some mkldnn rearrangements Signed-off-by: raver119 <raver119@gmail.com> * check supported instructions before doing anything Signed-off-by: raver119 <raver119@gmail.com> * typo Signed-off-by: raver119 <raver119@gmail.com> * missied impl Signed-off-by: raver119 <raver119@gmail.com> * BUILD_PIC option Signed-off-by: raver119 <raver119@gmail.com> * conv2d fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool3d fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool3d_bp fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool2d_bp leak fix Signed-off-by: raver119 <raver119@gmail.com> * avgpool3d_bp leak fix Signed-off-by: raver119 <raver119@gmail.com> * maxpool bp leaks fixed Signed-off-by: raver119 <raver119@gmail.com> * printf removed Signed-off-by: raver119 <raver119@gmail.com> * batchnorm fix Signed-off-by: raver119 <raver119@gmail.com> * AVX warning/error polishing Signed-off-by: AlexDBlack <blacka101@gmail.com> * Fix Signed-off-by: AlexDBlack <blacka101@gmail.com> * More polish Signed-off-by: AlexDBlack <blacka101@gmail.com> * Polish Signed-off-by: AlexDBlack <blacka101@gmail.com> * remove previous MKL-DNN support layer Signed-off-by: raver119 <raver119@gmail.com> * avx2 tweak Signed-off-by: raver119 <raver119@gmail.com> * allow static for apple Signed-off-by: raver119@gmail.com <raver119@gmail.com> * exclude mkldnn in one more place Signed-off-by: raver119 <raver119@gmail.com> * exclude mkldnn in one more place Signed-off-by: raver119 <raver119@gmail.com> * restore OPENBLAS_PATH use Signed-off-by: raver119 <raver119@gmail.com> * add runtime check for avx/avx2 support Signed-off-by: raver119 <raver119@gmail.com> * convolution_auto Signed-off-by: raver119 <raver119@gmail.com> * Add logic for helper argument * minor test fix Signed-off-by: raver119 <raver119@gmail.com> * few tweaks Signed-off-by: raver119 <raver119@gmail.com> * few tweaks Signed-off-by: raver119 <raver119@gmail.com> * skip OpTracker props for non-x86 builds Signed-off-by: raver119 <raver119@gmail.com> * linux arm isn't x86 :) Signed-off-by: raver119 <raver119@gmail.com> * avx-512 Signed-off-by: raver119 <raver119@gmail.com> * CUDA presets fix Signed-off-by: raver119 <raver119@gmail.com> * BUILD_PIC Signed-off-by: raver119 <raver119@gmail.com> * prefetchw for avx2 Signed-off-by: raver119 <raver119@gmail.com> * BUILD_PIC again Signed-off-by: raver119 <raver119@gmail.com>
2019-09-11 20:50:28 +02:00
//#include <mkl_cblas.h>
//#define CBLAS_H
2019-06-06 14:21:15 +02:00
#endif
#ifdef HAVE_OPENBLAS
// include CBLAS from OpenBLAS
#ifdef __GNUC__
#include_next <cblas.h>
#else
#include <cblas.h>
#endif
#define CBLAS_H
#endif
#ifndef CBLAS_H
#include <system/dll.h>
2019-06-06 14:21:15 +02:00
#ifdef __cplusplus
extern "C" {
#endif
#ifndef CBLAS_ENUM_DEFINED_H
#define CBLAS_ENUM_DEFINED_H
enum CBLAS_ORDER {CblasRowMajor=101, CblasColMajor=102 };
enum CBLAS_TRANSPOSE {CblasNoTrans=111, CblasTrans=112, CblasConjTrans=113,
AtlasConj=114};
enum CBLAS_UPLO {CblasUpper=121, CblasLower=122};
enum CBLAS_DIAG {CblasNonUnit=131, CblasUnit=132};
enum CBLAS_SIDE {CblasLeft=141, CblasRight=142};
#endif
#ifndef CBLAS_ENUM_ONLY
#define CBLAS_H
#define CBLAS_INDEX int
int cblas_errprn(int ierr, int info, char *form, ...);
void cblas_xerbla(int p, char *rout, char *form, ...);
#ifdef __MKL
void MKL_Set_Num_Threads(int num);
int MKL_Domain_Set_Num_Threads(int num, int domain);
int MKL_Set_Num_Threads_Local(int num);
#elif __OPENBLAS
void openblas_set_num_threads(int num);
#else
// do nothing
#endif
/*
* ===========================================================================
* Prototypes for level 1 BLAS functions (complex are recast as routines)
* ===========================================================================
*/
float cblas_sdsdot(int N, float alpha, float *X,
int incX, float *Y, int incY);
double cblas_dsdot(int N, float *X, int incX, float *Y,
int incY);
float cblas_sdot(int N, float *X, int incX,
float *Y, int incY);
double cblas_ddot(int N, double *X, int incX,
double *Y, int incY);
/*
* Functions having prefixes Z and C only
*/
void cblas_cdotu_sub(int N, void *X, int incX,
void *Y, int incY, void *dotu);
void cblas_cdotc_sub(int N, void *X, int incX,
void *Y, int incY, void *dotc);
void cblas_zdotu_sub(int N, void *X, int incX,
void *Y, int incY, void *dotu);
void cblas_zdotc_sub(int N, void *X, int incX,
void *Y, int incY, void *dotc);
/*
* Functions having prefixes S D SC DZ
*/
float cblas_snrm2(int N, float *X, int incX);
float cblas_sasum(int N, float *X, int incX);
double cblas_dnrm2(int N, double *X, int incX);
double cblas_dasum(int N, double *X, int incX);
float cblas_scnrm2(int N, void *X, int incX);
float cblas_scasum(int N, void *X, int incX);
double cblas_dznrm2(int N, void *X, int incX);
double cblas_dzasum(int N, void *X, int incX);
/*
* Functions having standard 4 prefixes (S D C Z)
*/
CBLAS_INDEX cblas_isamax(int N, float *X, int incX);
CBLAS_INDEX cblas_idamax(int N, double *X, int incX);
CBLAS_INDEX cblas_icamax(int N, void *X, int incX);
CBLAS_INDEX cblas_izamax(int N, void *X, int incX);
/*
* ===========================================================================
* Prototypes for level 1 BLAS routines
* ===========================================================================
*/
/*
* Routines with standard 4 prefixes (s, d, c, z)
*/
void cblas_sswap(int N, float *X, int incX,
float *Y, int incY);
void cblas_scopy(int N, float *X, int incX,
float *Y, int incY);
void cblas_saxpy(int N, float alpha, float *X,
int incX, float *Y, int incY);
void catlas_saxpby(int N, float alpha, float *X,
int incX, float beta, float *Y, int incY);
void catlas_sset
(int N, float alpha, float *X, int incX);
void cblas_dswap(int N, double *X, int incX,
double *Y, int incY);
void cblas_dcopy(int N, double *X, int incX,
double *Y, int incY);
void cblas_daxpy(int N, double alpha, double *X,
int incX, double *Y, int incY);
void catlas_daxpby(int N, double alpha, double *X,
int incX, double beta, double *Y, int incY);
void catlas_dset
(int N, double alpha, double *X, int incX);
void cblas_cswap(int N, void *X, int incX,
void *Y, int incY);
void cblas_ccopy(int N, void *X, int incX,
void *Y, int incY);
void cblas_caxpy(int N, void *alpha, void *X,
int incX, void *Y, int incY);
void catlas_caxpby(int N, void *alpha, void *X,
int incX, void *beta, void *Y, int incY);
void catlas_cset
(int N, void *alpha, void *X, int incX);
void cblas_zswap(int N, void *X, int incX,
void *Y, int incY);
void cblas_zcopy(int N, void *X, int incX,
void *Y, int incY);
void cblas_zaxpy(int N, void *alpha, void *X,
int incX, void *Y, int incY);
void catlas_zaxpby(int N, void *alpha, void *X,
int incX, void *beta, void *Y, int incY);
void catlas_zset
(int N, void *alpha, void *X, int incX);
/*
* Routines with S and D prefix only
*/
void cblas_srotg(float *a, float *b, float *c, float *s);
void cblas_srotmg(float *d1, float *d2, float *b1, float b2, float *P);
void cblas_srot(int N, float *X, int incX,
float *Y, int incY, float c, float s);
void cblas_srotm(int N, float *X, int incX,
float *Y, int incY, float *P);
void cblas_drotg(double *a, double *b, double *c, double *s);
void cblas_drotmg(double *d1, double *d2, double *b1, double b2, double *P);
void cblas_drot(int N, double *X, int incX,
double *Y, int incY, double c, double s);
void cblas_drotm(int N, double *X, int incX,
double *Y, int incY, double *P);
/*
* Routines with S D C Z CS and ZD prefixes
*/
void cblas_sscal(int N, float alpha, float *X, int incX);
void cblas_dscal(int N, double alpha, double *X, int incX);
void cblas_cscal(int N, void *alpha, void *X, int incX);
void cblas_zscal(int N, void *alpha, void *X, int incX);
void cblas_csscal(int N, float alpha, void *X, int incX);
void cblas_zdscal(int N, double alpha, void *X, int incX);
/*
* Extra reference routines provided by ATLAS, but not mandated by the standard
*/
void cblas_crotg(void *a, void *b, void *c, void *s);
void cblas_zrotg(void *a, void *b, void *c, void *s);
void cblas_csrot(int N, void *X, int incX, void *Y, int incY,
float c, float s);
void cblas_zdrot(int N, void *X, int incX, void *Y, int incY,
double c, double s);
/*
* ===========================================================================
* Prototypes for level 2 BLAS
* ===========================================================================
*/
/*
* Routines with standard 4 prefixes (S, D, C, Z)
*/
void cblas_sgemv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
float alpha, float *A, int lda,
float *X, int incX, float beta,
float *Y, int incY);
void cblas_sgbmv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
int KL, int KU, float alpha,
float *A, int lda, float *X,
int incX, float beta, float *Y, int incY);
void cblas_strmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, float *A, int lda,
float *X, int incX);
void cblas_stbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, float *A, int lda,
float *X, int incX);
void cblas_stpmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, float *Ap, float *X, int incX);
void cblas_strsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, float *A, int lda, float *X,
int incX);
void cblas_stbsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, float *A, int lda,
float *X, int incX);
void cblas_stpsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, float *Ap, float *X, int incX);
void cblas_dgemv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
double alpha, double *A, int lda,
double *X, int incX, double beta,
double *Y, int incY);
void cblas_dgbmv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
int KL, int KU, double alpha,
double *A, int lda, double *X,
int incX, double beta, double *Y, int incY);
void cblas_dtrmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, double *A, int lda,
double *X, int incX);
void cblas_dtbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, double *A, int lda,
double *X, int incX);
void cblas_dtpmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, double *Ap, double *X, int incX);
void cblas_dtrsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, double *A, int lda, double *X,
int incX);
void cblas_dtbsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, double *A, int lda,
double *X, int incX);
void cblas_dtpsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, double *Ap, double *X, int incX);
void cblas_cgemv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
void *alpha, void *A, int lda,
void *X, int incX, void *beta,
void *Y, int incY);
void cblas_cgbmv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
int KL, int KU, void *alpha,
void *A, int lda, void *X,
int incX, void *beta, void *Y, int incY);
void cblas_ctrmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *A, int lda,
void *X, int incX);
void cblas_ctbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, void *A, int lda,
void *X, int incX);
void cblas_ctpmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *Ap, void *X, int incX);
void cblas_ctrsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *A, int lda, void *X,
int incX);
void cblas_ctbsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, void *A, int lda,
void *X, int incX);
void cblas_ctpsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *Ap, void *X, int incX);
void cblas_zgemv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
void *alpha, void *A, int lda,
void *X, int incX, void *beta,
void *Y, int incY);
void cblas_zgbmv( enum CBLAS_ORDER Order,
enum CBLAS_TRANSPOSE TransA, int M, int N,
int KL, int KU, void *alpha,
void *A, int lda, void *X,
int incX, void *beta, void *Y, int incY);
void cblas_ztrmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *A, int lda,
void *X, int incX);
void cblas_ztbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, void *A, int lda,
void *X, int incX);
void cblas_ztpmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *Ap, void *X, int incX);
void cblas_ztrsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *A, int lda, void *X,
int incX);
void cblas_ztbsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, int K, void *A, int lda,
void *X, int incX);
void cblas_ztpsv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE TransA, enum CBLAS_DIAG Diag,
int N, void *Ap, void *X, int incX);
/*
* Routines with S and D prefixes only
*/
void cblas_ssymv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, float *A,
int lda, float *X, int incX,
float beta, float *Y, int incY);
void cblas_ssbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, int K, float alpha, float *A,
int lda, float *X, int incX,
float beta, float *Y, int incY);
void cblas_sspmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, float *Ap,
float *X, int incX,
float beta, float *Y, int incY);
void cblas_sger( enum CBLAS_ORDER Order, int M, int N,
float alpha, float *X, int incX,
float *Y, int incY, float *A, int lda);
void cblas_ssyr( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, float *X,
int incX, float *A, int lda);
void cblas_sspr( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, float *X,
int incX, float *Ap);
void cblas_ssyr2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, float *X,
int incX, float *Y, int incY, float *A,
int lda);
void cblas_sspr2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, float *X,
int incX, float *Y, int incY, float *A);
void cblas_dsymv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, double *A,
int lda, double *X, int incX,
double beta, double *Y, int incY);
void cblas_dsbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, int K, double alpha, double *A,
int lda, double *X, int incX,
double beta, double *Y, int incY);
void cblas_dspmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, double *Ap,
double *X, int incX,
double beta, double *Y, int incY);
void cblas_dger( enum CBLAS_ORDER Order, int M, int N,
double alpha, double *X, int incX,
double *Y, int incY, double *A, int lda);
void cblas_dsyr( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, double *X,
int incX, double *A, int lda);
void cblas_dspr( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, double *X,
int incX, double *Ap);
void cblas_dsyr2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, double *X,
int incX, double *Y, int incY, double *A,
int lda);
void cblas_dspr2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, double *X,
int incX, double *Y, int incY, double *A);
/*
* Routines with C and Z prefixes only
*/
void cblas_chemv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, void *alpha, void *A,
int lda, void *X, int incX,
void *beta, void *Y, int incY);
void cblas_chbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, int K, void *alpha, void *A,
int lda, void *X, int incX,
void *beta, void *Y, int incY);
void cblas_chpmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, void *alpha, void *Ap,
void *X, int incX,
void *beta, void *Y, int incY);
void cblas_cgeru( enum CBLAS_ORDER Order, int M, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *A, int lda);
void cblas_cgerc( enum CBLAS_ORDER Order, int M, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *A, int lda);
void cblas_cher( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, void *X, int incX,
void *A, int lda);
void cblas_chpr( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, float alpha, void *X,
int incX, void *A);
void cblas_cher2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *A, int lda);
void cblas_chpr2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *Ap);
void cblas_zhemv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, void *alpha, void *A,
int lda, void *X, int incX,
void *beta, void *Y, int incY);
void cblas_zhbmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, int K, void *alpha, void *A,
int lda, void *X, int incX,
void *beta, void *Y, int incY);
void cblas_zhpmv( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, void *alpha, void *Ap,
void *X, int incX,
void *beta, void *Y, int incY);
void cblas_zgeru( enum CBLAS_ORDER Order, int M, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *A, int lda);
void cblas_zgerc( enum CBLAS_ORDER Order, int M, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *A, int lda);
void cblas_zher( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, void *X, int incX,
void *A, int lda);
void cblas_zhpr( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
int N, double alpha, void *X,
int incX, void *A);
void cblas_zher2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *A, int lda);
void cblas_zhpr2( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo, int N,
void *alpha, void *X, int incX,
void *Y, int incY, void *Ap);
/*
* ===========================================================================
* Prototypes for level 3 BLAS
* ===========================================================================
*/
/*
* Routines with standard 4 prefixes (S, D, C, Z)
*/
void cblas_sgemm( enum CBLAS_ORDER Order, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_TRANSPOSE TransB, int M, int N,
int K, float alpha, float *A,
int lda, float *B, int ldb,
float beta, float *C, int ldc);
void cblas_ssymm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, int M, int N,
float alpha, float *A, int lda,
float *B, int ldb, float beta,
float *C, int ldc);
void cblas_ssyrk( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
float alpha, float *A, int lda,
float beta, float *C, int ldc);
void cblas_ssyr2k( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
float alpha, float *A, int lda,
float *B, int ldb, float beta,
float *C, int ldc);
void cblas_strmm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
float alpha, float *A, int lda,
float *B, int ldb);
void cblas_strsm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
float alpha, float *A, int lda,
float *B, int ldb);
void cblas_dgemm( enum CBLAS_ORDER Order, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_TRANSPOSE TransB, int M, int N,
int K, double alpha, double *A,
int lda, double *B, int ldb,
double beta, double *C, int ldc);
void cblas_dsymm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, int M, int N,
double alpha, double *A, int lda,
double *B, int ldb, double beta,
double *C, int ldc);
void cblas_dsyrk( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
double alpha, double *A, int lda,
double beta, double *C, int ldc);
void cblas_dsyr2k( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
double alpha, double *A, int lda,
double *B, int ldb, double beta,
double *C, int ldc);
void cblas_dtrmm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
double alpha, double *A, int lda,
double *B, int ldb);
void cblas_dtrsm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
double alpha, double *A, int lda,
double *B, int ldb);
void cblas_cgemm( enum CBLAS_ORDER Order, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_TRANSPOSE TransB, int M, int N,
int K, void *alpha, void *A,
int lda, void *B, int ldb,
void *beta, void *C, int ldc);
void cblas_csymm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb, void *beta,
void *C, int ldc);
void cblas_csyrk( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
void *alpha, void *A, int lda,
void *beta, void *C, int ldc);
void cblas_csyr2k( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
void *alpha, void *A, int lda,
void *B, int ldb, void *beta,
void *C, int ldc);
void cblas_ctrmm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb);
void cblas_ctrsm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb);
void cblas_zgemm( enum CBLAS_ORDER Order, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_TRANSPOSE TransB, int M, int N,
int K, void *alpha, void *A,
int lda, void *B, int ldb,
void *beta, void *C, int ldc);
void cblas_zsymm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb, void *beta,
void *C, int ldc);
void cblas_zsyrk( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
void *alpha, void *A, int lda,
void *beta, void *C, int ldc);
void cblas_zsyr2k( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
void *alpha, void *A, int lda,
void *B, int ldb, void *beta,
void *C, int ldc);
void cblas_ztrmm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb);
void cblas_ztrsm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, enum CBLAS_TRANSPOSE TransA,
enum CBLAS_DIAG Diag, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb);
/*
* Routines with prefixes C and Z only
*/
void cblas_chemm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb, void *beta,
void *C, int ldc);
void cblas_cherk( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
float alpha, void *A, int lda,
float beta, void *C, int ldc);
void cblas_cher2k( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
void *alpha, void *A, int lda,
void *B, int ldb, float beta,
void *C, int ldc);
void cblas_zhemm( enum CBLAS_ORDER Order, enum CBLAS_SIDE Side,
enum CBLAS_UPLO Uplo, int M, int N,
void *alpha, void *A, int lda,
void *B, int ldb, void *beta,
void *C, int ldc);
void cblas_zherk( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
double alpha, void *A, int lda,
double beta, void *C, int ldc);
void cblas_zher2k( enum CBLAS_ORDER Order, enum CBLAS_UPLO Uplo,
enum CBLAS_TRANSPOSE Trans, int N, int K,
void *alpha, void *A, int lda,
void *B, int ldb, double beta,
void *C, int ldc);
int cblas_errprn(int ierr, int info, char *form, ...);
#ifdef __cplusplus
}
#endif
#endif /* end #ifdef CBLAS_ENUM_ONLY */
#endif
#endif //NATIVEOPERATIONS_CBLAS_H