summary | shortlog | log | commit | commitdiff | tree
raw | patch | inline | side by side (parent: cbbe431)
author | Jianzhong Xu <xuj@ti.com> | |
Thu, 12 May 2016 14:30:51 +0000 (10:30 -0400) | ||
committer | Jianzhong Xu <xuj@ti.com> | |
Thu, 12 May 2016 14:30:51 +0000 (10:30 -0400) |
2. added offload tables for AM572x
3. cleaned up tuning code
4. added -ldl to linker options for building the examples
205 files changed:
index 66cb3e6641be209f638cd51e96505b24c3657c8f..c3a042d30eaba2b4d5568d62812345704c328a49 100644 (file)
LIB_DIR = $(LINALG_DIR)/packages/ti/linalg/lib/
LD_FLAGS=-L$(TARGET_ROOTDIR)/lib -L$(TARGET_ROOTDIR)/usr/lib -Wl,-rpath-link,$(TARGET_ROOTDIR)/lib -Wl,-rpath-link,$(TARGET_ROOTDIR)/usr/lib
-#BLASLIB = $(LIB_DIR)libcblas_armplusdsp.a $(LIB_DIR)libblis.a -lOpenCL -locl_util -lstdc++ -lrt -lm -lgomp -lpthread
-BLASLIB = $(LIB_DIR)libcblas_armplusdsp.a -lOpenCL -locl_util -lstdc++ -lrt -lm -lgomp -lpthread
-LAPACKLIB = $(LIB_DIR)libcblaswr.a $(LIB_DIR)liblapack.a $(LIB_DIR)libf2c.a $(LIB_DIR)libcblas_armplusdsp.a -lOpenCL -locl_util -lstdc++ -lrt -lm -lgomp -lpthread
+BLASLIB = $(LIB_DIR)libcblas_armplusdsp.a -lOpenCL -locl_util -lstdc++ -lrt -lm -lgomp -lpthread -ldl
+LAPACKLIB = $(LIB_DIR)libcblaswr.a $(LIB_DIR)liblapack.a $(LIB_DIR)libf2c.a $(LIB_DIR)libcblas_armplusdsp.a -lOpenCL -locl_util -lstdc++ -lrt -lm -lgomp -lpthread -ldl
%.o: %.c
$(CC) -c $(CFLAGS) $<
index 5885abb81d0a1ec8c1b2d480dc6aaa008d42b7dd..3d9ee061c56c025215e7967a469e99741a67370a 100644 (file)
endif
CPP_DEBUG = -g
-CPP_FLAGS = -D_LITTLE_ENDIAN -D__ARMv7 -DMEM_MODEL_${MEM_MODEL} -D$(TARGET) -I../../cblas/include -I../../blis/install/arm/include/blis/ -I$(TI_OCL_INSTALL_DIR)/include -fopenmp
+CPP_FLAGS = -D_LITTLE_ENDIAN -D__ARMv7 -DMEM_MODEL_${MEM_MODEL} -I../../cblas/include -I../../blis/install/arm/include/blis/ -I$(TI_OCL_INSTALL_DIR)/include -fopenmp
CL6X_FLAGS = $(INCS) --openmp --use_g2 -D$(TARGET) -DLIB_OPENCL
CLOCL_FLAGS =
OBJCOPY_ARGS=
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_cgemm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_cgemm.c
index e9ca10dcfb969a338d9680fcc12c4c85cb24a35c..664a12d3c130daaa37eaf885adfb82ee65746864 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_cgemm[GEMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_cgemm.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_cgemm.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_csyrk.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_csyrk.c
index 74c637b8c29f1af78277048e32a85d8e0b9e30b4..f6349ee18176d3ec30be80f89220f7323096afa7 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_csyrk[SYRK_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_csyrk.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_csyrk.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_ctrmm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_ctrmm.c
index 1d0522cfe906a8ce216d6182ca89afcdc4da839a..6cfef2e6400057e781a0664e15c41d6734f2688e 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_ctrmm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_ctrmm.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_ctrmm.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_ctrsm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_ctrsm.c
index 21dcdaf7e2a7a418860ef9ce237f86261e913bf6..c5e271b9576a35fe29da343ed75c15191d8de12a 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_ctrsm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_ctrsm.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_ctrsm.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_dgemm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_dgemm.c
index 75819ee81081f97ab372f0f4087fb7844240f1be..1fb99090b2d22e6f9071fbe793f7a75d02ca4022 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_dgemm[GEMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_dgemm.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_dgemm.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_dsyrk.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_dsyrk.c
index 776469b243fcba5789a8c3a4eb7169419754351e..a300b42d9b0435e82c1ec7f74a9ff7216c1716ac 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_dsyrk[SYRK_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_dsyrk.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_dsyrk.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_dtrmm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_dtrmm.c
index 446189f43978c51e8a802b985670cda0ed2a9ad7..02a7000f7cbbe4e6f790d7b80c2b3defa104201c 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_dtrmm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_dtrmm.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_dtrmm.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_dtrsm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_dtrsm.c
index daeb38ba53c4633d809a81df30524e28aff58e81..a431f8e7bfbc7c8d4178e6f46949c18a823df10a 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_dtrsm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,
-0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1};
+#ifdef MEM_MODEL_Large
+# include "ofld_tbls_K2H/ofld_tbl_dtrsm.c"
+#else
+# ifdef MEM_MODEL_Small
+# include "ofld_tbls_AM572x/ofld_tbl_dtrsm.c"
+# else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+# endif
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_sgemm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_sgemm.c
index b058b2fc71543a14d0c789e1a2cd0032bfb7accd..a413b342c7a16717afe28fcfd26c0600ee127076 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_sgemm[GEMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+/* Pick the sgemm offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_sgemm.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_sgemm.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_ssyrk.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_ssyrk.c
index 5b89cc96949345af939f91043e4f3667e16cb38c..68068b7c84f0f0087d8005c38419db99fe008d50 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_ssyrk[SYRK_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+/* Pick the ssyrk offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_ssyrk.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_ssyrk.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_strmm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_strmm.c
index 22f14e7ad1f5d14889ff04d2ffb6187e05ecfae5..d5336a36a5d58388a4dec643e1fbcf4a4bd0c195 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_strmm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+/* Pick the strmm offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_strmm.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_strmm.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_strsm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_strsm.c
index 68cc3ae8c6e40b9571c82dc91920a6d7d805fc96..4aeabea169d0d12886680adb231cfed23a1a9499 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_strsm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,
-0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+/* Pick the strsm offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_strsm.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_strsm.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_zgemm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_zgemm.c
index f7259284446da61c46a6b666b5c75e5cc6a7746a..f7df161bc26814ec9014d23d944da363bad6fde8 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_zgemm[GEMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+/* Pick the zgemm offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_zgemm.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_zgemm.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_zsyrk.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_zsyrk.c
index 8df383eabbb90e63e03754c186af49196c64c714..a8cef5f5dcb8c33b6091d7812d40087089a1b1c5 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_zsyrk[SYRK_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+/* Pick the zsyrk offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_zsyrk.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_zsyrk.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_ztrmm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_ztrmm.c
index 0d9caa8943f49acd5e7c1da22b0eb6ee20febfc2..d2bffd6b914005b70bced8e19e02d189586f140e 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_ztrmm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,1,
-0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
-1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
+/* Pick the ztrmm offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_ztrmm.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_ztrmm.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ofld_tbl_ztrsm.c b/src/ti/linalg/blasblisacc/src/ofld_tbl_ztrsm.c
index 2d630e8e4c0e0dfc0fc5caa0fb2c34dfe49e42ce..d4c65e5df7aed0ba99a7d76a08abd35b3d904bcd 100644 (file)
* THE POSSIBILITY OF SUCH DAMAGE.
*****************************************************************************/
-#include "ti_cblas_acc.h"
-
-char ofld_tbl_ztrsm[TRMM_OFFLOAD_TBL_SIZE] = {
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
-0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,
-0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,
-0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1};
+/* Pick the ztrsm offload table matching the memory-model macro, which is
+ * expected to come from the build flags (-DMEM_MODEL_<model>):
+ *   MEM_MODEL_Large -> table under ofld_tbls_K2H/
+ *   MEM_MODEL_Small -> table under ofld_tbls_AM572x/
+ * Any other configuration stops the build. */
+#if defined(MEM_MODEL_Large)
+# include "ofld_tbls_K2H/ofld_tbl_ztrsm.c"
+#elif defined(MEM_MODEL_Small)
+# include "ofld_tbls_AM572x/ofld_tbl_ztrsm.c"
+#else
+# error "Unsupported memory model! Please specify either MEM_MODEL_Large or MEM_MODEL_Small"
+#endif
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_acc.h b/src/ti/linalg/blasblisacc/src/ti_cblas_acc.h
index d2ba1ac48cc8d3243673b43f92d942eebe517115..77d8a473c11a44c4c3b0a3216faa4e8b7c0079f4 100644 (file)
#define TI_CBLAS_CBLAS_ZTRSV_IDX 144
#define TI_CBLAS_NUM_KERNELS 145
-
+/* Level 3 kernels offload table */
+/* Number of points in each dimension. ARM and DSP processing times are
+ measured at each point to determine whether or not to offload. */
#define NUM_PNT_EACH_DIM 16
+
+/* Offload table size */
#define GEMM_OFFLOAD_TBL_SIZE (NUM_PNT_EACH_DIM*NUM_PNT_EACH_DIM*NUM_PNT_EACH_DIM)
#define SYRK_OFFLOAD_TBL_SIZE (NUM_PNT_EACH_DIM*NUM_PNT_EACH_DIM)
#define TRMM_OFFLOAD_TBL_SIZE (NUM_PNT_EACH_DIM*NUM_PNT_EACH_DIM)
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_caxpy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_caxpy.c
index 9f20b26c5c959bd22f81091306731494796cd593..233c69bdb60ccc5ebe51c6bef7243e1473fdf142 100644 (file)
@@ -156,6 +156,11 @@ void cblas_caxpy(const int N, const void *alpha, const void *X, const int incX,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ccopy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ccopy.c
index bf48d8435b8ebb2d106c242cd1e87bb2797835e3..2a5fa6b44b4a4cb9617c85ff36ea92c797334b05 100644 (file)
@@ -145,6 +145,11 @@ void cblas_ccopy(const int N, const void *X, const int incX, void *Y, const int
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cdotc_sub.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cdotc_sub.c
index c54530ef6cebdcdc221d47d613b5b5b405ba2ce3..bb8fd34c56a0993ca6a5d32c52475def166db262 100644 (file)
@@ -156,6 +156,11 @@ void cblas_cdotc_sub(const int N, const void *X, const int incX, const void *Y,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cdotu_sub.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cdotu_sub.c
index 4070c52189bb4baecbceff2636f44f78a3583df5..2ba90052037e43816c53652d5ec20ca3d5a0659b 100644 (file)
@@ -156,6 +156,11 @@ void cblas_cdotu_sub(const int N, const void *X, const int incX, const void *Y,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgbmv.c
index f425fa1f73742d0754dbdc86339d717072ac2e0f..4a04d07ad56c26c1a5490fd15b4dfa241f8070d0 100644 (file)
@@ -218,6 +218,11 @@ void cblas_cgbmv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgemm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgemm.c
index 3eb73efaa015ccac8fb7a71cb33dd5c1b3daf95c..9880b6dfc89e374024e4e45d3b31b83cbf47b05b 100644 (file)
@@ -250,7 +250,7 @@ void cblas_cgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_cgemm is %d\n.", err_code);
+ printf("Error in offloaded cblas_cgemm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -266,6 +266,11 @@ void cblas_cgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgemv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgemv.c
index 05fe4cfa38d6ea3c18874a5be894dc2632ef0b4c..c4d35c856a1ba8d9562b82a1bc2e12581782bb27 100644 (file)
@@ -206,6 +206,11 @@ void cblas_cgemv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgerc.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgerc.c
index d16e435a1c22065338c6d2de95c0db1ee822aac5..3c89112142405e95bbe0731daeff73a48e86f41c 100644 (file)
@@ -189,6 +189,11 @@ void cblas_cgerc(const enum CBLAS_ORDER order, const int M, const int N, const v
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgeru.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cgeru.c
index ebf8c199e75cd4246eedc8f70ac34187efc691e0..3e951aa8f6e579bb73a257e3aee7350f7c21d3e6 100644 (file)
@@ -189,6 +189,11 @@ void cblas_cgeru(const enum CBLAS_ORDER order, const int M, const int N, const v
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chbmv.c
index 98ad84a78b75120d2ef3dbddf55405c452afc3fc..cfdb1f1e1a438b3a65b6601210ce2308285493aa 100644 (file)
@@ -206,6 +206,11 @@ void cblas_chbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chemm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chemm.c
index f8348692443c0900bd911592622e6b64326ad181..0e8eb77d498a6fea8770dae8730d053e5d4e1083 100644 (file)
@@ -244,7 +244,7 @@ void cblas_chemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_chemm is %d\n.", err_code);
+ printf("Error in offloaded cblas_chemm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -260,6 +260,11 @@ void cblas_chemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chemv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chemv.c
index b81a5ca893498ff1851356a8dc0588dee46b23fd..7421539a7302fc193bb392ebef13a6ab629a4966 100644 (file)
@@ -200,6 +200,11 @@ void cblas_chemv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cher.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cher.c
index f0ea8143e8f473bd6e4efb3d7bbc585a0329057e..fb566fde870116d753abd4e2d6fa1704fc19e8aa 100644 (file)
@@ -163,6 +163,11 @@ void cblas_cher(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cher2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cher2.c
index 12ba685746c159533dc326afb43a520f3641febe..f65b3072b2ab0f4c99594e028010a591f6352f46 100644 (file)
@@ -189,6 +189,11 @@ void cblas_cher2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cher2k.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cher2k.c
index ac6e37f4e20db12efe3e74d170d9e7c791a2b4bd..51ed40667360f4285da4c8795f23de1868b21dd4 100644 (file)
@@ -239,7 +239,7 @@ void cblas_cher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_cher2k is %d\n.", err_code);
+ printf("Error in offloaded cblas_cher2k with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -255,6 +255,11 @@ void cblas_cher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cherk.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cherk.c
index bce49b1cd305abee7baa64eefc6f4b064cf26b26..5e45c12482c3d4f42cf31098b29fd47d54549602 100644 (file)
@@ -213,7 +213,7 @@ void cblas_cherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_cherk is %d\n.", err_code);
+ printf("Error in offloaded cblas_cherk with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -229,6 +229,11 @@ void cblas_cherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chpmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chpmv.c
index 3de67e443f5714b7acf185940575112751242127..03e14dd173acf0a5947b29f705f06c90d09cd882 100644 (file)
@@ -194,6 +194,11 @@ void cblas_chpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chpr.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chpr.c
index ec3155a58e59e5df7d40026b3d1ddece8e422b29..315d80d9ff23439a75ad4652d4b6d645425d16ed 100644 (file)
@@ -157,6 +157,11 @@ void cblas_chpr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chpr2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_chpr2.c
index e64057cbf75f07fab9af75620d3e99c189f82c17..7f0f765e28b88a3b07951f5ee12072139bc4fece 100644 (file)
@@ -183,6 +183,11 @@ void cblas_chpr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_crotg.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_crotg.c
index 190ec8f1cca21f5d78802f88b28ec476ebdc5533..8eb77ee8a817b579e526d73c112b5823a46d634f 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cscal.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cscal.c
index 4c930606f994d222ea6a9cbd085763678db343b0..7933cba2d9fc0c7953be17272f5f92b37727ea70 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csscal.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csscal.c
index a548c62aca96cd7f9884405a665c336488c6c2b5..161b6d5f8b8e7c831fc4ecc49e99fc60942c1643 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cswap.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_cswap.c
index e6d206a42c89e5be55b324d02633db0abc9cae19..1dac9fedd534ce7d44d7130fc68d153488f938ea 100644 (file)
@@ -156,6 +156,11 @@ void cblas_cswap(const int N, void *X, const int incX, void *Y, const int incY)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csymm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csymm.c
index 14785a23e6d2ac1ab59e6db6ff1f785ecc5a7eee..41558f8192a7e9d8a27382be64c8ea396b0e2395 100644 (file)
@@ -244,7 +244,7 @@ void cblas_csymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_csymm is %d\n.", err_code);
+ printf("Error in offloaded cblas_csymm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -260,6 +260,11 @@ void cblas_csymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csyr2k.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csyr2k.c
index 2e26948440d0a54513459e29a6e9949b5b1b7205..3a3611f1e7f531e6e7f11d0d859ea5b51d72e4ca 100644 (file)
@@ -244,7 +244,7 @@ void cblas_csyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_csyr2k is %d\n.", err_code);
+ printf("Error in offloaded cblas_csyr2k with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -260,6 +260,11 @@ void cblas_csyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csyrk.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_csyrk.c
index c76555749e462a2415c7b12e9c1b6a08fced6c7b..8a0a4a4224058b659b209c8be272f12137d2028f 100644 (file)
@@ -223,7 +223,7 @@ void cblas_csyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_csyrk is %d\n.", err_code);
+ printf("Error in offloaded cblas_csyrk with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -239,6 +239,11 @@ void cblas_csyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctbmv.c
index 467cf853e1394d09354185b127fd28a83c0ad82b..237b7febe40b01b01ecb3a8afa78c9ba87f9669c 100644 (file)
@@ -175,6 +175,11 @@ void cblas_ctbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctbsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctbsv.c
index 9c9c9a92552ba3d01c88a3a187b6ac3c14d1ea6a..b03c3166381c64e2851634ffe9d4fa3a5e38f48b 100644 (file)
@@ -175,6 +175,11 @@ void cblas_ctbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctpmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctpmv.c
index 251ce80a821841bc1125932513e2330a2abe5f18..816fed24bfa6d2426eabc789356aedafc16846ca 100644 (file)
@@ -163,6 +163,11 @@ void cblas_ctpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctpsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctpsv.c
index 42b6a0bed910d142f0f870fa2ca2d1572e9f9f93..44d25ed595ae7aea9ebba6491e4c57e9709f6377 100644 (file)
@@ -163,6 +163,11 @@ void cblas_ctpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrmm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrmm.c
index 50d3607515a703784a85b67db26f5228ba228480..17713afbbdd62cd2edaa0a410876438a2cbc24cf 100644 (file)
@@ -224,7 +224,7 @@ void cblas_ctrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_ctrmm is %d\n.", err_code);
+ printf("Error in offloaded cblas_ctrmm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -240,6 +240,11 @@ void cblas_ctrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrmv.c
index c501935c1d3d91f0c2199a1c8cfb2abb66576f86..e2461a537ffc44343583fb0d0737dff32e7717f8 100644 (file)
@@ -169,6 +169,11 @@ void cblas_ctrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrsm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrsm.c
index c03d8a0acb7997d19aaf56c2f5d31703f80bb753..7279d08ee39073af1f7c9dbd29cbb43171d285d4 100644 (file)
@@ -224,7 +224,7 @@ void cblas_ctrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_ctrsm is %d\n.", err_code);
+ printf("Error in offloaded cblas_ctrsm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -240,6 +240,11 @@ void cblas_ctrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ctrsv.c
index 39c3ee4f3b6c4d28c4d6f467fea3cf0ce70d45b1..2ecf16804f5a6d778ca1a9592d216636b7c942cf 100644 (file)
@@ -169,6 +169,11 @@ void cblas_ctrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dasum.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dasum.c
index 60527bd78fd82c1773f9bac6fb77abe3c4f2ed72..3425c225829197bd64c48ec22c05694b4d1629eb 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_daxpy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_daxpy.c
index b673a31464acfc370cf5b15290ee488eb943a252..64a6824be27981387aec5cf4fa34656495730dcb 100644 (file)
@@ -151,6 +151,11 @@ void cblas_daxpy(const int N, const double alpha, const double *X, const int inc
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dcopy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dcopy.c
index fa8877c17f807fc69412fa8eee340c4467c86171..c145e2da13925a3fe3d34183c8df8174bc6d5ca5 100644 (file)
@@ -145,6 +145,11 @@ void cblas_dcopy(const int N, const double *X, const int incX, double *Y, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ddot.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ddot.c
index de913e558c46dab97c2865f864490e5eb80db47c..aa1f769a67e9c6f4a7a829b0f303c262b62cf274 100644 (file)
@@ -158,6 +158,11 @@ double cblas_ddot(const int N, const double *X, const int incX, const double *Y,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dgbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dgbmv.c
index 4eb8ca18ff0bb15ef5f4bcb502a08e9987d5a9ba..1ce1c80d8f3db4f135bf9dd7d643bc49ad620be3 100644 (file)
@@ -208,6 +208,11 @@ void cblas_dgbmv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dgemm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dgemm.c
index 4cfa7e56da6ae7414a4d2f43e454e62849416228..92ecb14c72cec6f4aafe2597f0cfd6f5edd73b82 100644 (file)
@@ -240,7 +240,7 @@ void cblas_dgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_dgemm is %d\n.", err_code);
+ printf("Error in offloaded cblas_dgemm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -256,6 +256,11 @@ void cblas_dgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dgemv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dgemv.c
index c624f6cca3a40c9c5fa0597d910ce015da291c80..2c3a5e2ad743bf11a6bbcfee2900ad824673273e 100644 (file)
@@ -196,6 +196,11 @@ void cblas_dgemv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dger.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dger.c
index 0492d0aa90393e9e91e4c8f47eed80e36a021a9d..1c911e7245419c126c7177ae96b22483df096502 100644 (file)
@@ -184,6 +184,11 @@ void cblas_dger(const enum CBLAS_ORDER order, const int M, const int N, const do
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dnrm2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dnrm2.c
index bc200fa6b73a8483437b8be129743f34f50a0fe6..a3c14c681f8ce132a6d0c4edd4890358a9e6e44a 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drot.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drot.c
index 86bacba7ff9f9a8ccbc3e38c331251f153d8d0fe..dd86c24823efd90285b11eb31337c00f356080b0 100644 (file)
@@ -156,6 +156,11 @@ void cblas_drot(const int N, double *X, const int incX, double *Y, const int inc
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drotg.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drotg.c
index c535574abfa0498693584096376268f81f14520e..5b3732c187c57927bb951a96b8670f6afc3df8c5 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drotm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drotm.c
index 0cb941fd2abe30879be6c2c59814e806e1a3d741..0ba101a19437e65e64fa309688cfab33b4b1e32a 100644 (file)
@@ -155,6 +155,11 @@ void cblas_drotm(const int N, double *X, const int incX, double *Y, const int in
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drotmg.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_drotmg.c
index 0cf5e8fa10c592ad895766bd4fdd07af8f603af5..efbcc94daccaaaab4b190248e904f5c861c4fdae 100644 (file)
@@ -144,6 +144,11 @@ void cblas_drotmg(double *d1, double *d2, double *b1, const double b2, double *P
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsbmv.c
index 920b40361577f965bfc38fb63842a17fa4d7a31c..b8267660872abad4e2f9e799e48183b5e87b7e3c 100644 (file)
@@ -196,6 +196,11 @@ void cblas_dsbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dscal.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dscal.c
index d75049f65afa31e77da37c9623bcde8b2a2fb6fb..93d81f0288417f8667eede5160578e686af68ded 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsdot.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsdot.c
index c976fefc2d1db46dff46a00058ce01f1755065c1..8f027918b92f909d41ece6b1671411d4550cb6a4 100644 (file)
@@ -158,6 +158,11 @@ double cblas_dsdot(const int N, const float *X, const int incX, const float *Y,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dspmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dspmv.c
index 48a0e452f080642d37d9fd16dd0e9f567247bdb6..13b403b29b4e710d6081aedadd1c45a87462c351 100644 (file)
@@ -184,6 +184,11 @@ void cblas_dspmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dspr.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dspr.c
index 93c94843f2675e378546df796d7ff164c7ff11cd..c3479696e95e8d5a19ffbda1d0554d250515909f 100644 (file)
@@ -157,6 +157,11 @@ void cblas_dspr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dspr2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dspr2.c
index 89aff959b3476b815b36e62be51e06c638c1ce63..812bb3bd7b903889e2de4439deacfde511307d44 100644 (file)
@@ -178,6 +178,11 @@ void cblas_dspr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dswap.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dswap.c
index b3e692928613b5f5f34a048a47df2bd8a27d52d2..d17893dd6a9d3cfaf42c827513869946d7e176c7 100644 (file)
@@ -156,6 +156,11 @@ void cblas_dswap(const int N, double *X, const int incX, double *Y, const int in
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsymm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsymm.c
index 52dd00838ae0bc335c17b15fcdff3215a8055161..d5c28bc24c720acfaf68bba9cc0be0c52bcb4cf1 100644 (file)
@@ -234,7 +234,7 @@ void cblas_dsymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_dsymm is %d\n.", err_code);
+ printf("Error in offloaded cblas_dsymm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -250,6 +250,11 @@ void cblas_dsymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsymv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsymv.c
index 7e6a9627ff427826615c8aaf8a4c4a20c359b6ed..80eb1a67ed2955a3c5472a2e2ce5a542a674ffe5 100644 (file)
@@ -190,6 +190,11 @@ void cblas_dsymv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyr.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyr.c
index 1d42f0bd40df24f47c96d9a097cb85c9721731fd..6b05e31db0cfc8d560f3c3563c31792a3fc33529 100644 (file)
@@ -163,6 +163,11 @@ void cblas_dsyr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyr2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyr2.c
index 5fa094ba29d3f72ba026ea29774e3460e2ec878f..86a5a48f4bca85f6dc7f60acd45e8cdd958af212 100644 (file)
@@ -184,6 +184,11 @@ void cblas_dsyr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyr2k.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyr2k.c
index 4c5f281b5d62fa41efb43e50c29f274fafaad2c7..4caffb7de298583d88eefabe161471684235edaa 100644 (file)
@@ -234,7 +234,7 @@ void cblas_dsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_dsyr2k is %d\n.", err_code);
+ printf("Error in offloaded cblas_dsyr2k with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -250,6 +250,11 @@ void cblas_dsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyrk.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dsyrk.c
index e07661799bfb34b4af00823f737fd24490f8ef35..341ff82ff53a9e39fb0fef86642fd5c603166927 100644 (file)
@@ -213,7 +213,7 @@ void cblas_dsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_dsyrk is %d\n.", err_code);
+ printf("Error in offloaded cblas_dsyrk with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -229,6 +229,11 @@ void cblas_dsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtbmv.c
index 4856f3cb8a92bf0d1332cb118a6dee1470fcf8e0..d95c34f09a9124e55768e4a797874627e6d51652 100644 (file)
@@ -175,6 +175,11 @@ void cblas_dtbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtbsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtbsv.c
index f9aaf2d9d20c7277c82d9053cb0bd6f668c4afc2..c375c4ecf95729de4adca6e47839acd4a8681cba 100644 (file)
@@ -175,6 +175,11 @@ void cblas_dtbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtpmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtpmv.c
index d3740ee3cfecdc52912e75338f954cb094434303..105c178e34796cf8eb303b2c0dec1a392078fb40 100644 (file)
@@ -163,6 +163,11 @@ void cblas_dtpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtpsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtpsv.c
index 030eea6765d132fdf1ef7a895afe68bbc5c82ec5..32311ab056a1f767871ed3cec340bddfb5379323 100644 (file)
@@ -163,6 +163,11 @@ void cblas_dtpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrmm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrmm.c
index f2107933378711c35ae27855d4096eb5b0d668f2..cac7e276f6a73a63abaa363d2392ceab355a9693 100644 (file)
@@ -219,7 +219,7 @@ void cblas_dtrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_dtrmm is %d\n.", err_code);
+ printf("Error in offloaded cblas_dtrmm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -235,6 +235,11 @@ void cblas_dtrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrmv.c
index 20d08c8d4b57582572ee6e67c76f9a41ae3df512..d281310446b5ae87da523ff7b950879cfdccee25 100644 (file)
@@ -169,6 +169,11 @@ void cblas_dtrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrsm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrsm.c
index 0dbfa28d843a8de0bdff5137f86cb8ce0372428c..a3bbc06c16a643f46c72233e6e26e57e8b9f5c6b 100644 (file)
@@ -219,7 +219,7 @@ void cblas_dtrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_dtrsm is %d\n.", err_code);
+ printf("Error in offloaded cblas_dtrsm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -235,6 +235,11 @@ void cblas_dtrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dtrsv.c
index d9229c0ae5af6723db06d1b0e26ecb4e96050690..4001c3f22e5b0ced5c9a0faaa6d4fb74a31a07f7 100644 (file)
@@ -169,6 +169,11 @@ void cblas_dtrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dzasum.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dzasum.c
index 6d5641bc9ea69bf9dbd245966dbc7069d4abf18b..5b79f68d7de150abf64c254dfda8f6e99a3bcb14 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dznrm2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_dznrm2.c
index 4557b2ef40342b27aa1b4cd4747397da85bdf5a7..81d7e539848459bedf09767664035d4296349c6a 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_icamax.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_icamax.c
index ce9e10c21c5f582e110dd01f75d7f28b0ad98f5f..7cbcfc3424fd833e3a0f46bef12b76eedbb0a91e 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_idamax.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_idamax.c
index d6bfedfdb6c8e5c7f032ab6819dac7fca6e9d388..d393ea2dee1592a4ae1d1a7dcd2a9dba407d6f52 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_isamax.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_isamax.c
index 5beae2407db6d0578d18afe45592d7786978e9c1..35d6aa6c433dad62251565649f141a6100b1e0f9 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_izamax.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_izamax.c
index c80492381b2fbef510666d734f23fb14de910c89..f23531903a6a78d7a71e504a4bed8a00134ce271 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sasum.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sasum.c
index 6f4172d8596c2196c515c80186af5cb4690d0abb..60b0b88da69eedd7c74e56d7c4841588c316f159 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_saxpy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_saxpy.c
index 9c7af6ef5e3df994d1ebee6e3962b9e3724531a2..2caee520b15c109476508d843704657d17c276ac 100644 (file)
@@ -151,6 +151,11 @@ void cblas_saxpy(const int N, const float alpha, const float *X, const int incX,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_scasum.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_scasum.c
index 3f0a9a34a382de498be87f36cb82e93a37fb9014..67c18eafd9f856abb22474c2490ef5bbe95fdf4c 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_scnrm2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_scnrm2.c
index 43f0b2f8daee71bb7fbc2da09bd650cb34985650..a9e271381d91cf4b313ad573d9672107880d246d 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_scopy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_scopy.c
index 7e225e88b36f50ae35a1526305af6ca5a1a1dc3d..2c3a8f3215480952678ca68cf5c71beeadc0849d 100644 (file)
@@ -145,6 +145,11 @@ void cblas_scopy(const int N, const float *X, const int incX, float *Y, const in
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sdot.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sdot.c
index 9cd85250c62450db3c743038082f3fba35f47f43..ab7d8d0eccebab4f57bdef72e11cee33e4419c98 100644 (file)
@@ -158,6 +158,11 @@ float cblas_sdot(const int N, const float *X, const int incX, const float *Y, co
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sdsdot.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sdsdot.c
index 268fb76d9fe697dbef58b7a2ede06fe3e8eef091..fd5adb9dea7f0e67464991fada1cdafe62eb7266 100644 (file)
@@ -164,6 +164,11 @@ float cblas_sdsdot(const int N, const float alpha, const float *X, const int inc
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sgbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sgbmv.c
index 956ee4110936c7bddf2c7d52798e3438249e2b22..32d800ae4a9308551d2b7c0d4b5ae3316bfd4a9d 100644 (file)
@@ -208,6 +208,11 @@ void cblas_sgbmv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sgemm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sgemm.c
index 3385f80c8c17b0fe1a9321ca22ea50284d7a81d0..9599e84db0b23786fddfe3d5ca160697aad4e945 100644 (file)
@@ -240,7 +240,7 @@ void cblas_sgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_sgemm is %d\n.", err_code);
+ printf("Error in offloaded cblas_sgemm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -256,6 +256,11 @@ void cblas_sgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sgemv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sgemv.c
index 9acaf531852879ddc1df0546b8da64c99afbad4f..48a3de602e1fa7501f58a186a2cb7779a56a69b3 100644 (file)
@@ -196,6 +196,11 @@ void cblas_sgemv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sger.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sger.c
index fcf4ca2447b629688d2508ee97467595506a823f..6780fa907d163c4a7c1032cb7a5632ab156184e8 100644 (file)
@@ -184,6 +184,11 @@ void cblas_sger(const enum CBLAS_ORDER order, const int M, const int N, const fl
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_snrm2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_snrm2.c
index 013acfabcdf148eb1bcc16480e45f5d9ee9b81f2..ba378a301b3b1015b3b5cbd4bc6f0c36ae93e4bf 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return 0;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srot.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srot.c
index cafda115a4d0d08b9352f6f0864a0812bb416330..a7c6bbcbb34ea476515cf25809415394c2a261bf 100644 (file)
@@ -156,6 +156,11 @@ void cblas_srot(const int N, float *X, const int incX, float *Y, const int incY,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srotg.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srotg.c
index dbe5e2d6c86d533809a642281dca108f4878cce8..f399accf8565f87503c65fc5edfad18a7b036d90 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srotm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srotm.c
index 42a2bf43dbfc23695ec3e34b15b19a5ec7b7ac7b..845a95436a5af53a86d90e0090d547807252ed17 100644 (file)
@@ -155,6 +155,11 @@ void cblas_srotm(const int N, float *X, const int incX, float *Y, const int incY
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srotmg.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_srotmg.c
index 892f0646b2af12ee17521023641ef47b87f687fd..8a03f42e27dd026caa84c8636b62b3b0685fbf46 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssbmv.c
index 8e7f770cfccd9abf1cd3a93936bdd58f1289241b..24f9925a4fc1d2d912644bc98a269147a8b83773 100644 (file)
@@ -196,6 +196,11 @@ void cblas_ssbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sscal.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sscal.c
index d375b548ca045d954c31030bb01a3ef76b1d8941..df05602b088e4be22387053c4b045502bc068fc8 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sspmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sspmv.c
index d292322a2c27abfa3ffca743e9fb8305c7e6b31e..562ccec61399d31c7cb66817956295039323a5d9 100644 (file)
@@ -184,6 +184,11 @@ void cblas_sspmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sspr.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sspr.c
index 229cc92b922d28d3fa8096ac72c80a631caae19d..b2e934244e586b4f52eaa1f244004067451fde73 100644 (file)
@@ -157,6 +157,11 @@ void cblas_sspr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sspr2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sspr2.c
index 30c784ea1b50e838cfb8977fc2a79a642b1118ac..7b82e54573298f4083c600ffd0b07c5ce36e1efc 100644 (file)
@@ -178,6 +178,11 @@ void cblas_sspr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sswap.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_sswap.c
index 2f7865eecf9215983fac2111e695c37074930a53..d7590dd121ce2841f7fe3c7d3330513729a15b77 100644 (file)
@@ -156,6 +156,11 @@ void cblas_sswap(const int N, float *X, const int incX, float *Y, const int incY
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssymm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssymm.c
index f3852044622292eeb09776f982424e8d953e4617..bc86c8ec103dc7e4bfef3550fd8330b12e66ad03 100644 (file)
@@ -234,7 +234,7 @@ void cblas_ssymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_ssymm is %d\n.", err_code);
+ printf("Error in offloaded cblas_ssymm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -250,6 +250,11 @@ void cblas_ssymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssymv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssymv.c
index 6aedd21b2099f9c68f579f2b095647bebc6c6da6..bfe09acba07085ca1d1019b0b840b962e76667f0 100644 (file)
@@ -190,6 +190,11 @@ void cblas_ssymv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyr.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyr.c
index 64166fb7805017b77f8915fd5eaefb28dea769c6..e6c30c8fda1d3255af0f92fee18dad2a6dabb68f 100644 (file)
@@ -163,6 +163,11 @@ void cblas_ssyr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyr2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyr2.c
index d5edeac4e9449fe712ae4f487bdf0742bab36d92..fa56ed316d9dc1cfd461ab14a62c98add17d0379 100644 (file)
@@ -184,6 +184,11 @@ void cblas_ssyr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyr2k.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyr2k.c
index 8564f71b855ce2d164fa90786928001a17692661..40d85039f1b95e1ad6d11753cfe049406b9384b7 100644 (file)
@@ -234,7 +234,7 @@ void cblas_ssyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_ssyr2k is %d\n.", err_code);
+ printf("Error in offloaded cblas_ssyr2k with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -250,6 +250,11 @@ void cblas_ssyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyrk.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ssyrk.c
index a9f8a2db47ddd19ef695eb5039aaf9e83e22b656..f9c0f31001877212bb62ea3b132cd518711a11de 100644 (file)
@@ -213,7 +213,7 @@ void cblas_ssyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_ssyrk is %d\n.", err_code);
+ printf("Error in offloaded cblas_ssyrk with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -229,6 +229,11 @@ void cblas_ssyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stbmv.c
index 60fe80300ab035b668a733666a499ca83e86844e..607394c273ddd7610f46ebfee76aa49e66f8661c 100644 (file)
@@ -175,6 +175,11 @@ void cblas_stbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stbsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stbsv.c
index 7ac2d478afac27e1f380af80382e6de53045f293..96e6cab5bd9f474bf3004b92a4763c388761a819 100644 (file)
@@ -175,6 +175,11 @@ void cblas_stbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stpmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stpmv.c
index 0e0a326afeca05ba803d6f0944cc47f5b386e047..b45b877c4c5bfbcc9b77258ca2487c9ef7c27984 100644 (file)
@@ -163,6 +163,11 @@ void cblas_stpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stpsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_stpsv.c
index e54e5650deb312b09f00c746d4247f5f0e8d8780..0681ed8f644185c6cec6ce2797a6f45b4f48e22d 100644 (file)
@@ -163,6 +163,11 @@ void cblas_stpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strmm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strmm.c
index 4e80830d0e4ac23c9e1133e6098afd336ed2ebce..3839c8e7956fd284a8086d1aafdcc246fef60725 100644 (file)
@@ -219,7 +219,7 @@ void cblas_strmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_strmm is %d\n.", err_code);
+ printf("Error in offloaded cblas_strmm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -235,6 +235,11 @@ void cblas_strmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strmv.c
index 9860ef5389428bac5ac5bc344f55043531ef2e83..40ddbc3375d8e86daf218cd3c00ce41a1c16c626 100644 (file)
@@ -169,6 +169,11 @@ void cblas_strmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strsm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strsm.c
index 4bf872ca5f052ca5c8db46826e154982c7e698d6..18e329e6287e7d58a1953daa138d4e2b5742703e 100644 (file)
@@ -219,7 +219,7 @@ void cblas_strsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_strsm is %d\n.", err_code);
+ printf("Error in offloaded cblas_strsm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -235,6 +235,11 @@ void cblas_strsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_strsv.c
index 1a7e2096f48a89a55075e2816760173a67ab0b20..26b9a3c8e76547cc2c05a295f6225e59a1245b16 100644 (file)
@@ -169,6 +169,11 @@ void cblas_strsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_xerbla.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_xerbla.c
index f7da8da5f5bfcbee9eaa11924c8a55b556cae538..23efb904e8bb5b76c347471d593b01b6d4087c38 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zaxpy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zaxpy.c
index c4899aa2aa4e361b238f6d07d600028dddc9e8d2..fdbd907ea4e1ac980aea101ff3ed2bb0d8212b98 100644 (file)
@@ -156,6 +156,11 @@ void cblas_zaxpy(const int N, const void *alpha, const void *X, const int incX,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zcopy.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zcopy.c
index 36b75550ec81044c32c1e0f358d180b5d1d07b35..da878b56ffbe71b8951a3b92b2ffde00ceb450e2 100644 (file)
@@ -145,6 +145,11 @@ void cblas_zcopy(const int N, const void *X, const int incX, void *Y, const int
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zdotc_sub.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zdotc_sub.c
index 7bc1336cd31f3d5576c4676db93f5301f9cc6b27..4a97d0ba4993c2190e46117a065eb3eb977406d6 100644 (file)
@@ -156,6 +156,11 @@ void cblas_zdotc_sub(const int N, const void *X, const int incX, const void *Y,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zdotu_sub.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zdotu_sub.c
index 0327eebe150194bb5ea43796d293af7103a1eb41..7d7f3e12606d8c51f448f476c2e377d516992759 100644 (file)
@@ -156,6 +156,11 @@ void cblas_zdotu_sub(const int N, const void *X, const int incX, const void *Y,
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zdscal.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zdscal.c
index 838c7dea90c45dbcb4ee8e60e6f01c4fb0a8430d..7294884c36b518c5bba2e1c523505f96430f1dda 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgbmv.c
index 049ca5811653975b0bce644c61be20cb0356cf9e..3eb84718dd76f48a7489c5e7c6e0d7b9f0903eb2 100644 (file)
@@ -218,6 +218,11 @@ void cblas_zgbmv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgemm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgemm.c
index fc11cb1c7672bc45fc2fbbea949939375d677332..ac457bd7a69992a2d361731f55a0ea120fa55597 100644 (file)
@@ -250,7 +250,7 @@ void cblas_zgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_zgemm is %d\n.", err_code);
+ printf("Error in offloaded cblas_zgemm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -266,6 +266,11 @@ void cblas_zgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgemv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgemv.c
index 2e1dbc1d6209cd2e3c8c340bfca0d54a9c32c716..b4767f5b4858a98d737f2b8ac346262030aad962 100644 (file)
@@ -206,6 +206,11 @@ void cblas_zgemv(const enum CBLAS_ORDER order, const enum CBLAS_TRANSPOSE TransA
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgerc.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgerc.c
index 6292ddccffd4e7509d3e2515c6362177a1937c88..58eb984d4af06d5d0498bc7cd5a09dc221dff788 100644 (file)
@@ -189,6 +189,11 @@ void cblas_zgerc(const enum CBLAS_ORDER order, const int M, const int N, const v
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgeru.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zgeru.c
index 8302431314f7ef2f0452302e7771b983121dd136..23d4c079cf77b08e356cb59d3f65633f4e76d6c7 100644 (file)
@@ -189,6 +189,11 @@ void cblas_zgeru(const enum CBLAS_ORDER order, const int M, const int N, const v
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhbmv.c
index 6afd4cbd2c2c27421dceed1e9d16227fe91fda32..67779e49f77aca7dba32d0f9142c4cf8e8194665 100644 (file)
@@ -206,6 +206,11 @@ void cblas_zhbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhemm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhemm.c
index 193b0f345d6d6d8390e39525947a7e6f7961a5db..7e94b80d08ea4a36ccce275679f50cf53ae15df9 100644 (file)
@@ -244,7 +244,7 @@ void cblas_zhemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_zhemm is %d\n.", err_code);
+ printf("Error in offloaded cblas_zhemm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -260,6 +260,11 @@ void cblas_zhemm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhemv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhemv.c
index 283bc8d77feec964a2f6205685d33073c0172551..c6a4cbe1a4ec9edb8bd98f7b0563f13feb08a821 100644 (file)
@@ -200,6 +200,11 @@ void cblas_zhemv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zher.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zher.c
index bf0dec2e521f2e40394ebd26ed609a0794301e70..3fdd79ee8ef72548fff6bbf00d78849217ff0a1d 100644 (file)
@@ -163,6 +163,11 @@ void cblas_zher(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zher2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zher2.c
index 9b72f952c717e8b87f0e45464343b7e4a45500c5..0cdf1aba2bbfa961cebe34a3bc4ef7730d608caa 100644 (file)
@@ -189,6 +189,11 @@ void cblas_zher2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zher2k.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zher2k.c
index 94442469dbf76005979ff4b53146ddbf3c9f4ef8..e15a8ea81025a0d56c9b4f639238fb2fcddeff5c 100644 (file)
@@ -239,7 +239,7 @@ void cblas_zher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_zher2k is %d\n.", err_code);
+ printf("Error in offloaded cblas_zher2k with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -255,6 +255,11 @@ void cblas_zher2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zherk.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zherk.c
index 651fab2d45c10ff4ff177a89ac8089699d99aaec..5eb89b4731cdacf20a2791a7b8ad96b40d3ea571 100644 (file)
@@ -213,7 +213,7 @@ void cblas_zherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_zherk is %d\n.", err_code);
+ printf("Error in offloaded cblas_zherk with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -229,6 +229,11 @@ void cblas_zherk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhpmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhpmv.c
index 8c14a93696a54038c91b093be502852b680fd6d9..bc9cdf9013a2aa36df5382ba41eab1cae8698c6c 100644 (file)
@@ -194,6 +194,11 @@ void cblas_zhpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhpr.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhpr.c
index ff810ec1ded88adb08f1f8aca3d66df6308abfc1..1b25b51baf179dfe22d8fb7259e1024a38f92be6 100644 (file)
@@ -157,6 +157,11 @@ void cblas_zhpr(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhpr2.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zhpr2.c
index 33c9fb6149e06308ed18df853a188c5b1ddba158..a1aeaae7b6640000a8427109b9da3946300b55d8 100644 (file)
@@ -183,6 +183,11 @@ void cblas_zhpr2(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zrotg.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zrotg.c
index f13b5c94c59ca73113957901051ee8933b2fc773..f1e437c882ee4ddc34cce605e8685979c6a98b1e 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zscal.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zscal.c
index c54445b49c073aeab180876b1bf32d1dc18e0f4f..0169b07d5a27847529cd3ccef1d8e67a8ad56db7 100644 (file)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zswap.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zswap.c
index d4855ae08da00f6abf1519179d23430905a8827c..70a29e9e339d900b38d79aad7f40ae273c072d55 100644 (file)
@@ -156,6 +156,11 @@ void cblas_zswap(const int N, void *X, const int incX, void *Y, const int incY)
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zsymm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zsymm.c
index cd9731d6cb66008a89a604a38f9e28c3189229bd..9175e0ebb8b8a09f02358c07d2077c68fe01b19b 100644 (file)
@@ -244,7 +244,7 @@ void cblas_zsymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_zsymm is %d\n.", err_code);
+ printf("Error in offloaded cblas_zsymm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -260,6 +260,11 @@ void cblas_zsymm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zsyr2k.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zsyr2k.c
index 5c83eedc82d6d7212f1fd816652debc8dce66dc8..53b704443cb751df55942af3fce43e50b1a1e3ce 100644 (file)
@@ -244,7 +244,7 @@ void cblas_zsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_zsyr2k is %d\n.", err_code);
+ printf("Error in offloaded cblas_zsyr2k with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -260,6 +260,11 @@ void cblas_zsyr2k(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, cons
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zsyrk.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_zsyrk.c
index 49622bba4be258772826ffaff90d3e66818d9739..f705eb6ac58e2e84753d16f9bc01d45d8ea95877 100644 (file)
@@ -223,7 +223,7 @@ void cblas_zsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_zsyrk is %d\n.", err_code);
+ printf("Error in offloaded cblas_zsyrk with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -239,6 +239,11 @@ void cblas_zsyrk(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztbmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztbmv.c
index f17892612f30f69f0a03cbc6555baf5727aa8989..c026942373d1e562a45c6b2084be77ce1e034fbd 100644 (file)
@@ -175,6 +175,11 @@ void cblas_ztbmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztbsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztbsv.c
index 6202e8d8ed3c0fcbb7026b62638994eb4fb575a6..754eca7b03969c359f69936b9a0ee99a6e246a0a 100644 (file)
@@ -175,6 +175,11 @@ void cblas_ztbsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztpmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztpmv.c
index 9d26625f0c751cac87d6cd0e6f3f17a86f3da394..6fd2dd0b29806406dc270141a02a39b91b1a72bc 100644 (file)
@@ -163,6 +163,11 @@ void cblas_ztpmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztpsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztpsv.c
index 1c47aa7e9bdded2604a2a9611b77d46595d8c12a..dcf6100e6b3aa7df19ba96bd6438237b9a94e7fc 100644 (file)
@@ -163,6 +163,11 @@ void cblas_ztpsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrmm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrmm.c
index 4953031e56496c0551003e67f2f225a8279dbcb7..c010d894eb1d74182d677139327a1c39a4cb5e1b 100644 (file)
@@ -224,7 +224,7 @@ void cblas_ztrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_ztrmm is %d\n.", err_code);
+ printf("Error in offloaded cblas_ztrmm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -240,6 +240,11 @@ void cblas_ztrmm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrmv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrmv.c
index e3f466cdbb08267fe2c6998ffd7c440a0593cc71..1cbe9e05c04f0af3a5fcae7f68fc29532a7cc3c5 100644 (file)
@@ -169,6 +169,11 @@ void cblas_ztrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrsm.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrsm.c
index 1be9ded6fa0b7171f9a4875c196cf1db10a1cb6b..4cca72875b944680f67ad2f7324c25d0ff50a4de 100644 (file)
@@ -224,7 +224,7 @@ void cblas_ztrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#endif
if(err_code != TICBLAS_SUCCESS) {
- printf("Error code returned by offloaded cblas_ztrsm is %d\n.", err_code);
+ printf("Error in offloaded cblas_ztrsm with error code %d!\n", err_code);
}
ti_cblas_mem_free(msmc_ptr);
@@ -240,6 +240,11 @@ void cblas_ztrsm(const enum CBLAS_ORDER Order, const enum CBLAS_SIDE Side, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrsv.c b/src/ti/linalg/blasblisacc/src/ti_cblas_cblas_ztrsv.c
index 558a8873098fa7924ce835ed274f00777f8285ae..044c64e7b5e566bfb5d93b7b0ccd80cb39de0e5b 100644 (file)
@@ -169,6 +169,11 @@ void cblas_ztrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ti_cblas_delete_kernel(__K);
+ }
+
ti_cblas_error(err.what(),err.err());
return ;
}
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_initfini.c b/src/ti/linalg/blasblisacc/src/ti_cblas_initfini.c
index 48da1ea5abeb94f410f75bd19e66c4a1a86bf1ca..7ae2b566754e725a45c57421cdf70d1068e19c09 100644 (file)
#endif
ti_cblas_get_kernel(int idx, const char *fname)
{
-#if 0
- if (!ti_cblas_kernel_valid[idx]) {
-#ifdef __cplusplus
- ti_cblas_ocl_kernels[idx] = new Kernel(ti_cblas_ocl_program, fname);
-#else
- cl_int err;
- ti_cblas_ocl_kernels[idx] = clCreateKernel(ti_cblas_ocl_program,fname,&err);
- TI_CBLAS_OCL_CHKERROR("clCreateKernel",err);
-#endif
- ti_cblas_kernel_valid[idx] = 1;
- }
- return ti_cblas_ocl_kernels[idx];
-#else
#ifdef __cplusplus
Kernel* __K;
#else
cl_kernel __K;
#endif
+
#ifdef __cplusplus
- __K = new Kernel(*ti_cblas_ocl_program, fname);
+ __K = new Kernel(*ti_cblas_ocl_program, fname);
#else
- cl_int err;
- __K = clCreateKernel(ti_cblas_ocl_program,fname,&err);
- TI_CBLAS_OCL_CHKERROR("clCreateKernel",err);
+ cl_int err;
+ __K = clCreateKernel(ti_cblas_ocl_program,fname,&err);
+ TI_CBLAS_OCL_CHKERROR("clCreateKernel",err);
#endif
- return __K;
-#endif
+ return __K;
}
#ifdef __cplusplus
diff --git a/src/ti/linalg/blasblisacc/src/ti_cblas_mem_config.c b/src/ti/linalg/blasblisacc/src/ti_cblas_mem_config.c
index ee89893d58d10f04f08abc49a38178c724430ddc..47ff0c029321f8c37d0a21c4f62065f16e1feeb8 100644 (file)
#ifdef TI_CBLAS_DEBUG
printf("No enough memory!\n");
#endif
- return(TICBLAS_ERROR);
+ return(TICBLAS_ERROR_NOMEM);
}
/* Configure L1D if necessary */
@@ -130,7 +130,10 @@ int bli_l3_mem_config(void *msmc_buf, size_t msmc_buf_size, void *ddr_buf, size_
}
if(l1d_cfg_err || l2_cfg_err) {
- return(TICBLAS_ERROR);
+#ifdef TI_CBLAS_DEBUG
+ printf("L1D or L2 configuration error!\n");
+#endif
+ return(TICBLAS_ERROR_MEMCFG);
}
#ifdef TI_CBLAS_DEBUG
@@ -159,7 +162,7 @@ int bli_l3_mem_config(void *msmc_buf, size_t msmc_buf_size, void *ddr_buf, size_
printf("Before calling BLIS, memory descriptor base is 0x%x, used is %d.\n", blas_memdscr_tab[3]->base, blas_memdscr_tab[3]->used);
}
else {
- printf("BLAS init error.\n");
+ printf("BLAS init error with code %d.\n ", blas_ret_err_code);
}
#endif
}
}
if(l1d_cfg_err != LIB_CACHE_SUCCESS) {
- return(-3);
+ return(TICBLAS_ERROR_MEMRECFG);
}
/* configure L2 back if necessary */
}
}
if(l2_cfg_err != LIB_CACHE_SUCCESS) {
- return(-4);
+ return(TICBLAS_ERROR_MEMRECFG);
}
#ifdef TI_CBLAS_DEBUG
diff --git a/src/ti/linalg/blasblisacc/src/wrap_gen/oclgen.pl b/src/ti/linalg/blasblisacc/src/wrap_gen/oclgen.pl
index 74c949da7e0e657d1a474c6cc23ad98146791128..77a49a40eb76383ce835904ba342dcc036d972d6 100755 (executable)
if (index($blas_L3, '.'.$kernel_name.'|') != -1) {
$armcode .= "
if(err_code != TICBLAS_SUCCESS) {
- printf(\"Error code returned by offloaded $trampname is %d\\n.\", err_code);
+ printf(\"Error in offloaded $trampname with error code %d!\\n\", err_code);
}
${namespace}_mem_free(msmc_ptr);
#ifdef __cplusplus
catch (Error err)
{
+ /* delete __K if it has not been deleted */
+ if(__K!=NULL) {
+ ${namespace}_delete_kernel(__K);
+ }
+
${namespace}_error(err.what(),err.err());
return ";
$armcode .= "0" unless ($tramptype =~ /^void$/i);
diff --git a/src/ti/linalg/blis/frame/base/bli_malloc.c b/src/ti/linalg/blis/frame/base/bli_malloc.c
index c9cb628cebb6d48bbf56369fda31da09f5f9f41f..4d0942f7c743740d871d1f0f8a91d185de059a82 100644 (file)
p = _aligned_malloc( ( size_t )size,
( size_t )BLIS_HEAP_ADDR_ALIGN_SIZE );
#elif defined (BLIS_ENABLE_C66X_BUILD)
- p = malloc( ( size_t )size );
+ //p = malloc( ( size_t )size );
+ /* Use LibArch slow permanent memory allocator */
+ p = lib_pmem_salloc(blasGetMemHandle(), size, 0);
#else
r_val = posix_memalign( &p,
( size_t )BLIS_HEAP_ADDR_ALIGN_SIZE,
{
void* p = NULL;
- p = memalign(BLIS_CACHE_LINE_SIZE, ( size_t )size);
+ //p = memalign(BLIS_CACHE_LINE_SIZE, ( size_t )size);
+ p = lib_pmem_salloc(blasGetMemHandle(), size, BLIS_CACHE_LINE_SIZE);
if ( p == NULL ) bli_abort();
__free_ddr( p );
}
#elif defined (BLIS_ENABLE_C66X_BUILD)
- free(p);
+ //free(p);
+ lib_pmem_sfree(blasGetMemHandle(), p);
#elif BLIS_HEAP_ADDR_ALIGN_SIZE == 1 || !defined(_WIN32)
free( p );
#else
index 3af4e4a6716493a81f566ada50c18218e574879d..3e45b5fa36146b6b113e3f533f29582ab50868d1 100644 (file)
||((mem_medium_base == NULL) || (mem_medium_size < BLAS_MEM_SIZE_MEDIUM) )\r
||((mem_slow_base == NULL) || (mem_slow_size < BLAS_MEM_SIZE_SLOW) )\r
) {\r
- return(TICBLAS_ERROR);\r
+ return(TICBLAS_ERROR_NOMEM);\r
}\r
else {\r
lib_smem_vinit(blas_mem_handle, mem_vfast_base, mem_vfast_size);\r
||(pool_mk_mem_L3 == NULL) \r
||(pool_kn_mem_L3 == NULL) \r
||(pool_mn_mem_L3 == NULL) ) {\r
- return(TICBLAS_ERROR); \r
+ return(TICBLAS_ERROR_MEMINIT); \r
} \r
else {\r
bli_mem_init();\r
return(TICBLAS_SUCCESS);\r
}\r
else {\r
- return(TICBLAS_ERROR);\r
+ return(TICBLAS_ERROR_NEW);\r
}\r
}\r
\r
return(TICBLAS_SUCCESS);\r
}\r
else {\r
- return(TICBLAS_ERROR);\r
+ return(TICBLAS_ERROR_DELETE);\r
}\r
}\r
\r
index 611118d3a40651ef45846b0a33924fe3fd1ad246..18b7a1289f8c08fec3ec8e8471ae76b445287a47 100644 (file)
* @name Error Return Codes\r
*/\r
/*@{*/\r
-#define TICBLAS_SUCCESS (0) /**< Success. No error. */\r
-#define TICBLAS_ERROR (-1) /**< Failure. */ \r
+#define TICBLAS_SUCCESS (0) /**< Success. No error. */\r
+#define TICBLAS_ERROR_NOMEM (1) /**< Failure. Provided memory is not enough. */\r
+#define TICBLAS_ERROR_MEMINIT (2) /**< Failure. Memory init error. */\r
+#define TICBLAS_ERROR_MEMCFG (3) /**< Failure. L1D/L2 config error. */\r
+#define TICBLAS_ERROR_NEW (4) /**< Failure. tiCblasNew error. */\r
+#define TICBLAS_ERROR_DELETE (5) /**< Failure. tiCblasDelete error. */\r
+#define TICBLAS_ERROR_MEMRECFG (6) /**< Failure. L1D/L2 reconfig error. */\r
/*@}*/\r
/** @} */\r
\r
/**\r
* @ingroup ti_cblas_api\r
- * @brief Function tiCblasGetSizes() returns the required size of each of the\r
- * memory types defined by the Library Architecture and Framework \r
- * (LibArch)\r
+ * @brief Function tiCblasGetSizes() returns the required size of each of \r
+ * the memory types defined by the Library Architecture and \r
+ * Framework (LibArch).\r
+ *\r
+ * @remarks Memory types are categorized into scratch and permanent memories:\r
+ * - Scratch memory content does not need to be preserved from call to call;\r
+ * - Permanent memory content must be preserved across multiple calls.\r
+ * For example, if an application uses library A and library B, the \r
+ * scratch memory of library A and library B can be shared/overlapped,\r
+ * but their permanent memory must not be shared/overlapped. \r
+ *\r
+ * Scratch and permanent memories are each categorized into four types\r
+ * based on speed:\r
+ * - very fast memory, e.g. L1D;\r
+ * - fast memory, e.g. L2;\r
+ * - medium memory, e.g. L3/MSMC;\r
+ * - slow memory, e.g. DDR.\r
*\r
* @param[out] smem_size_vfast size of very fast shared memory \r
* @param[out] smem_size_fast size of fast shared memory \r
/**\r
* @ingroup ti_cblas_api\r
* @brief Function tiCblasInit() performs heap initialization for CBLAS \r
- * to do memory allocations.\r
+ * to do dynamic memory allocations.\r
* \r
+ * @remarks Users must allocate memories according to the requirements \r
+ * given by tiCblasGetSizes() and pass the base and size to this\r
+ * function. \r
+ *\r
* @remarks tiCblasInit() must NOT be called before tiCblasNew(). \r
*\r
* @param[in] mem_vfast_base base of very fast shared memory \r
index befa9dd53ea97fa4801e9028bb6f66cb480c8da6..c8e409c9107e162530f7895da7b4dc200ba5bfbe 100644 (file)
$(EXE): cgemm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) cgemm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/cgemm_tune/cgemm_tune.c b/src/ti/linalg/tuning/cgemm_tune/cgemm_tune.c
index 358eaefadb5e1e9ab9d3a0d7dcdac9e5e06f5bc2..ad44fc84aa6e0c97510103dfedf7bb1d6d24a031 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int M, int N);
int run_cgemm_dsp_and_arm(int M, int K, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
else {
printf("Measuring DSP and ARM GFLOPS for (M,N,K)=(%d,%d,%d), (m,n,k)=(%d,%d,%d).\n", M,N,K,m,n,k);
cgemm_err = run_cgemm_dsp_and_arm(M, N, K, &t_dsp, &t_arm, &total_GFLOPS_DSP, &total_GFLOPS_ARM);
- //dsym_err = run_dsymm_dsp_and_arm();
if(cgemm_err == -1) { /* out of memory for DSP offloading */
ofld_flag[m][n][k] = NO_OFFLOAD;
time_DSP = t_dsp;
time_ARM = t_arm;
if (cgemm_err == 0){
- //if(total_GFLOPS_DSP - total_GFLOPS_ARM > 1.0) {
if(DSP_FASTER_THAN_ARM(t_dsp,t_arm)) {
ofld_flag[m][n][k] = OFFLOAD;
printf("Offloading to DSP for this point. Skipping next point.\n");
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_cgemm_dsp_and_arm(int M, int K, int N, float *time_dsp, float *time_arm,
@@ -177,7 +174,7 @@ int run_cgemm_dsp_and_arm(int M, int K, int N, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)M*(float)N*(float)K;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
@@ -232,7 +229,6 @@ int run_cgemm_dsp_and_arm(int M, int K, int N, float *time_dsp, float *time_arm,
/*------------------------------------------------------------------------
* Time DSP cgemm
*-----------------------------------------------------------------------*/
- //ti_cblas_offload_config("001"); /* force offloading level 3 to DSP */
TI_CBLAS_L3_OFFLOAD = 1;
tick();
@@ -247,7 +243,6 @@ int run_cgemm_dsp_and_arm(int M, int K, int N, float *time_dsp, float *time_arm,
/*-------------------------------------------------------------------------
* Time ARM cgemm
*------------------------------------------------------------------------*/
- //ti_cblas_offload_config("000"); /* force no offloading */
TI_CBLAS_L3_OFFLOAD = 0;
tick();
@@ -258,13 +253,11 @@ int run_cgemm_dsp_and_arm(int M, int K, int N, float *time_dsp, float *time_arm,
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- //return check_results(Cdsp, Carm, M, N);
- err_code += check_results(Cdsp, Carm, M, N);
+ num_errors += comp_matrix_complex(Cdsp, Carm, M, N);
__free_ddr(A);
__free_ddr(B);
@@ -277,39 +270,7 @@ int run_cgemm_dsp_and_arm(int M, int K, int N, float *time_dsp, float *time_arm,
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int M, int N)
-{
- int i;
- const float EPISILON = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<M*N; i++)
- {
- float delta = cabs(C1[i]) - cabs(C2[i]);
-
- if (delta > EPISILON*cabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %f <==> %f\n", i, cabs(C1[i]), cabs(C2[i]));
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
+ return num_errors;
+} /* run_cgemm_dsp_and_arm */
diff --git a/src/ti/linalg/tuning/common/print_header.c b/src/ti/linalg/tuning/common/print_header.c
index 41333431c957a6bac5db56308670a4a06a0d5e26..e9606540a28031e8d71f453d03ef40a6a89d52e8 100644 (file)
" * THE POSSIBILITY OF SUCH DAMAGE. \n"
" *****************************************************************************/ \n"
"\n"
-"#include \"ti_cblas.h\"\n\n");
+"#include \"ti_cblas_acc.h\"\n\n");
} /* print_file_header */
index fcf71a2d31ab50bd0e42c9f4dfe06947756fc7bf..226160938cb3d79b266d67cefb8fdbef207a7bcd 100644 (file)
*****************************************************************************/
#include <stdlib.h>
#include <stdio.h>
+#include <math.h>
+#include <complex.h>
-#define TUNING_START_SIZE_SQUARE_MATRIX 16
-#define TUNING_START_SIZE_RECTAN_MATRIX 64
-#define NUM_MATRIX_SIZE_TO_BENCHMARK 4 //16
+#define TUNING_START_SIZE_RECTAN_MATRIX 8
+#define NUM_MATRIX_SIZE_TO_BENCHMARK 16
#define HAS_MEMORY 1
#define NO_MEMORY 0
#define OFFLOAD 1
extern void print_file_header(FILE *fp_tbl);
+extern int comp_matrix_complex(const float complex *C1, const float complex *C2, int M, int N);
+extern int comp_matrix_double(const double *C1, const double *C2, int M, int N);
+extern int comp_matrix(const float *C1, const float *C2, int M, int N);
index bb5bf0b6fd8dbacc309712dc4fd3bac39aaabf8e..7aba22080681cd634a3a58ac9a9320681a390f91 100644 (file)
$(EXE): csyrk_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) csyrk_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/csyrk_tune/csyrk_tune.c b/src/ti/linalg/tuning/csyrk_tune/csyrk_tune.c
index 09b4b5bfb466c505229430ed5a28f2e8cefa9400..e18826e7bfaa957aef9a9ec31bfd40eb08bac5b9 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int N, int K);
int run_csyrk_dsp_and_arm(int N, int K, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_csyrk_dsp_and_arm(int N, int K, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm)
float operation_count = 2.0*(float)N*(float)K;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Cdsp, Carm, N, N);
+ num_errors += comp_matrix_complex(Cdsp, Carm, N, N);
__free_ddr(A);
__free_ddr(Cdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int M, int N)
-{
- int i;
- const float EPISILON = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<M*N; i++)
- {
- float delta = cabs(C1[i]) - cabs(C2[i]);
-
- if (delta > EPISILON*cabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %f <==> %f\n", i, cabs(C1[i]), cabs(C2[i]));
- }
+ return num_errors;
+} /* run_csyrk_dsp_and_arm */
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
index 3cd80f98224548f0ce94c9780182cece31fd84d1..88817a34cb996bd35ee9f7a3ea91ba656afcda25 100644 (file)
$(EXE): ctrmm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) ctrmm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/ctrmm_tune/ctrmm_tune.c b/src/ti/linalg/tuning/ctrmm_tune/ctrmm_tune.c
index 125b7fcf4f9c8a80d5336a3cfcd30886e550d43c..fa35c925090ada456700961be28e55f480c60ea7 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int M, int N);
int run_ctrmm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
time_DSP = t_dsp;
time_ARM = t_arm;
if (ctrmm_err == 0){
- //if(total_GFLOPS_DSP - total_GFLOPS_ARM > 1.0) {
if(DSP_FASTER_THAN_ARM(t_dsp,t_arm)) {
ofld_flag[m][n] = OFFLOAD;
printf("Offloading to DSP for this point. Skipping next point.\n");
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_ctrmm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm)
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
{
Bdsp[i] = Barm[i] = (float)rand()/RAND_MAX + (float)rand()/RAND_MAX * I;
}
-/*
- if(M==8 && N==8) {
- FILE *file_a = fopen("mat_a.dat","w");
- FILE *file_b = fopen("mat_b.dat","w");
- FILE *file_c = fopen("mat_c.dat","w");
-
- for(i=0; i < size_A; ++i) fprintf(file_a, "%1.10e\t%1.10e\n",crealf(A[i]), cimagf(A[i]));
- for(i=0; i < size_B; ++i) fprintf(file_b, "%1.10e\t%1.10e\n",crealf(Barm[i]), cimagf(Barm[i]));
- for(i=0; i < size_B; ++i) fprintf(file_c, "%1.10e\t%1.10e\n",crealf(Bdsp[i]), cimagf(Bdsp[i]));
-
- fclose(file_a);
- fclose(file_b);
- fclose(file_c);
- }
-*/
+
int lda = (side == CblasLeft) ? M : N;
int ldb = M;
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += comp_matrix_complex(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int M, int N)
-{
- int i;
- const float EPISILON = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<M*N; i++)
- {
- float delta = cabs(C1[i]) - cabs(C2[i]);
-
- if (delta > EPISILON*cabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %f <==> %f\n", i, cabs(C1[i]), cabs(C2[i]));
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_ctrmm_dsp_and_arm */
index 79956113708449f8e371b10b5e4a967c12e2ef28..d0dac9265f4cdb55906d91bbf2862f70c4c3c676 100644 (file)
$(EXE): ctrsm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) ctrsm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/ctrsm_tune/ctrsm_tune.c b/src/ti/linalg/tuning/ctrsm_tune/ctrsm_tune.c
index abf02cfed8931345b15589ba4c8323b753fbafdd..39c7ded9c5790e205ebb6cb5650531d251168abe 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int M, int N);
int run_ctrsm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_ctrsm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm)
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
A[j*lda+k] = (float)rand()/RAND_MAX + (float)rand()/RAND_MAX * I;
}
}
-// for (i = 0; i < size_A; ++i)
-// {
-// A[i] = (float)rand()/RAND_MAX + (float)rand()/RAND_MAX * I;
-// }
for (i = 0; i < size_B; ++i)
{
Bdsp[i] = Barm[i] = (float)rand()/RAND_MAX + (float)rand()/RAND_MAX * I;
}
-/*
- if(M==8 && N==8) {
- FILE *file_a = fopen("mat_a.dat","w");
- FILE *file_b = fopen("mat_b.dat","w");
- FILE *file_c = fopen("mat_c.dat","w");
-
- for(i=0; i < size_A; ++i) fprintf(file_a, "%1.10e\t%1.10e\n",crealf(A[i]), cimagf(A[i]));
- for(i=0; i < size_B; ++i) fprintf(file_b, "%1.10e\t%1.10e\n",crealf(Barm[i]), cimagf(Barm[i]));
- for(i=0; i < size_B; ++i) fprintf(file_c, "%1.10e\t%1.10e\n",crealf(Bdsp[i]), cimagf(Bdsp[i]));
-
- fclose(file_a);
- fclose(file_b);
- fclose(file_c);
- }
-*/
+
/*============ BLAS tuning: running on DSP and then on ARM =============*/
/*------------------------------------------------------------------------
* Time DSP ctrsm
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
if(M==8 && N==8) {
FILE *file_a = fopen("mat_a2.dat","w");
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += comp_matrix_complex(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float complex *C1, const float complex *C2, int M, int N)
-{
- int i;
- float norm, delta;
- const float EPISILON = 1e-5;
- const float DELTA = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<M*N; i++)
- {
- delta = cabs(C1[i]) - cabs(C2[i]);
- norm = cabs(C1[i]);
- if(norm < cabs(C2[i]))
- norm = cabs(C2[i]);
-
- if (delta > EPISILON*norm && delta>DELTA)
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %f <==> %f\n", i, cabs(C1[i]), cabs(C2[i]));
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
+ return num_errors;
+} /* run_ctrsm_dsp_and_arm */
index 1917a037eb09ddd38fe093b1c89da7d023269b3f..19194a8b4a9b61f68acdbc2e06b5855b09b3f7fc 100644 (file)
$(EXE): dgemm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) dgemm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/dgemm_tune/dgemm_tune.c b/src/ti/linalg/tuning/dgemm_tune/dgemm_tune.c
index d4b043fdfa1115b85a6cd5866221c6bd8c9b4532..9a0114064b5e0ae02b6ddf46ca3748ed9750a98c 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int M, int N);
int run_dgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
else {
printf("Measuring DSP and ARM GFLOPS for (M,N,K)=(%d,%d,%d), (m,n,k)=(%d,%d,%d).\n", M,N,K,m,n,k);
dgemm_err = run_dgemm_dsp_and_arm(M, N, K, &t_dsp, &t_arm, &total_GFLOPS_DSP, &total_GFLOPS_ARM);
- //dsym_err = run_dsymm_dsp_and_arm();
if(dgemm_err == -1) { /* out of memory for DSP offloading */
ofld_flag[m][n][k] = NO_OFFLOAD;
time_DSP = t_dsp;
time_ARM = t_arm;
if (dgemm_err == 0){
- //if(total_GFLOPS_DSP - total_GFLOPS_ARM > 1.0) {
if(DSP_FASTER_THAN_ARM(t_dsp,t_arm)) {
ofld_flag[m][n][k] = OFFLOAD;
printf("Offloading to DSP for this point. Skipping next point.\n");
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_dgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
@@ -175,7 +172,7 @@ int run_dgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
float operation_count = 2.0*(double)M*(double)N*(double)K;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
@@ -205,8 +202,8 @@ int run_dgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
/*-------------------------------------------------------------------------
* Initialize matrices
*------------------------------------------------------------------------*/
- for (i = 0; i < (long long)M*K; ++i) A[i] = (double)rand()/RAND_MAX;// (double)(rand() % 5 + 1);
- for (i = 0; i < (long long)K*N; ++i) B[i] = (double)rand()/RAND_MAX;// (double)(rand() % 5 + 1);
+ for (i = 0; i < (long long)M*K; ++i) A[i] = (double)rand()/RAND_MAX;
+ for (i = 0; i < (long long)K*N; ++i) B[i] = (double)rand()/RAND_MAX;
for (i = 0; i < (long long)M*N; ++i) Carm[i] = Cdsp[i] = 0;
int lda = ((order == CblasColMajor && transA == CblasNoTrans) ||
@@ -234,17 +231,7 @@ int run_dgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
gflops_DSP = operation_count/time_secs*1e-9;
total_GFLOPS_DSP += gflops_DSP;
}
-/*
- if(M==4096 && K==256 && N==16) {
- FILE *file_a = fopen("mat_a.dat","w");
- FILE *file_b = fopen("mat_b.dat","w");
- FILE *file_c = fopen("mat_c.dat","w");
-
- for(i=0; i < M*K; ++i) fprintf(file_a, "%1.10e\n",A[i]);
- for(i=0; i < K*N; ++i) fprintf(file_b, "%1.10e\n",B[i]);
- for(i=0; i < M*N; ++i) fprintf(file_c, "%1.10e\n",Cdsp[i]);
- }
-*/
+
/*-------------------------------------------------------------------------
* Time ARM dgemm
*------------------------------------------------------------------------*/
@@ -259,14 +246,12 @@ int run_dgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
fflush(stdout);
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- //return check_results(Cdsp, Carm, M, N);
- err_code += check_results(Cdsp, Carm, M, N);
+ num_errors += comp_matrix_double(Cdsp, Carm, M, N);
__free_ddr(A);
__free_ddr(B);
@@ -279,39 +264,6 @@ int run_dgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
*time_dsp = total_time_dsp / (double)NUM_TEST_RUN;
*time_arm = total_time_arm / (double)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int M, int N)
-{
- int i;
- const double EPISILON = 1e-10;
- //const double EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- double delta = fabs(C1[i] - C2[i]);
- if (delta > EPISILON*fabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_dgemm_dsp_and_arm */
index 36fc37df7b19369b755b45479f54e7d2afdb8079..078241b5a4cd396ccfb54333981ce71153eb3e9c 100644 (file)
$(EXE): dsyrk_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) dsyrk_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/dsyrk_tune/dsyrk_tune.c b/src/ti/linalg/tuning/dsyrk_tune/dsyrk_tune.c
index e19c26fadda468bdcb879a0d8fd3baf23072871d..ccd6893da57d6a769fb4bafbf09e8e28db243861 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int N, int K);
int run_dsyrk_dsp_and_arm(int N, int K, double *time_dsp, double *time_arm,
double *gflops_dsp, double *gflops_arm);
else {
printf("Measuring DSP and ARM GFLOPS for (N,K)=(%d,%d), (n,k)=(%d,%d).\n", N,K,n,k);
dsyrk_err = run_dsyrk_dsp_and_arm(N, K, &t_dsp, &t_arm, &total_GFLOPS_DSP, &total_GFLOPS_ARM);
- //dsym_err = run_dsymm_dsp_and_arm();
if(dsyrk_err == -1) { /* out of memory for DSP offloading */
ofld_flag[n][k] = NO_OFFLOAD;
time_DSP = t_dsp;
time_ARM = t_arm;
if (dsyrk_err == 0){
- //if(total_GFLOPS_DSP - total_GFLOPS_ARM > 1.0) {
if(DSP_FASTER_THAN_ARM(t_dsp,t_arm)) {
ofld_flag[n][k] = OFFLOAD;
printf("Offloading to DSP for this point. Skipping next point.\n");
double operation_count = 2.0*(double)N*(double)K;
double total_GFLOPS_DSP = 0.0f;
double total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
/*-------------------------------------------------------------------------
* Time ARM dsyrk
*------------------------------------------------------------------------*/
- //ti_cblas_offload_config("000"); /* force no offloading */
- //printf("Running on ARM.\n");
TI_CBLAS_L3_OFFLOAD = 0;
tick();
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
fflush(stdout);
if(N==8 && K==8) {
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Cdsp, Carm, N, N);
+ num_errors += comp_matrix_double(Cdsp, Carm, N, N);
__free_ddr(A);
__free_ddr(Cdsp);
*time_dsp = total_time_dsp / (double)NUM_TEST_RUN;
*time_arm = total_time_arm / (double)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int M, int N)
-{
- int i;
- const double EPISILON = 1e-10;
- //const double EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- double delta = fabs(C1[i] - C2[i]);
- if (delta > EPISILON*fabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_dsyrk_dsp_and_arm */
index 33377d36e95d5c5fee929e0a9896066f6935258d..750f349bd1b0ff44fca320971de59198bcc20da8 100644 (file)
$(EXE): dtrmm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) dtrmm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/dtrmm_tune/dtrmm_tune.c b/src/ti/linalg/tuning/dtrmm_tune/dtrmm_tune.c
index 7293c67093b8cec5b98f5a84cc57dcd8b31d358b..ecda5ed9e656825ab251270da41beb682735abd0 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int M, int N);
int run_dtrmm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_dtrmm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += comp_matrix_double(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int M, int N)
-{
- int i;
- const double EPISILON = 1e-5;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- double delta = fabs(C1[i] - C2[i]);
-
- if (delta > EPISILON*fabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_dtrmm_dsp_and_arm */
index 68687ef4a9dbeae5a24883fcde73ec5327389307..7672c21c6c9eb180b41813bff60fd649bfad6cf8 100644 (file)
$(EXE): dtrsm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) dtrsm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/dtrsm_tune/dtrsm_tune.c b/src/ti/linalg/tuning/dtrsm_tune/dtrsm_tune.c
index aec15f1a3dc3e203043e229d21ef0831182c6063..d598f6923821c552d10cc70dcb6e29df5cd374e1 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int M, int N);
int run_dtrsm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_dtrsm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
*------------------------------------------------------------------------*/
int lda = (side == CblasLeft) ? M : N;
int ldb = M;
-// for (i = 0; i < size_A; ++i) A[i] = (double)rand()/RAND_MAX;
for(j=0;j<lda;j++)
{
for(k=0;k<lda;k++)
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += comp_matrix_double(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const double *C1, const double *C2, int M, int N)
-{
- int i;
- const double EPISILON = 1e-5;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- double delta = fabs(C1[i] - C2[i]);
-
- if (delta > EPISILON*fabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_dtrsm_dsp_and_arm */
index ea6f25acd974acec1a43aa1db90942009fe132a4..8d1dd3223c3cf29c6f76cb59f1cb875818e24371 100644 (file)
LD_FLAGS=-L$(TARGET_ROOTDIR)/lib -L$(TARGET_ROOTDIR)/usr/lib -Wl,-rpath-link,$(TARGET_ROOTDIR)/lib -Wl,-rpath-link,$(TARGET_ROOTDIR)/usr/lib
BLASLIB = $(LIB_DIR)libcblas_armplusdsp.a -lOpenCL -locl_util -lstdc++ -lrt -lm -lgomp -lpthread
LAPACKLIB = $(LIB_DIR)libcblaswr.a $(LIB_DIR)liblapack.a $(LIB_DIR)libf2c.a $(LIB_DIR)libcblas_armplusdsp.a -lOpenCL -locl_util -lstdc++ -lrt -lm -lgomp -lpthread
-TUNE_UTILS = ../common/print_header.o
-TUNE_UTILS_OBJ = print_header.o
+TUNE_UTILS = ../common/print_header.o ../common/comp_matrix.o
+TUNE_UTILS_OBJ = print_header.o comp_matrix.o
%.o: %.c
@$(CC) -c $(CFLAGS) $<
index ba82c7650d470782dc27fc535644b24d6f444a2f..e0a54175fa2ef479ac89eb0b5d515e551282e2ff 100644 (file)
$(EXE): sgemm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) sgemm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/sgemm_tune/sgemm_tune.c b/src/ti/linalg/tuning/sgemm_tune/sgemm_tune.c
index 7e11ea8181fc1c582907e546940b5af294331099..6c85a02e7aa818bc57c3981a7a4c1adc51361dbf 100644 (file)
float alpha = 0.7;
float beta = 0.3;
enum CBLAS_ORDER order = CblasColMajor;
-//enum CBLAS_ORDER order = CblasRowMajor;
enum CBLAS_TRANSPOSE transA = CblasNoTrans;
enum CBLAS_TRANSPOSE transB = CblasNoTrans;
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int M, int N);
int run_sgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_sgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
@@ -175,7 +173,7 @@ int run_sgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)M*(float)N*(float)K;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
@@ -221,8 +219,6 @@ int run_sgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
/*------------------------------------------------------------------------
* Time DSP sgemm
*-----------------------------------------------------------------------*/
- //ti_cblas_offload_config("001"); /* force offloading level 3 to DSP */
- //printf("Running on DSP.\n");
TI_CBLAS_L3_OFFLOAD = 1;
tick();
@@ -233,22 +229,10 @@ int run_sgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
gflops_DSP = operation_count/time_secs*1e-9;
total_GFLOPS_DSP += gflops_DSP;
}
-/*
- if(M==4096 && K==256 && N==16) {
- FILE *file_a = fopen("mat_a.dat","w");
- FILE *file_b = fopen("mat_b.dat","w");
- FILE *file_c = fopen("mat_c.dat","w");
-
- for(i=0; i < M*K; ++i) fprintf(file_a, "%1.10e\n",A[i]);
- for(i=0; i < K*N; ++i) fprintf(file_b, "%1.10e\n",B[i]);
- for(i=0; i < M*N; ++i) fprintf(file_c, "%1.10e\n",Cdsp[i]);
- }
-*/
+
/*-------------------------------------------------------------------------
* Time ARM sgemm
*------------------------------------------------------------------------*/
- //ti_cblas_offload_config("000"); /* force no offloading */
- //printf("Running on ARM.\n");
TI_CBLAS_L3_OFFLOAD = 0;
tick();
@@ -259,14 +243,12 @@ int run_sgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
fflush(stdout);
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- //return check_results(Cdsp, Carm, M, N);
- err_code += check_results(Cdsp, Carm, M, N);
+ num_errors += comp_matrix(Cdsp, Carm, M, N);
__free_ddr(A);
__free_ddr(B);
@@ -279,40 +261,5 @@ int run_sgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int M, int N)
-{
- int i;
- const float EPISILON = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- float delta = fabs(C1[i] - C2[i]);
-
- if (delta > EPISILON*fabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
-
-
+ return num_errors;
+} /* run_sgemm_dsp_and_arm */
index 1bcbd5f376dd6ff1890183e9552d6f290ad40ab6..b813669562743b88ebe5fcd44e78ba77ef1178bf 100644 (file)
$(EXE): ssyrk_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) ssyrk_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/ssyrk_tune/ssyrk_tune.c b/src/ti/linalg/tuning/ssyrk_tune/ssyrk_tune.c
index 14913da95b745feb5a91324369546d8c23a1655c..50b623a11d9b9a2d3746a6aba901e37253fa1f56 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int N, int K);
int run_ssyrk_dsp_and_arm(int N, int K, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
if( (n>0 && ofld_flag[n-1][k]==OFFLOAD)
||(k>0 && ofld_flag[n][k-1]==OFFLOAD) ) {
ofld_flag[n][k] = OFFLOAD;
- mem_flag[n][k] = HAS_MEMORY; // to avoid error
+ mem_flag[n][k] = HAS_MEMORY; /* to avoid error */
time_DSP = -1.0;
time_ARM = -1.0;
printf("Offloading. Skipping (N,K)=(%d,%d), (n,k)=(%d,%d).\n", N,K,n,k);
else {
printf("Measuring DSP and ARM GFLOPS for (N,K)=(%d,%d), (n,k)=(%d,%d).\n", N,K,n,k);
ssyrk_err = run_ssyrk_dsp_and_arm(N, K, &t_dsp, &t_arm, &total_GFLOPS_DSP, &total_GFLOPS_ARM);
- //dsym_err = run_dsymm_dsp_and_arm();
if(ssyrk_err == -1) { /* out of memory for DSP offloading */
ofld_flag[n][k] = NO_OFFLOAD;
time_DSP = t_dsp;
time_ARM = t_arm;
if (ssyrk_err == 0){
- //if(total_GFLOPS_DSP - total_GFLOPS_ARM > 1.0) {
if(DSP_FASTER_THAN_ARM(t_dsp,t_arm)) {
ofld_flag[n][k] = OFFLOAD;
printf("Offloading to DSP for this point. Skipping next point.\n");
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_ssyrk_dsp_and_arm(int N, int K, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)N*(float)K;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
||(size_C*sizeof(float)>(long long)0x0ffffffff) ) {
return (-1);
}
-
+
for (iter = 0; iter <= NUM_TEST_RUN; iter++)
{
/*-------------------------------------------------------------------------
/*-------------------------------------------------------------------------
* Time ARM ssyrk
*------------------------------------------------------------------------*/
- //ti_cblas_offload_config("000"); /* force no offloading */
- //printf("Running on ARM.\n");
TI_CBLAS_L3_OFFLOAD = 0;
tick();
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
fflush(stdout);
-
+
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Cdsp, Carm, N, N);
+ num_errors += comp_matrix(Cdsp, Carm, N, N);
__free_ddr(A);
__free_ddr(Cdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int M, int N)
-{
- int i;
- const float EPISILON = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- float delta = fabs(C1[i] - C2[i]);
- if (delta > EPISILON*fabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_ssyrk_dsp_and_arm */
index 1569f89e29ab98bc82cec68f55cf2c4b0addf5f2..dfbde2a68a00a918309dbe34d6cf330552a2e802 100644 (file)
$(EXE): strmm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) strmm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/strmm_tune/strmm_tune.c b/src/ti/linalg/tuning/strmm_tune/strmm_tune.c
index 2e25e0bf820c3e64c426c023694b8fd3fbc7b4cb..242da72976d7f7647e354828f60b93514a2728ba 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int M, int N);
int run_strmm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
if( (m>0 && ofld_flag[m-1][n]==OFFLOAD)
||(n>0 && ofld_flag[m][n-1]==OFFLOAD) ) {
ofld_flag[m][n] = OFFLOAD;
- mem_flag[m][n] = HAS_MEMORY; // to avoid error
+ mem_flag[m][n] = HAS_MEMORY; /* to avoid error */
time_DSP = -1.0;
time_ARM = -1.0;
printf("Offloading. Skipping (M,N)=(%d,%d), (m,n)=(%d,%d).\n", M,N,m,n);
time_DSP = t_dsp;
time_ARM = t_arm;
if (strmm_err == 0){
- //if(total_GFLOPS_DSP - total_GFLOPS_ARM > 1.0) {
if(DSP_FASTER_THAN_ARM(t_dsp,t_arm)) {
ofld_flag[m][n] = OFFLOAD;
printf("Offloading to DSP for this point. Skipping next point.\n");
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_strmm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
- if(side == CblasLeft) {
- size_A = (long long)M*(long long)M;
- }
- else {
- size_A = (long long)N*(long long)N;
- }
- size_B = (long long)M*(long long)N;
+ if(side == CblasLeft) {
+ size_A = (long long)M*(long long)M;
+ }
+ else {
+ size_A = (long long)N*(long long)N;
+ }
+ size_B = (long long)M*(long long)N;
for (iter = 0; iter <= NUM_TEST_RUN; iter++)
{
/*-------------------------------------------------------------------------
*------------------------------------------------------------------------*/
for (i = 0; i < size_A; ++i) A[i] = (float)rand()/RAND_MAX;
for (i = 0; i < (long long)M*N; ++i) Bdsp[i] = Barm[i] = (float)rand()/RAND_MAX;
- //for (i = 0; i < (long long)M*N; ++i) Barm[i] = Bdsp[i];
-/*
- if(M==8 && N==8) {
- FILE *file_a = fopen("mat_a.dat","w");
- FILE *file_b = fopen("mat_b.dat","w");
- FILE *file_c = fopen("mat_c.dat","w");
-
- for(i=0; i < size_A; ++i) fprintf(file_a, "%1.10e\n",A[i]);
- for(i=0; i < M*N; ++i) fprintf(file_b, "%1.10e\n",Barm[i]);
- for(i=0; i < M*N; ++i) fprintf(file_c, "%1.10e\n",Bdsp[i]);
-
- fclose(file_a);
- fclose(file_b);
- fclose(file_c);
- }
-*/
+
int lda = (side == CblasLeft) ? M : N;
int ldb = M;
gflops_DSP = operation_count/time_secs*1e-9;
total_GFLOPS_DSP += gflops_DSP;
}
-
+
/*-------------------------------------------------------------------------
* Time ARM strmm
*------------------------------------------------------------------------*/
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
if(M==8 && N==8) {
FILE *file_a = fopen("mat_a2.dat","w");
for(i=0; i < size_A; ++i) fprintf(file_a, "%1.10e\n",A[i]);
for(i=0; i < M*N; ++i) fprintf(file_b, "%1.10e\n",Barm[i]);
for(i=0; i < M*N; ++i) fprintf(file_c, "%1.10e\n",Bdsp[i]);
-
- fclose(file_a);
- fclose(file_b);
- fclose(file_c);
+
+ fclose(file_a);
+ fclose(file_b);
+ fclose(file_c);
}
-
+
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += comp_matrix(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int M, int N)
-{
- int i;
- const float EPISILON = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- float delta = fabs(C1[i] - C2[i]);
-
- if (delta > EPISILON*fabs(C1[i]))
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_strmm_dsp_and_arm */
index 987fc5e8ad8916bcfedc22a47c03880b95fd104b..fccf1ac92fa5304d7964dbcb82030584cf5e29e8 100644 (file)
$(EXE): strsm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) strsm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/strsm_tune/strsm_tune.c b/src/ti/linalg/tuning/strsm_tune/strsm_tune.c
index 0dd16bc7c11c6f6bff23854c4342d99c79226dd4..106a0ab08342522b117208881c7303d4503f0f01 100644 (file)
/*-----------------------------------------------------------------------------
* Prototypes
*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int M, int N);
int run_strsm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float *gflops_dsp, float *gflops_arm);
time_DSP = t_dsp;
time_ARM = t_arm;
if (strsm_err == 0){
- //if(total_GFLOPS_DSP - total_GFLOPS_ARM > 1.0) {
if(DSP_FASTER_THAN_ARM(t_dsp,t_arm)) {
ofld_flag[m][n] = OFFLOAD;
printf("Offloading to DSP for this point. Skipping next point.\n");
fclose(fp_tbl);
return 0;
-}
+} /* main */
int run_strsm_dsp_and_arm(int M, int N, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
- if(side == CblasLeft) {
- size_A = (long long)M*(long long)M;
- }
- else {
- size_A = (long long)N*(long long)N;
- }
- size_B = (long long)M*(long long)N;
-
+ if(side == CblasLeft) {
+ size_A = (long long)M*(long long)M;
+ }
+ else {
+ size_A = (long long)N*(long long)N;
+ }
+ size_B = (long long)M*(long long)N;
+
for (iter = 0; iter <= NUM_TEST_RUN; iter++)
{
/*-------------------------------------------------------------------------
*------------------------------------------------------------------------*/
int lda = (side == CblasLeft) ? M : N;
int ldb = M;
- //for (i = 0; i < size_A; ++i) A[i] = (float)rand()/RAND_MAX;
- for(j=0;j<lda;j++)
- {
- for(k=0;k<lda;k++)
- {
- if (j==k)
- A[j*lda+k] = 1.0+j;
+ for(j=0;j<lda;j++)
+ {
+ for(k=0;k<lda;k++)
+ {
+ if (j==k)
+ A[j*lda+k] = 1.0+j;
else if (j<k)
- A[j*lda+k] = 0.0;
- else
- A[j*lda+k] = (float)rand()/RAND_MAX;
- }
- }
+ A[j*lda+k] = 0.0;
+ else
+ A[j*lda+k] = (float)rand()/RAND_MAX;
+ }
+ }
for (i = 0; i < (long long)M*N; ++i) Bdsp[i] = Barm[i] = (float)rand()/RAND_MAX;
-/*
- if(M==256 && N==128) {
- FILE *file_a = fopen("mat_a.dat","w");
- FILE *file_b = fopen("mat_b.dat","w");
- FILE *file_c = fopen("mat_c.dat","w");
-
- for(i=0; i < size_A; ++i) fprintf(file_a, "%1.10e\n",A[i]);
- for(i=0; i < M*N; ++i) fprintf(file_b, "%1.10e\n",Barm[i]);
- for(i=0; i < M*N; ++i) fprintf(file_c, "%1.10e\n",Bdsp[i]);
-
- fclose(file_a);
- fclose(file_b);
- fclose(file_c);
- }
-*/
+
/*============ BLAS tuning: running on DSP and then on ARM =============*/
/*------------------------------------------------------------------------
* Time DSP strsm
gflops_DSP = operation_count/time_secs*1e-9;
total_GFLOPS_DSP += gflops_DSP;
}
-
+
/*-------------------------------------------------------------------------
* Time ARM strsm
*------------------------------------------------------------------------*/
gflops_ARM = operation_count/time_secs*1e-9;
total_GFLOPS_ARM += gflops_ARM;
}
- //printf(" %6.3f %6.3f %9.6fs %9.6fs\n", gflops_DSP, gflops_ARM, time_dsp, time_arm);
if(M==256 && N==128) {
FILE *file_a2 = fopen("mat_a2.dat","w");
for(i=0; i < size_A; ++i) fprintf(file_a2, "%1.10e\n",A[i]);
for(i=0; i < M*N; ++i) fprintf(file_b2, "%1.10e\n",Barm[i]);
for(i=0; i < M*N; ++i) fprintf(file_c2, "%1.10e\n",Bdsp[i]);
-
- fclose(file_a2);
- fclose(file_b2);
- fclose(file_c2);
+
+ fclose(file_a2);
+ fclose(file_b2);
+ fclose(file_c2);
}
-
+
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += comp_matrix(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
-}
-
-
-/*-----------------------------------------------------------------------------
-* check_results
-*----------------------------------------------------------------------------*/
-int check_results(const float *C1, const float *C2, int M, int N)
-{
- int i;
- float norm, delta;
- const float EPISILON = 1e-2;
- const float DELTA = 1e-5;
- //const float EPISILON = 1e-200;
- const int NERRORS = 5;
- int num_errors = 0;
-
- for (i=0; i<(long)M*N; i++)
- {
- delta = fabs(C1[i] - C2[i]);
- norm = fabs(C1[i]);
- if(norm < fabs(C2[i]))
- norm = fabs(C2[i]);
-
- if (delta > EPISILON*norm && delta>DELTA)
- if ((num_errors += 1) < NERRORS)
- printf("Error [elem:%d]: %e <==> %e\n", i, C1[i], C2[i]);
- }
-
- if (num_errors > 0)
- {
- printf("FAIL with %d errors!\n", num_errors);
- return num_errors;
- }
- else
- {
- //printf("PASS!\n");
- return 0;
- }
-}
-
+ return num_errors;
+} /* run_strsm_dsp_and_arm */
index 43545bfba285f9aab5f44d90e3bcdc76885eb241..6aeb6e7cbde0dab13f6e672f4ba198d2387b27ba 100644 (file)
$(EXE): zgemm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) zgemm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/zgemm_tune/zgemm_tune.c b/src/ti/linalg/tuning/zgemm_tune/zgemm_tune.c
index 5d8cee50ab7a7fea9b42dc40c7b73f90eaeeb4e1..fe15243ad343d45bd37c9c9e8bbaf06e434be7db 100644 (file)
@@ -175,7 +175,7 @@ int run_zgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
float operation_count = 2.0*(float)M*(float)N*(float)K;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
@@ -262,7 +262,7 @@ int run_zgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
* Verify Results
*------------------------------------------------------------------------*/
//return check_results(Cdsp, Carm, M, N);
- err_code += check_results(Cdsp, Carm, M, N);
+ num_errors += check_results(Cdsp, Carm, M, N);
__free_ddr(A);
__free_ddr(B);
@@ -275,7 +275,7 @@ int run_zgemm_dsp_and_arm(int M, int N, int K, float *time_dsp, float *time_arm,
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
+ return num_errors;
}
/*-----------------------------------------------------------------------------
index 3513b244a2cd8eddec153c906f3b9ba9687f803a..8601b48e0fb2465884df3448912f8c02fd96429c 100644 (file)
$(EXE): zsyrk_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) zsyrk_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/zsyrk_tune/zsyrk_tune.c b/src/ti/linalg/tuning/zsyrk_tune/zsyrk_tune.c
index 5fee5e1efda02f272bf7c11118c6f84144e48c23..a4c193a678ecf10d8cafebe28c21bbea86ea016d 100644 (file)
float operation_count = 2.0*(float)N*(float)K;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Cdsp, Carm, N, N);
+ num_errors += check_results(Cdsp, Carm, N, N);
__free_ddr(A);
__free_ddr(Cdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
+ return num_errors;
}
index ad9d748e551954f904f3320c681d6f2d294c7d99..5a50ce6c21d73f5f0207d61e0a528c3cc8a2cc8a 100644 (file)
$(EXE): ztrmm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) ztrmm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/ztrmm_tune/ztrmm_tune.c b/src/ti/linalg/tuning/ztrmm_tune/ztrmm_tune.c
index 0d261ddbc2c5bdbc31b4dbc2548a01c400bf3832..7433debc4532cd28bb0c46bf34e65d02acb39728 100644 (file)
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += check_results(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
+ return num_errors;
}
index 91ce915c5b2d64c52eb4a2363418aabb3c9c5487..04e9914c18ddc990e73f1f17659417029e78deb1 100644 (file)
$(EXE): ztrsm_tune.o $(TUNE_UTILS)
$(CC) $(CFLAGS) ztrsm_tune.o $(TUNE_UTILS_OBJ) $(BLASLIB) -o $@
-tune: $(EXE)
+tune:
./$(EXE);
\ No newline at end of file
diff --git a/src/ti/linalg/tuning/ztrsm_tune/ztrsm_tune.c b/src/ti/linalg/tuning/ztrsm_tune/ztrsm_tune.c
index ed6fc621635f3037ce5ba926cf823d906fa7717d..ac3d23562e7b5e9bde0b175f4bc892512195709c 100644 (file)
float operation_count = 2.0*(float)M*(float)N;
float total_GFLOPS_DSP = 0.0f;
float total_GFLOPS_ARM = 0.0f;
- int err_code = 0;
+ int num_errors = 0;
total_time_dsp = 0.0;
total_time_arm = 0.0;
/*-------------------------------------------------------------------------
* Verify Results
*------------------------------------------------------------------------*/
- err_code += check_results(Bdsp, Barm, M, N);
+ num_errors += check_results(Bdsp, Barm, M, N);
__free_ddr(A);
__free_ddr(Bdsp);
*time_dsp = total_time_dsp / (float)NUM_TEST_RUN;
*time_arm = total_time_arm / (float)NUM_TEST_RUN;
- return err_code;
+ return num_errors;
}