Gitweb @ Texas Instruments - Open Source Git Repositories - git.TI.com/gitweb - dense-linear-algebra-libraries/linalg.git/blobdiff - blasblisacc/src/ti_cblas_cblas_ctrmv.c
Added bli_mem_init() to level 3 facade functions. Use Perl script to generate wrapper...
[dense-linear-algebra-libraries/linalg.git] / blasblisacc / src / ti_cblas_cblas_ctrmv.c
index ee423018f4fcbe362257aab0f4a883c8e91b2e9e..0b33200b8e48b83dfbc2fe92ddcf2c25a48286df 100644 (file)
@@ -44,20 +44,19 @@ void cblas_ctrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
        if (!ti_cblas_init_done) ti_cblas_init();
        TI_CBLAS_DEBUG_PRINT("Intercepted call to %s\n", "cblas_ctrmv");
 
-        TI_CBLAS_PROFILE_START();
-
+    TI_CBLAS_PROFILE_START();
       /* Dynamic conditional offload to ARM */
-        if ((TI_CBLAS_L2_OFFLOAD == TI_CBLAS_OFFLOAD_NONE)) { 
-               TI_CBLAS_DEBUG_PRINT("Executing ARM %s\n", "cblas_ctrmv"); 
-               __real_cblas_ctrmv(order,Uplo,TransA,Diag,N,A,lda,X,incX); 
-               TI_CBLAS_PROFILE_REPORT("  Entire %s call (ARM) took %8.2f us\n","cblas_ctrmv", (float) clock_diff);
-               return ;
-        }
-        /* End ARM offload */
+    if ((TI_CBLAS_L2_OFFLOAD == TI_CBLAS_OFFLOAD_NONE)) { 
+       TI_CBLAS_DEBUG_PRINT("Executing ARM %s\n", "cblas_ctrmv"); 
+       __real_cblas_ctrmv(order,Uplo,TransA,Diag,N,A,lda,X,incX); 
+    TI_CBLAS_PROFILE_REPORT("  Entire %s call (ARM) took %8.2f us\n","cblas_ctrmv", (float) clock_diff);
+       return ;
+    }
+    /* End ARM offload */
 
        /******************************************************************/
        /* DSP offload WILL be done if control reaches here */
-               TI_CBLAS_DEBUG_PRINT("Offloading to DSP %s\n", "cblas_ctrmv"); 
+       TI_CBLAS_DEBUG_PRINT("Offloading to DSP %s\n", "cblas_ctrmv"); 
 
        /* Lookup kernel pointer from global table */
 #ifdef __cplusplus
@@ -74,7 +73,6 @@ void cblas_ctrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
 #endif
        {
 
-
 #ifdef __cplusplus
                __K->setArg(0, order);
 #else
@@ -159,7 +157,9 @@ void cblas_ctrmv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, const
                TI_CBLAS_OCL_CHKERROR("clReleaseEvent",err);
 
 #endif
+
                ti_cblas_delete_kernel(__K);
+
                TI_CBLAS_DEBUG_PRINT("Finished executing %s\n", "cblas_ctrmv");
                TI_CBLAS_PROFILE_REPORT("  Entire %s call (DSP) took %8.2f us\n","cblas_ctrmv", (float) clock_diff);
                return ;