index 829ba41bc234c938da58fc12bfdca5749a58dcab..09f6f84ee794e367e8936ae1fa73100aa0131e29 100644 (file)
@@ -44,20 +44,19 @@ float cblas_sdsdot(const int N, const float alpha, const float *X, const int inc
if (!ti_cblas_init_done) ti_cblas_init();
TI_CBLAS_DEBUG_PRINT("Intercepted call to %s\n", "cblas_sdsdot");
- TI_CBLAS_PROFILE_START();
-
+ TI_CBLAS_PROFILE_START();
/* Dynamic conditional offload to ARM */
- if ((TI_CBLAS_L1_OFFLOAD == TI_CBLAS_OFFLOAD_NONE)) {
- TI_CBLAS_DEBUG_PRINT("Executing ARM %s\n", "cblas_sdsdot");
- float rval = __real_cblas_sdsdot(N,alpha,X,incX,Y,incY);
- TI_CBLAS_PROFILE_REPORT(" Entire %s call (ARM) took %8.2f us\n","cblas_sdsdot", (float) clock_diff);
- return rval;
- }
- /* End ARM offload */
+ if ((TI_CBLAS_L1_OFFLOAD == TI_CBLAS_OFFLOAD_NONE)) {
+ TI_CBLAS_DEBUG_PRINT("Executing ARM %s\n", "cblas_sdsdot");
+ float rval = __real_cblas_sdsdot(N,alpha,X,incX,Y,incY);
+ TI_CBLAS_PROFILE_REPORT(" Entire %s call (ARM) took %8.2f us\n","cblas_sdsdot", (float) clock_diff);
+ return rval;
+ }
+ /* End ARM offload */
/******************************************************************/
/* DSP offload WILL be done if control reaches here */
- TI_CBLAS_DEBUG_PRINT("Offloading to DSP %s\n", "cblas_sdsdot");
+ TI_CBLAS_DEBUG_PRINT("Offloading to DSP %s\n", "cblas_sdsdot");
/* Lookup kernel pointer from global table */
#ifdef __cplusplus
#endif
{
-
#ifdef __cplusplus
__K->setArg(0, N);
#else
@@ -154,6 +152,7 @@ float cblas_sdsdot(const int N, const float alpha, const float *X, const int inc
TI_CBLAS_OCL_CHKERROR("clReleaseEvent",err);
#endif
+
ti_cblas_delete_kernel(__K);
TI_CBLAS_DEBUG_PRINT("Finished executing %s\n", "cblas_sdsdot");