]> Gitweb @ Texas Instruments - Open Source Git Repositories - git.TI.com/gitweb - dense-linear-algebra-libraries/linalg.git/blobdiff - src/ti/linalg/blis/frame/1/scal2v/bli_scal2v_ref.c
Sync with external git. Should be the other way around.
[dense-linear-algebra-libraries/linalg.git] / src / ti / linalg / blis / frame / 1 / scal2v / bli_scal2v_ref.c
diff --git a/src/ti/linalg/blis/frame/1/scal2v/bli_scal2v_ref.c b/src/ti/linalg/blis/frame/1/scal2v/bli_scal2v_ref.c
new file mode 100644 (file)
index 0000000..d1cc876
--- /dev/null
@@ -0,0 +1,170 @@
+/*
+
+   BLIS    
+   An object-based framework for developing high-performance BLAS-like
+   libraries.
+
+   Copyright (C) 2014, The University of Texas at Austin
+
+   Redistribution and use in source and binary forms, with or without
+   modification, are permitted provided that the following conditions are
+   met:
+    - Redistributions of source code must retain the above copyright
+      notice, this list of conditions and the following disclaimer.
+    - Redistributions in binary form must reproduce the above copyright
+      notice, this list of conditions and the following disclaimer in the
+      documentation and/or other materials provided with the distribution.
+    - Neither the name of The University of Texas at Austin nor the names
+      of its contributors may be used to endorse or promote products
+      derived from this software without specific prior written permission.
+
+   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+   HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+*/
+
+#include "blis.h"
+
+/*
+#define FUNCPTR_T scal2v_fp
+
+typedef void (*FUNCPTR_T)(
+                           conj_t conjx,
+                           dim_t  n,
+                           void*  beta,
+                           void*  x, inc_t incx,
+                           void*  y, inc_t incy
+                         );
+
+// If some mixed datatype functions will not be compiled, we initialize
+// the corresponding elements of the function array to NULL.
+#ifdef BLIS_ENABLE_MIXED_PRECISION_SUPPORT
+static FUNCPTR_T GENARRAY3_ALL(ftypes,scal2v_ref);
+#else
+#ifdef BLIS_ENABLE_MIXED_DOMAIN_SUPPORT
+static FUNCPTR_T GENARRAY3_EXT(ftypes,scal2v_ref);
+#else
+static FUNCPTR_T GENARRAY3_MIN(ftypes,scal2v_ref);
+#endif
+#endif
+
+
+void bli_scal2v_ref( obj_t*  beta,
+                          obj_t*  x,
+                          obj_t*  y )
+{
+       num_t     dt_x      = bli_obj_datatype( *x );
+       num_t     dt_y      = bli_obj_datatype( *y );
+
+       conj_t    conjx     = bli_obj_conj_status( *x );
+       dim_t     n         = bli_obj_vector_dim( *x );
+
+       inc_t     inc_x     = bli_obj_vector_inc( *x );
+       void*     buf_x     = bli_obj_buffer_at_off( *x );
+
+       inc_t     inc_y     = bli_obj_vector_inc( *y );
+       void*     buf_y     = bli_obj_buffer_at_off( *y );
+
+       num_t     dt_beta;
+       void*     buf_beta;
+
+       FUNCPTR_T f;
+
+       // If beta is a scalar constant, use dt_x to extract the address of the
+       // corresponding constant value; otherwise, use the datatype encoded
+       // within the beta object and extract the buffer at the beta offset.
+       bli_set_scalar_dt_buffer( beta, dt_x, dt_beta, buf_beta );
+
+       // Index into the type combination array to extract the correct
+       // function pointer.
+       f = ftypes[dt_beta][dt_x][dt_y];
+
+       // Invoke the function.
+       f( conjx,
+          n,
+          buf_beta,
+          buf_x, inc_x,
+          buf_y, inc_y );
+}
+*/
+
+
+#undef  GENTFUNC3
+#define GENTFUNC3( ctype_b, ctype_x, ctype_y, chb, chx, chy, varname, setvker ) \
+\
+void PASTEMAC3(chb,chx,chy,varname) \
+     ( \
+       conj_t            conjx, \
+       dim_t             n, \
+       ctype_b* restrict beta, \
+       ctype_x* restrict x, inc_t incx, \
+       ctype_y* restrict y, inc_t incy  \
+     ) \
+{ \
+       ctype_b* beta_cast = beta; \
+       ctype_x* x_cast    = x; \
+       ctype_y* y_cast    = y; \
+       ctype_x* chi1; \
+       ctype_y* psi1; \
+       dim_t    i; \
+\
+       if ( bli_zero_dim1( n ) ) return; \
+\
+       /* If beta is zero, use setv. */ \
+       if ( PASTEMAC(chb,eq0)( *beta_cast ) ) \
+       { \
+               ctype_y* zero = PASTEMAC(chy,0); \
+\
+               PASTEMAC2(chy,chy,setvker)( n, \
+                                           zero, \
+                                           y, incy ); \
+               return; \
+       } \
+\
+       chi1 = x_cast; \
+       psi1 = y_cast; \
+\
+       if ( bli_is_conj( conjx ) ) \
+       { \
+               for ( i = 0; i < n; ++i ) \
+               { \
+                       PASTEMAC3(chb,chx,chy,scal2js)( *beta_cast, *chi1, *psi1 ); \
+\
+                       chi1 += incx; \
+                       psi1 += incy; \
+               } \
+       } \
+       else \
+       { \
+               for ( i = 0; i < n; ++i ) \
+               { \
+                       PASTEMAC3(chb,chx,chy,scal2s)( *beta_cast, *chi1, *psi1 ); \
+\
+                       chi1 += incx; \
+                       psi1 += incy; \
+               } \
+       } \
+}
+
+
+// Define the basic set of functions unconditionally, and then also some
+// mixed datatype functions if requested.
+INSERT_GENTFUNC3_BASIC( scal2v_ref, SETV_KERNEL )
+
+#ifdef BLIS_ENABLE_MIXED_DOMAIN_SUPPORT
+INSERT_GENTFUNC3_MIX_D( scal2v_ref, SETV_KERNEL )
+#endif
+
+#ifdef BLIS_ENABLE_MIXED_PRECISION_SUPPORT
+INSERT_GENTFUNC3_MIX_P( scal2v_ref, SETV_KERNEL )
+#endif
+