1 files changed, 0 insertions, 633 deletions
diff --git a/libpixelflinger/include/private/pixelflinger/ggl_fixed.h b/libpixelflinger/include/private/pixelflinger/ggl_fixed.h
deleted file mode 100644
index 787f6202b..000000000
--- a/libpixelflinger/include/private/pixelflinger/ggl_fixed.h
+++ /dev/null
@@ -1,633 +0,0 @@
-/*
- * Copyright (C) 2005 The Android Open Source Project
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *      http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-#ifndef ANDROID_GGL_FIXED_H
-#define ANDROID_GGL_FIXED_H
-#include <math.h>
-#include <pixelflinger/pixelflinger.h>
-// ----------------------------------------------------------------------------
-#define CONST           __attribute__((const))
-#define ALWAYS_INLINE   __attribute__((always_inline))
-const GGLfixed FIXED_BITS = 16;
-const GGLfixed FIXED_EPSILON  = 1;
-const GGLfixed FIXED_ONE  = 1L<<FIXED_BITS;
-const GGLfixed FIXED_HALF = 1L<<(FIXED_BITS-1);
-const GGLfixed FIXED_MIN  = 0x80000000L;
-const GGLfixed FIXED_MAX  = 0x7FFFFFFFL;
-inline GGLfixed gglIntToFixed(GGLfixed i)       ALWAYS_INLINE ;
-inline GGLfixed gglFixedToIntRound(GGLfixed f)  ALWAYS_INLINE ;
-inline GGLfixed gglFixedToIntFloor(GGLfixed f)  ALWAYS_INLINE ;
-inline GGLfixed gglFixedToIntCeil(GGLfixed f)   ALWAYS_INLINE ;
-inline GGLfixed gglFracx(GGLfixed v)            ALWAYS_INLINE ;
-inline GGLfixed gglFloorx(GGLfixed v)           ALWAYS_INLINE ;
-inline GGLfixed gglCeilx(GGLfixed v)            ALWAYS_INLINE ;
-inline GGLfixed gglCenterx(GGLfixed v)          ALWAYS_INLINE ;
-inline GGLfixed gglRoundx(GGLfixed v)           ALWAYS_INLINE ;
-GGLfixed gglIntToFixed(GGLfixed i) {
-    return i<<FIXED_BITS;
-}
-GGLfixed gglFixedToIntRound(GGLfixed f) {
-    return (f + FIXED_HALF)>>FIXED_BITS;
-}
-GGLfixed gglFixedToIntFloor(GGLfixed f) {
-    return f>>FIXED_BITS;
-}
-GGLfixed gglFixedToIntCeil(GGLfixed f) {
-    return (f + ((1<<FIXED_BITS) - 1))>>FIXED_BITS;
-}
-GGLfixed gglFracx(GGLfixed v) {
-    return v & ((1<<FIXED_BITS)-1);
-}
-GGLfixed gglFloorx(GGLfixed v) {
-    return gglFixedToIntFloor(v)<<FIXED_BITS;
-}
-GGLfixed gglCeilx(GGLfixed v) {
-    return gglFixedToIntCeil(v)<<FIXED_BITS;
-}
-GGLfixed gglCenterx(GGLfixed v) {
-    return gglFloorx(v + FIXED_HALF) | FIXED_HALF;
-}
-GGLfixed gglRoundx(GGLfixed v) {
-    return gglFixedToIntRound(v)<<FIXED_BITS;
-}
-// conversion from (unsigned) int, short, byte to fixed...
-#define GGL_B_TO_X(_x)      GGLfixed( ((int32_t(_x)+1)>>1)<<10 )
-#define GGL_S_TO_X(_x)      GGLfixed( ((int32_t(_x)+1)>>1)<<2 )
-#define GGL_I_TO_X(_x)      GGLfixed( ((int32_t(_x)>>1)+1)>>14 )
-#define GGL_UB_TO_X(_x)     GGLfixed(   uint32_t(_x) +      \
-                                        (uint32_t(_x)<<8) + \
-                                        (uint32_t(_x)>>7) )
-#define GGL_US_TO_X(_x)     GGLfixed( (_x) + ((_x)>>15) )
-#define GGL_UI_TO_X(_x)     GGLfixed( (((_x)>>1)+1)>>15 )
-// ----------------------------------------------------------------------------
-GGLfixed gglPowx(GGLfixed x, GGLfixed y) CONST;
-GGLfixed gglSqrtx(GGLfixed a) CONST;
-GGLfixed gglSqrtRecipx(GGLfixed x) CONST;
-GGLfixed gglFastDivx(GGLfixed n, GGLfixed d) CONST;
-int32_t gglMulDivi(int32_t a, int32_t b, int32_t c);
-int32_t gglRecipQNormalized(int32_t x, int* exponent);
-int32_t gglRecipQ(GGLfixed x, int q) CONST;
-inline GGLfixed gglRecip(GGLfixed x) CONST;
-inline GGLfixed gglRecip(GGLfixed x) {
-    return gglRecipQ(x, 16);
-}
-inline GGLfixed gglRecip28(GGLfixed x) CONST;
-int32_t gglRecip28(GGLfixed x) {
-    return gglRecipQ(x, 28);
-}
-// ----------------------------------------------------------------------------
-#if defined(__arm__) && !defined(__thumb__)
-// inline ARM implementations
-inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift) CONST;
-inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift) {
-    GGLfixed result, t;
-    if (__builtin_constant_p(shift)) {
-    asm("smull  %[lo], %[hi], %[x], %[y]            \n"
-        "movs   %[lo], %[lo], lsr %[rshift]         \n"
-        "adc    %[lo], %[lo], %[hi], lsl %[lshift]  \n"
-        : [lo]"=r"(result), [hi]"=r"(t), [x]"=r"(x)
-        : "%[x]"(x), [y]"r"(y), [lshift] "I"(32-shift), [rshift] "I"(shift)
-        : "cc"
-        );
-    } else {
-    asm("smull  %[lo], %[hi], %[x], %[y]            \n"
-        "movs   %[lo], %[lo], lsr %[rshift]         \n"
-        "adc    %[lo], %[lo], %[hi], lsl %[lshift]  \n"
-        : [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
-        : "%[x]"(x), [y]"r"(y), [lshift] "r"(32-shift), [rshift] "r"(shift)
-        : "cc"
-        );
-    }
-    return result;
-}
-inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
-inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) {
-    GGLfixed result, t;
-    if (__builtin_constant_p(shift)) {
-    asm("smull  %[lo], %[hi], %[x], %[y]            \n"
-        "add    %[lo], %[a],  %[lo], lsr %[rshift]  \n"
-        "add    %[lo], %[lo], %[hi], lsl %[lshift]  \n"
-        : [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
-        : "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "I"(32-shift), [rshift] "I"(shift)
-        );
-    } else {
-    asm("smull  %[lo], %[hi], %[x], %[y]            \n"
-        "add    %[lo], %[a],  %[lo], lsr %[rshift]  \n"
-        "add    %[lo], %[lo], %[hi], lsl %[lshift]  \n"
-        : [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
-        : "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "r"(32-shift), [rshift] "r"(shift)
-        );
-    }
-    return result;
-}
-inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
-inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) {
-    GGLfixed result, t;
-    if (__builtin_constant_p(shift)) {
-    asm("smull  %[lo], %[hi], %[x], %[y]            \n"
-        "rsb    %[lo], %[a],  %[lo], lsr %[rshift]  \n"
-        "add    %[lo], %[lo], %[hi], lsl %[lshift]  \n"
-        : [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
-        : "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "I"(32-shift), [rshift] "I"(shift)
-        );
-    } else {
-    asm("smull  %[lo], %[hi], %[x], %[y]            \n"
-        "rsb    %[lo], %[a],  %[lo], lsr %[rshift]  \n"
-        "add    %[lo], %[lo], %[hi], lsl %[lshift]  \n"
-        : [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
-        : "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "r"(32-shift), [rshift] "r"(shift)
-        );
-    }
-    return result;
-}
-inline int64_t gglMulii(int32_t x, int32_t y) CONST;
-inline int64_t gglMulii(int32_t x, int32_t y)
-{
-    // 64-bits result: r0=low, r1=high
-    union {
-        struct {
-            int32_t lo;
-            int32_t hi;
-        } s;
-        int64_t res;
-    };
-    asm("smull %0, %1, %2, %3   \n"
-        : "=r"(s.lo), "=&r"(s.hi)
-        : "%r"(x), "r"(y)
-        :
-        );
-    return res;
-}
-#elif defined(__mips__) && __mips_isa_rev < 6
-/*inline MIPS implementations*/
-inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) CONST;
-inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) {
-    GGLfixed result,tmp,tmp1,tmp2;
-    if (__builtin_constant_p(shift)) {
-        if (shift == 0) {
-            asm ("mult %[a], %[b] \t\n"
-              "mflo  %[res]   \t\n"
-            : [res]"=&r"(result),[tmp]"=&r"(tmp)
-            : [a]"r"(a),[b]"r"(b)
-            : "%hi","%lo"
-            );
-        } else if (shift == 32)
-        {
-            asm ("mult %[a], %[b] \t\n"
-            "li  %[tmp],1\t\n"
-            "sll  %[tmp],%[tmp],0x1f\t\n"
-            "mflo %[res]   \t\n"
-            "addu %[tmp1],%[tmp],%[res] \t\n"
-            "sltu %[tmp1],%[tmp1],%[tmp]\t\n"   /*obit*/
-            "sra %[tmp],%[tmp],0x1f \t\n"
-            "mfhi  %[res]   \t\n"
-            "addu %[res],%[res],%[tmp]\t\n"
-            "addu %[res],%[res],%[tmp1]\t\n"
-            : [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1)
-            : [a]"r"(a),[b]"r"(b),[shift]"I"(shift)
-            : "%hi","%lo"
-            );
-        } else if ((shift >0) && (shift < 32))
-        {
-            asm ("mult %[a], %[b] \t\n"
-            "li  %[tmp],1 \t\n"
-            "sll  %[tmp],%[tmp],%[shiftm1] \t\n"
-            "mflo  %[res]   \t\n"
-            "addu %[tmp1],%[tmp],%[res] \t\n"
-            "sltu %[tmp1],%[tmp1],%[tmp] \t\n"  /*obit?*/
-            "addu  %[res],%[res],%[tmp] \t\n"
-            "mfhi  %[tmp]   \t\n"
-            "addu  %[tmp],%[tmp],%[tmp1] \t\n"
-            "sll   %[tmp],%[tmp],%[lshift] \t\n"
-            "srl   %[res],%[res],%[rshift]    \t\n"
-            "or    %[res],%[res],%[tmp] \t\n"
-            : [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
-            : [a]"r"(a),[b]"r"(b),[lshift]"I"(32-shift),[rshift]"I"(shift),[shiftm1]"I"(shift-1)
-            : "%hi","%lo"
-            );
-        } else {
-            asm ("mult %[a], %[b] \t\n"
-            "li  %[tmp],1 \t\n"
-            "sll  %[tmp],%[tmp],%[shiftm1] \t\n"
-            "mflo  %[res]   \t\n"
-            "addu %[tmp1],%[tmp],%[res] \t\n"
-            "sltu %[tmp1],%[tmp1],%[tmp] \t\n"  /*obit?*/
-            "sra  %[tmp2],%[tmp],0x1f \t\n"
-            "addu  %[res],%[res],%[tmp] \t\n"
-            "mfhi  %[tmp]   \t\n"
-            "addu  %[tmp],%[tmp],%[tmp2] \t\n"
-            "addu  %[tmp],%[tmp],%[tmp1] \t\n"            /*tmp=hi*/
-            "srl   %[tmp2],%[res],%[rshift]    \t\n"
-            "srav  %[res], %[tmp],%[rshift]\t\n"
-            "sll   %[tmp],%[tmp],1 \t\n"
-            "sll   %[tmp],%[tmp],%[norbits] \t\n"
-            "or    %[tmp],%[tmp],%[tmp2] \t\n"
-            "movz  %[res],%[tmp],%[bit5] \t\n"
-            : [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
-            : [a]"r"(a),[b]"r"(b),[norbits]"I"(~(shift)),[rshift]"I"(shift),[shiftm1] "I"(shift-1),[bit5]"I"(shift & 0x20)
-            : "%hi","%lo"
-            );
-        }
-    } else {
-        asm ("mult %[a], %[b] \t\n"
-        "li  %[tmp],1 \t\n"
-        "sll  %[tmp],%[tmp],%[shiftm1] \t\n"
-        "mflo  %[res]   \t\n"
-        "addu %[tmp1],%[tmp],%[res] \t\n"
-        "sltu %[tmp1],%[tmp1],%[tmp] \t\n"  /*obit?*/
-        "sra  %[tmp2],%[tmp],0x1f \t\n"
-        "addu  %[res],%[res],%[tmp] \t\n"
-        "mfhi  %[tmp]   \t\n"
-        "addu  %[tmp],%[tmp],%[tmp2] \t\n"
-        "addu  %[tmp],%[tmp],%[tmp1] \t\n"            /*tmp=hi*/
-        "srl   %[tmp2],%[res],%[rshift]    \t\n"
-        "srav  %[res], %[tmp],%[rshift]\t\n"
-        "sll   %[tmp],%[tmp],1 \t\n"
-        "sll   %[tmp],%[tmp],%[norbits] \t\n"
-        "or    %[tmp],%[tmp],%[tmp2] \t\n"
-        "movz  %[res],%[tmp],%[bit5] \t\n"
-         : [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
-         : [a]"r"(a),[b]"r"(b),[norbits]"r"(~(shift)),[rshift] "r"(shift),[shiftm1]"r"(shift-1),[bit5] "r"(shift & 0x20)
-         : "%hi","%lo"
-         );
-        }
-        return result;
-}
-inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
-inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
-    GGLfixed result,t,tmp1,tmp2;
-    if (__builtin_constant_p(shift)) {
-        if (shift == 0) {
-                 asm ("mult %[a], %[b] \t\n"
-                 "mflo  %[lo]   \t\n"
-                 "addu  %[lo],%[lo],%[c]    \t\n"
-                 : [lo]"=&r"(result)
-                 : [a]"r"(a),[b]"r"(b),[c]"r"(c)
-                 : "%hi","%lo"
-                 );
-                } else if (shift == 32) {
-                    asm ("mult %[a], %[b] \t\n"
-                    "mfhi  %[lo]   \t\n"
-                    "addu  %[lo],%[lo],%[c]    \t\n"
-                    : [lo]"=&r"(result)
-                    : [a]"r"(a),[b]"r"(b),[c]"r"(c)
-                    : "%hi","%lo"
-                    );
-                } else if ((shift>0) && (shift<32)) {
-                    asm ("mult %[a], %[b] \t\n"
-                    "mflo  %[res]   \t\n"
-                    "mfhi  %[t]   \t\n"
-                    "srl   %[res],%[res],%[rshift]    \t\n"
-                    "sll   %[t],%[t],%[lshift]     \t\n"
-                    "or  %[res],%[res],%[t]    \t\n"
-                    "addu  %[res],%[res],%[c]    \t\n"
-                    : [res]"=&r"(result),[t]"=&r"(t)
-                    : [a]"r"(a),[b]"r"(b),[c]"r"(c),[lshift]"I"(32-shift),[rshift]"I"(shift)
-                    : "%hi","%lo"
-                    );
-                } else {
-                    asm ("mult %[a], %[b] \t\n"
-                    "nor %[tmp1],$zero,%[shift]\t\n"
-                    "mflo  %[res]   \t\n"
-                    "mfhi  %[t]   \t\n"
-                    "srl   %[res],%[res],%[shift]    \t\n"
-                    "sll   %[tmp2],%[t],1     \t\n"
-                    "sllv  %[tmp2],%[tmp2],%[tmp1]     \t\n"
-                    "or  %[tmp1],%[tmp2],%[res]    \t\n"
-                    "srav  %[res],%[t],%[shift]     \t\n"
-                    "andi %[tmp2],%[shift],0x20\t\n"
-                    "movz %[res],%[tmp1],%[tmp2]\t\n"
-                    "addu  %[res],%[res],%[c]    \t\n"
-                    : [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
-                    : [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"I"(shift)
-                    : "%hi","%lo"
-                    );
-                }
-            } else {
-                asm ("mult %[a], %[b] \t\n"
-                "nor %[tmp1],$zero,%[shift]\t\n"
-                "mflo  %[res]   \t\n"
-                "mfhi  %[t]   \t\n"
-                "srl   %[res],%[res],%[shift]    \t\n"
-                "sll   %[tmp2],%[t],1     \t\n"
-                "sllv  %[tmp2],%[tmp2],%[tmp1]     \t\n"
-                "or  %[tmp1],%[tmp2],%[res]    \t\n"
-                "srav  %[res],%[t],%[shift]     \t\n"
-                "andi %[tmp2],%[shift],0x20\t\n"
-                "movz %[res],%[tmp1],%[tmp2]\t\n"
-                "addu  %[res],%[res],%[c]    \t\n"
-                : [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
-                : [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"r"(shift)
-                : "%hi","%lo"
-                );
-            }
-            return result;
-}
-inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
-inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
-    GGLfixed result,t,tmp1,tmp2;
-    if (__builtin_constant_p(shift)) {
-        if (shift == 0) {
-                 asm ("mult %[a], %[b] \t\n"
-                 "mflo  %[lo]   \t\n"
-                 "subu  %[lo],%[lo],%[c]    \t\n"
-                 : [lo]"=&r"(result)
-                 : [a]"r"(a),[b]"r"(b),[c]"r"(c)
-                 : "%hi","%lo"
-                 );
-                } else if (shift == 32) {
-                    asm ("mult %[a], %[b] \t\n"
-                    "mfhi  %[lo]   \t\n"
-                    "subu  %[lo],%[lo],%[c]    \t\n"
-                    : [lo]"=&r"(result)
-                    : [a]"r"(a),[b]"r"(b),[c]"r"(c)
-                    : "%hi","%lo"
-                    );
-                } else if ((shift>0) && (shift<32)) {
-                    asm ("mult %[a], %[b] \t\n"
-                    "mflo  %[res]   \t\n"
-                    "mfhi  %[t]   \t\n"
-                    "srl   %[res],%[res],%[rshift]    \t\n"
-                    "sll   %[t],%[t],%[lshift]     \t\n"
-                    "or  %[res],%[res],%[t]    \t\n"
-                    "subu  %[res],%[res],%[c]    \t\n"
-                    : [res]"=&r"(result),[t]"=&r"(t)
-                    : [a]"r"(a),[b]"r"(b),[c]"r"(c),[lshift]"I"(32-shift),[rshift]"I"(shift)
-                    : "%hi","%lo"
-                    );
-                } else {
-                    asm ("mult %[a], %[b] \t\n"
-                    "nor %[tmp1],$zero,%[shift]\t\n"
-                     "mflo  %[res]   \t\n"
-                     "mfhi  %[t]   \t\n"
-                     "srl   %[res],%[res],%[shift]    \t\n"
-                     "sll   %[tmp2],%[t],1     \t\n"
-                     "sllv  %[tmp2],%[tmp2],%[tmp1]     \t\n"
-                     "or  %[tmp1],%[tmp2],%[res]    \t\n"
-                     "srav  %[res],%[t],%[shift]     \t\n"
-                     "andi %[tmp2],%[shift],0x20\t\n"
-                     "movz %[res],%[tmp1],%[tmp2]\t\n"
-                     "subu  %[res],%[res],%[c]    \t\n"
-                     : [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
-                     : [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"I"(shift)
-                     : "%hi","%lo"
-                     );
-                    }
-                } else {
-                asm ("mult %[a], %[b] \t\n"
-                "nor %[tmp1],$zero,%[shift]\t\n"
-                "mflo  %[res]   \t\n"
-                "mfhi  %[t]   \t\n"
-                "srl   %[res],%[res],%[shift]    \t\n"
-                "sll   %[tmp2],%[t],1     \t\n"
-                "sllv  %[tmp2],%[tmp2],%[tmp1]     \t\n"
-                "or  %[tmp1],%[tmp2],%[res]    \t\n"
-                "srav  %[res],%[t],%[shift]     \t\n"
-                "andi %[tmp2],%[shift],0x20\t\n"
-                "movz %[res],%[tmp1],%[tmp2]\t\n"
-                "subu  %[res],%[res],%[c]    \t\n"
-                : [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
-                : [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"r"(shift)
-                : "%hi","%lo"
-                );
-            }
-    return result;
-}
-inline int64_t gglMulii(int32_t x, int32_t y) CONST;
-inline int64_t gglMulii(int32_t x, int32_t y) {
-    union {
-        struct {
-#if defined(__MIPSEL__)
-            int32_t lo;
-            int32_t hi;
-#elif defined(__MIPSEB__)
-            int32_t hi;
-            int32_t lo;
-#endif
-        } s;
-        int64_t res;
-    }u;
-    asm("mult %2, %3 \t\n"
-        "mfhi %1   \t\n"
-        "mflo %0   \t\n"
-        : "=r"(u.s.lo), "=&r"(u.s.hi)
-        : "%r"(x), "r"(y)
-        : "%hi","%lo"
-        );
-    return u.res;
-}
-#elif defined(__aarch64__)
-// inline AArch64 implementations
-inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift) CONST;
-inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift)
-{
-    GGLfixed result;
-    GGLfixed round;
-    asm("mov    %x[round], #1                        \n"
-        "lsl    %x[round], %x[round], %x[shift]      \n"
-        "lsr    %x[round], %x[round], #1             \n"
-        "smaddl %x[result], %w[x], %w[y],%x[round]   \n"
-        "lsr    %x[result], %x[result], %x[shift]    \n"
-        : [round]"=&r"(round), [result]"=&r"(result) \
-        : [x]"r"(x), [y]"r"(y), [shift] "r"(shift)   \
-        :
-       );
-    return result;
-}
-inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
-inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift)
-{
-    GGLfixed result;
-    asm("smull  %x[result], %w[x], %w[y]                     \n"
-        "lsr    %x[result], %x[result], %x[shift]            \n"
-        "add    %w[result], %w[result], %w[a]                \n"
-        : [result]"=&r"(result)                               \
-        : [x]"r"(x), [y]"r"(y), [a]"r"(a), [shift] "r"(shift) \
-        :
-        );
-    return result;
-}
-inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
-inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift)
-{
-    GGLfixed result;
-    int rshift;
-    asm("smull  %x[result], %w[x], %w[y]                     \n"
-        "lsr    %x[result], %x[result], %x[shift]            \n"
-        "sub    %w[result], %w[result], %w[a]                \n"
-        : [result]"=&r"(result)                               \
-        : [x]"r"(x), [y]"r"(y), [a]"r"(a), [shift] "r"(shift) \
-        :
-        );
-    return result;
-}
-inline int64_t gglMulii(int32_t x, int32_t y) CONST;
-inline int64_t gglMulii(int32_t x, int32_t y)
-{
-    int64_t res;
-    asm("smull  %x0, %w1, %w2 \n"
-        : "=r"(res)
-        : "%r"(x), "r"(y)
-        :
-        );
-    return res;
-}
-#else // ----------------------------------------------------------------------
-inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) CONST;
-inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) {
-    return GGLfixed((int64_t(a)*b + (1<<(shift-1)))>>shift);
-}
-inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
-inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
-    return GGLfixed((int64_t(a)*b)>>shift) + c;
-}
-inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
-inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
-    return GGLfixed((int64_t(a)*b)>>shift) - c;
-}
-inline int64_t gglMulii(int32_t a, int32_t b) CONST;
-inline int64_t gglMulii(int32_t a, int32_t b) {
-    return int64_t(a)*b;
-}
-#endif
-// ------------------------------------------------------------------------
-inline GGLfixed gglMulx(GGLfixed a, GGLfixed b) CONST;
-inline GGLfixed gglMulx(GGLfixed a, GGLfixed b) {
-    return gglMulx(a, b, 16);
-}
-inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c) CONST;
-inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c) {
-    return gglMulAddx(a, b, c, 16);
-}
-inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c) CONST;
-inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c) {
-    return gglMulSubx(a, b, c, 16);
-}
-// ------------------------------------------------------------------------
-inline int32_t gglClz(int32_t x) CONST;
-inline int32_t gglClz(int32_t x)
-{
-#if (defined(__arm__) && !defined(__thumb__)) || defined(__mips__) || defined(__aarch64__)
-    return __builtin_clz(x);
-#else
-    if (!x) return 32;
-    int32_t exp = 31;
-    if (x & 0xFFFF0000) { exp -=16; x >>= 16; }
-    if (x & 0x0000ff00) { exp -= 8; x >>= 8; }
-    if (x & 0x000000f0) { exp -= 4; x >>= 4; }
-    if (x & 0x0000000c) { exp -= 2; x >>= 2; }
-    if (x & 0x00000002) { exp -= 1; }
-    return exp;
-#endif
-}
-// ------------------------------------------------------------------------
-int32_t gglDivQ(GGLfixed n, GGLfixed d, int32_t i) CONST;
-inline int32_t gglDivQ16(GGLfixed n, GGLfixed d) CONST;
-inline int32_t gglDivQ16(GGLfixed n, GGLfixed d) {
-    return gglDivQ(n, d, 16);
-}
-inline int32_t gglDivx(GGLfixed n, GGLfixed d) CONST;
-inline int32_t gglDivx(GGLfixed n, GGLfixed d) {
-    return gglDivQ(n, d, 16);
-}
-// ------------------------------------------------------------------------
-inline GGLfixed gglRecipFast(GGLfixed x) CONST;
-inline GGLfixed gglRecipFast(GGLfixed x)
-{
-    // This is a really bad approximation of 1/x, but it's also
-    // very fast. x must be strictly positive.
-    // if x between [0.5, 1[ , then 1/x = 3-2*x
-    // (we use 2.30 fixed-point)
-    const int32_t lz = gglClz(x);
-    return (0xC0000000 - (x << (lz - 1))) >> (30-lz);
-}
-// ------------------------------------------------------------------------
-inline GGLfixed gglClampx(GGLfixed c) CONST;
-inline GGLfixed gglClampx(GGLfixed c)
-{
-#if defined(__thumb__)
-    // clamp without branches
-    c &= ~(c>>31);  c = FIXED_ONE - c;
-    c &= ~(c>>31);  c = FIXED_ONE - c;
-#else
-#if defined(__arm__)
-    // I don't know why gcc thinks its smarter than me! The code below
-    // clamps to zero in one instruction, but gcc won't generate it and
-    // replace it by a cmp + movlt (it's quite amazing actually).
-    asm("bic %0, %1, %1, asr #31\n" : "=r"(c) : "r"(c));
-#elif defined(__aarch64__)
-    asm("bic %w0, %w1, %w1, asr #31\n" : "=r"(c) : "r"(c));
-#else
-    c &= ~(c>>31);
-#endif
-    if (c>FIXED_ONE)
-        c = FIXED_ONE;
-#endif
-    return c;
-}
-// ------------------------------------------------------------------------
-#endif // ANDROID_GGL_FIXED_H

diff --git a/libpixelflinger/include/private/pixelflinger/ggl_fixed.h b/libpixelflinger/include/private/pixelflinger/ggl_fixed.h deleted file mode 100644 index 787f6202b..000000000 --- a/libpixelflinger/include/private/pixelflinger/ggl_fixed.h +++ /dev/null
@@ -1,633 +0,0 @@
1	/*
2	* Copyright (C) 2005 The Android Open Source Project
3	*
4	* Licensed under the Apache License, Version 2.0 (the "License");
5	* you may not use this file except in compliance with the License.
6	* You may obtain a copy of the License at
7	*
8	* http://www.apache.org/licenses/LICENSE-2.0
9	*
10	* Unless required by applicable law or agreed to in writing, software
11	* distributed under the License is distributed on an "AS IS" BASIS,
12	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13	* See the License for the specific language governing permissions and
14	* limitations under the License.
15	*/
16
17	#ifndef ANDROID_GGL_FIXED_H
18	#define ANDROID_GGL_FIXED_H
19
20	#include <math.h>
21	#include <pixelflinger/pixelflinger.h>
22
23	// ----------------------------------------------------------------------------
24
25	#define CONST __attribute__((const))
26	#define ALWAYS_INLINE __attribute__((always_inline))
27
28	const GGLfixed FIXED_BITS = 16;
29	const GGLfixed FIXED_EPSILON = 1;
30	const GGLfixed FIXED_ONE = 1L<<FIXED_BITS;
31	const GGLfixed FIXED_HALF = 1L<<(FIXED_BITS-1);
32	const GGLfixed FIXED_MIN = 0x80000000L;
33	const GGLfixed FIXED_MAX = 0x7FFFFFFFL;
34
35	inline GGLfixed gglIntToFixed(GGLfixed i) ALWAYS_INLINE ;
36	inline GGLfixed gglFixedToIntRound(GGLfixed f) ALWAYS_INLINE ;
37	inline GGLfixed gglFixedToIntFloor(GGLfixed f) ALWAYS_INLINE ;
38	inline GGLfixed gglFixedToIntCeil(GGLfixed f) ALWAYS_INLINE ;
39	inline GGLfixed gglFracx(GGLfixed v) ALWAYS_INLINE ;
40	inline GGLfixed gglFloorx(GGLfixed v) ALWAYS_INLINE ;
41	inline GGLfixed gglCeilx(GGLfixed v) ALWAYS_INLINE ;
42	inline GGLfixed gglCenterx(GGLfixed v) ALWAYS_INLINE ;
43	inline GGLfixed gglRoundx(GGLfixed v) ALWAYS_INLINE ;
44
45	GGLfixed gglIntToFixed(GGLfixed i) {
46	return i<<FIXED_BITS;
47	}
48	GGLfixed gglFixedToIntRound(GGLfixed f) {
49	return (f + FIXED_HALF)>>FIXED_BITS;
50	}
51	GGLfixed gglFixedToIntFloor(GGLfixed f) {
52	return f>>FIXED_BITS;
53	}
54	GGLfixed gglFixedToIntCeil(GGLfixed f) {
55	return (f + ((1<<FIXED_BITS) - 1))>>FIXED_BITS;
56	}
57
58	GGLfixed gglFracx(GGLfixed v) {
59	return v & ((1<<FIXED_BITS)-1);
60	}
61	GGLfixed gglFloorx(GGLfixed v) {
62	return gglFixedToIntFloor(v)<<FIXED_BITS;
63	}
64	GGLfixed gglCeilx(GGLfixed v) {
65	return gglFixedToIntCeil(v)<<FIXED_BITS;
66	}
67	GGLfixed gglCenterx(GGLfixed v) {
68	return gglFloorx(v + FIXED_HALF) | FIXED_HALF;
69	}
70	GGLfixed gglRoundx(GGLfixed v) {
71	return gglFixedToIntRound(v)<<FIXED_BITS;
72	}
73
74	// conversion from (unsigned) int, short, byte to fixed...
75	#define GGL_B_TO_X(_x) GGLfixed( ((int32_t(_x)+1)>>1)<<10 )
76	#define GGL_S_TO_X(_x) GGLfixed( ((int32_t(_x)+1)>>1)<<2 )
77	#define GGL_I_TO_X(_x) GGLfixed( ((int32_t(_x)>>1)+1)>>14 )
78	#define GGL_UB_TO_X(_x) GGLfixed( uint32_t(_x) + \
79	(uint32_t(_x)<<8) + \
80	(uint32_t(_x)>>7) )
81	#define GGL_US_TO_X(_x) GGLfixed( (_x) + ((_x)>>15) )
82	#define GGL_UI_TO_X(_x) GGLfixed( (((_x)>>1)+1)>>15 )
83
84	// ----------------------------------------------------------------------------
85
86	GGLfixed gglPowx(GGLfixed x, GGLfixed y) CONST;
87	GGLfixed gglSqrtx(GGLfixed a) CONST;
88	GGLfixed gglSqrtRecipx(GGLfixed x) CONST;
89	GGLfixed gglFastDivx(GGLfixed n, GGLfixed d) CONST;
90	int32_t gglMulDivi(int32_t a, int32_t b, int32_t c);
91
92	int32_t gglRecipQNormalized(int32_t x, int* exponent);
93	int32_t gglRecipQ(GGLfixed x, int q) CONST;
94
95	inline GGLfixed gglRecip(GGLfixed x) CONST;
96	inline GGLfixed gglRecip(GGLfixed x) {
97	return gglRecipQ(x, 16);
98	}
99
100	inline GGLfixed gglRecip28(GGLfixed x) CONST;
101	int32_t gglRecip28(GGLfixed x) {
102	return gglRecipQ(x, 28);
103	}
104
105	// ----------------------------------------------------------------------------
106
107	#if defined(__arm__) && !defined(__thumb__)
108
109	// inline ARM implementations
110	inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift) CONST;
111	inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift) {
112	GGLfixed result, t;
113	if (__builtin_constant_p(shift)) {
114	asm("smull %[lo], %[hi], %[x], %[y] \n"
115	"movs %[lo], %[lo], lsr %[rshift] \n"
116	"adc %[lo], %[lo], %[hi], lsl %[lshift] \n"
117	: [lo]"=r"(result), [hi]"=r"(t), [x]"=r"(x)
118	: "%[x]"(x), [y]"r"(y), [lshift] "I"(32-shift), [rshift] "I"(shift)
119	: "cc"
120	);
121	} else {
122	asm("smull %[lo], %[hi], %[x], %[y] \n"
123	"movs %[lo], %[lo], lsr %[rshift] \n"
124	"adc %[lo], %[lo], %[hi], lsl %[lshift] \n"
125	: [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
126	: "%[x]"(x), [y]"r"(y), [lshift] "r"(32-shift), [rshift] "r"(shift)
127	: "cc"
128	);
129	}
130	return result;
131	}
132
133	inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
134	inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) {
135	GGLfixed result, t;
136	if (__builtin_constant_p(shift)) {
137	asm("smull %[lo], %[hi], %[x], %[y] \n"
138	"add %[lo], %[a], %[lo], lsr %[rshift] \n"
139	"add %[lo], %[lo], %[hi], lsl %[lshift] \n"
140	: [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
141	: "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "I"(32-shift), [rshift] "I"(shift)
142	);
143	} else {
144	asm("smull %[lo], %[hi], %[x], %[y] \n"
145	"add %[lo], %[a], %[lo], lsr %[rshift] \n"
146	"add %[lo], %[lo], %[hi], lsl %[lshift] \n"
147	: [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
148	: "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "r"(32-shift), [rshift] "r"(shift)
149	);
150	}
151	return result;
152	}
153
154	inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
155	inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) {
156	GGLfixed result, t;
157	if (__builtin_constant_p(shift)) {
158	asm("smull %[lo], %[hi], %[x], %[y] \n"
159	"rsb %[lo], %[a], %[lo], lsr %[rshift] \n"
160	"add %[lo], %[lo], %[hi], lsl %[lshift] \n"
161	: [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
162	: "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "I"(32-shift), [rshift] "I"(shift)
163	);
164	} else {
165	asm("smull %[lo], %[hi], %[x], %[y] \n"
166	"rsb %[lo], %[a], %[lo], lsr %[rshift] \n"
167	"add %[lo], %[lo], %[hi], lsl %[lshift] \n"
168	: [lo]"=&r"(result), [hi]"=&r"(t), [x]"=&r"(x)
169	: "%[x]"(x), [y]"r"(y), [a]"r"(a), [lshift] "r"(32-shift), [rshift] "r"(shift)
170	);
171	}
172	return result;
173	}
174
175	inline int64_t gglMulii(int32_t x, int32_t y) CONST;
176	inline int64_t gglMulii(int32_t x, int32_t y)
177	{
178	// 64-bits result: r0=low, r1=high
179	union {
180	struct {
181	int32_t lo;
182	int32_t hi;
183	} s;
184	int64_t res;
185	};
186	asm("smull %0, %1, %2, %3 \n"
187	: "=r"(s.lo), "=&r"(s.hi)
188	: "%r"(x), "r"(y)
189	:
190	);
191	return res;
192	}
193	#elif defined(__mips__) && __mips_isa_rev < 6
194
195	/*inline MIPS implementations*/
196	inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) CONST;
197	inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) {
198	GGLfixed result,tmp,tmp1,tmp2;
199
200	if (__builtin_constant_p(shift)) {
201	if (shift == 0) {
202	asm ("mult %[a], %[b] \t\n"
203	"mflo %[res] \t\n"
204	: [res]"=&r"(result),[tmp]"=&r"(tmp)
205	: [a]"r"(a),[b]"r"(b)
206	: "%hi","%lo"
207	);
208	} else if (shift == 32)
209	{
210	asm ("mult %[a], %[b] \t\n"
211	"li %[tmp],1\t\n"
212	"sll %[tmp],%[tmp],0x1f\t\n"
213	"mflo %[res] \t\n"
214	"addu %[tmp1],%[tmp],%[res] \t\n"
215	"sltu %[tmp1],%[tmp1],%[tmp]\t\n" /obit/
216	"sra %[tmp],%[tmp],0x1f \t\n"
217	"mfhi %[res] \t\n"
218	"addu %[res],%[res],%[tmp]\t\n"
219	"addu %[res],%[res],%[tmp1]\t\n"
220	: [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1)
221	: [a]"r"(a),[b]"r"(b),[shift]"I"(shift)
222	: "%hi","%lo"
223	);
224	} else if ((shift >0) && (shift < 32))
225	{
226	asm ("mult %[a], %[b] \t\n"
227	"li %[tmp],1 \t\n"
228	"sll %[tmp],%[tmp],%[shiftm1] \t\n"
229	"mflo %[res] \t\n"
230	"addu %[tmp1],%[tmp],%[res] \t\n"
231	"sltu %[tmp1],%[tmp1],%[tmp] \t\n" /obit?/
232	"addu %[res],%[res],%[tmp] \t\n"
233	"mfhi %[tmp] \t\n"
234	"addu %[tmp],%[tmp],%[tmp1] \t\n"
235	"sll %[tmp],%[tmp],%[lshift] \t\n"
236	"srl %[res],%[res],%[rshift] \t\n"
237	"or %[res],%[res],%[tmp] \t\n"
238	: [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
239	: [a]"r"(a),[b]"r"(b),[lshift]"I"(32-shift),[rshift]"I"(shift),[shiftm1]"I"(shift-1)
240	: "%hi","%lo"
241	);
242	} else {
243	asm ("mult %[a], %[b] \t\n"
244	"li %[tmp],1 \t\n"
245	"sll %[tmp],%[tmp],%[shiftm1] \t\n"
246	"mflo %[res] \t\n"
247	"addu %[tmp1],%[tmp],%[res] \t\n"
248	"sltu %[tmp1],%[tmp1],%[tmp] \t\n" /obit?/
249	"sra %[tmp2],%[tmp],0x1f \t\n"
250	"addu %[res],%[res],%[tmp] \t\n"
251	"mfhi %[tmp] \t\n"
252	"addu %[tmp],%[tmp],%[tmp2] \t\n"
253	"addu %[tmp],%[tmp],%[tmp1] \t\n" /tmp=hi/
254	"srl %[tmp2],%[res],%[rshift] \t\n"
255	"srav %[res], %[tmp],%[rshift]\t\n"
256	"sll %[tmp],%[tmp],1 \t\n"
257	"sll %[tmp],%[tmp],%[norbits] \t\n"
258	"or %[tmp],%[tmp],%[tmp2] \t\n"
259	"movz %[res],%[tmp],%[bit5] \t\n"
260	: [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
261	: [a]"r"(a),[b]"r"(b),[norbits]"I"(~(shift)),[rshift]"I"(shift),[shiftm1] "I"(shift-1),[bit5]"I"(shift & 0x20)
262	: "%hi","%lo"
263	);
264	}
265	} else {
266	asm ("mult %[a], %[b] \t\n"
267	"li %[tmp],1 \t\n"
268	"sll %[tmp],%[tmp],%[shiftm1] \t\n"
269	"mflo %[res] \t\n"
270	"addu %[tmp1],%[tmp],%[res] \t\n"
271	"sltu %[tmp1],%[tmp1],%[tmp] \t\n" /obit?/
272	"sra %[tmp2],%[tmp],0x1f \t\n"
273	"addu %[res],%[res],%[tmp] \t\n"
274	"mfhi %[tmp] \t\n"
275	"addu %[tmp],%[tmp],%[tmp2] \t\n"
276	"addu %[tmp],%[tmp],%[tmp1] \t\n" /tmp=hi/
277	"srl %[tmp2],%[res],%[rshift] \t\n"
278	"srav %[res], %[tmp],%[rshift]\t\n"
279	"sll %[tmp],%[tmp],1 \t\n"
280	"sll %[tmp],%[tmp],%[norbits] \t\n"
281	"or %[tmp],%[tmp],%[tmp2] \t\n"
282	"movz %[res],%[tmp],%[bit5] \t\n"
283	: [res]"=&r"(result),[tmp]"=&r"(tmp),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
284	: [a]"r"(a),[b]"r"(b),[norbits]"r"(~(shift)),[rshift] "r"(shift),[shiftm1]"r"(shift-1),[bit5] "r"(shift & 0x20)
285	: "%hi","%lo"
286	);
287	}
288
289	return result;
290	}
291
/*
 * gglMulAddx (MIPS, pre-R6): multiply-add on fixed-point operands.
 *
 * Forms the 64-bit signed product a*b in HI:LO with `mult`, extracts the
 * 32-bit window of the product that starts at bit `shift`, and adds `c`.
 * No rounding term is added.
 *
 * A compile-time-constant shift selects a specialised sequence (0, 32, or
 * 0 < shift < 32, with the shift amounts given as "I" immediates); a
 * run-time shift uses the generic sequence with register operands.
 *
 * Every asm statement clobbers HI and LO.
 */
inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
GGLfixed result,t,tmp1,tmp2;

if (__builtin_constant_p(shift)) {
if (shift == 0) {
// shift == 0: low word of the product plus c.
asm ("mult %[a], %[b] \t\n"
"mflo %[lo] \t\n"
"addu %[lo],%[lo],%[c] \t\n"
: [lo]"=&r"(result)
: [a]"r"(a),[b]"r"(b),[c]"r"(c)
: "%hi","%lo"
);
} else if (shift == 32) {
// shift == 32: high word of the product plus c.
asm ("mult %[a], %[b] \t\n"
"mfhi %[lo] \t\n"
"addu %[lo],%[lo],%[c] \t\n"
: [lo]"=&r"(result)
: [a]"r"(a),[b]"r"(b),[c]"r"(c)
: "%hi","%lo"
);
} else if ((shift>0) && (shift<32)) {
// (LO >> shift) | (HI << (32 - shift)), then add c.
asm ("mult %[a], %[b] \t\n"
"mflo %[res] \t\n"
"mfhi %[t] \t\n"
"srl %[res],%[res],%[rshift] \t\n"
"sll %[t],%[t],%[lshift] \t\n"
"or %[res],%[res],%[t] \t\n"
"addu %[res],%[res],%[c] \t\n"
: [res]"=&r"(result),[t]"=&r"(t)
: [a]"r"(a),[b]"r"(b),[c]"r"(c),[lshift]"I"(32-shift),[rshift]"I"(shift)
: "%hi","%lo"
);
} else {
// Constant shift outside [0, 32]: same instruction sequence as the
// run-time path below, with `shift` given as an immediate.
asm ("mult %[a], %[b] \t\n"
"nor %[tmp1],$zero,%[shift]\t\n"
"mflo %[res] \t\n"
"mfhi %[t] \t\n"
"srl %[res],%[res],%[shift] \t\n"
"sll %[tmp2],%[t],1 \t\n"
"sllv %[tmp2],%[tmp2],%[tmp1] \t\n"
"or %[tmp1],%[tmp2],%[res] \t\n"
"srav %[res],%[t],%[shift] \t\n"
"andi %[tmp2],%[shift],0x20\t\n"
"movz %[res],%[tmp1],%[tmp2]\t\n"
"addu %[res],%[res],%[c] \t\n"
: [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
: [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"I"(shift)
: "%hi","%lo"
);
}
} else {
// Run-time shift. Two candidates are built:
//   tmp1 = (LO >> shift) | (HI << 1 << ~shift)
//   res  = HI >> shift   (arithmetic, srav)
// movz replaces res with tmp1 when bit 5 of shift (shift & 0x20) is
// clear; otherwise the arithmetic shift of HI is kept. c is added last.
asm ("mult %[a], %[b] \t\n"
"nor %[tmp1],$zero,%[shift]\t\n"
"mflo %[res] \t\n"
"mfhi %[t] \t\n"
"srl %[res],%[res],%[shift] \t\n"
"sll %[tmp2],%[t],1 \t\n"
"sllv %[tmp2],%[tmp2],%[tmp1] \t\n"
"or %[tmp1],%[tmp2],%[res] \t\n"
"srav %[res],%[t],%[shift] \t\n"
"andi %[tmp2],%[shift],0x20\t\n"
"movz %[res],%[tmp1],%[tmp2]\t\n"
"addu %[res],%[res],%[c] \t\n"
: [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
: [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"r"(shift)
: "%hi","%lo"
);
}
return result;
}
363
/*
 * gglMulSubx (MIPS, pre-R6): multiply-subtract on fixed-point operands.
 *
 * Forms the 64-bit signed product a*b in HI:LO with `mult`, extracts the
 * 32-bit window of the product that starts at bit `shift`, and subtracts
 * `c` from it. No rounding term is added.
 *
 * A compile-time-constant shift selects a specialised sequence (0, 32, or
 * 0 < shift < 32, with the shift amounts given as "I" immediates); a
 * run-time shift uses the generic sequence with register operands.
 *
 * Every asm statement clobbers HI and LO.
 */
inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
GGLfixed result,t,tmp1,tmp2;

if (__builtin_constant_p(shift)) {
if (shift == 0) {
// shift == 0: low word of the product minus c.
asm ("mult %[a], %[b] \t\n"
"mflo %[lo] \t\n"
"subu %[lo],%[lo],%[c] \t\n"
: [lo]"=&r"(result)
: [a]"r"(a),[b]"r"(b),[c]"r"(c)
: "%hi","%lo"
);
} else if (shift == 32) {
// shift == 32: high word of the product minus c.
asm ("mult %[a], %[b] \t\n"
"mfhi %[lo] \t\n"
"subu %[lo],%[lo],%[c] \t\n"
: [lo]"=&r"(result)
: [a]"r"(a),[b]"r"(b),[c]"r"(c)
: "%hi","%lo"
);
} else if ((shift>0) && (shift<32)) {
// (LO >> shift) | (HI << (32 - shift)), then subtract c.
asm ("mult %[a], %[b] \t\n"
"mflo %[res] \t\n"
"mfhi %[t] \t\n"
"srl %[res],%[res],%[rshift] \t\n"
"sll %[t],%[t],%[lshift] \t\n"
"or %[res],%[res],%[t] \t\n"
"subu %[res],%[res],%[c] \t\n"
: [res]"=&r"(result),[t]"=&r"(t)
: [a]"r"(a),[b]"r"(b),[c]"r"(c),[lshift]"I"(32-shift),[rshift]"I"(shift)
: "%hi","%lo"
);
} else {
// Constant shift outside [0, 32]: same instruction sequence as the
// run-time path below, with `shift` given as an immediate.
asm ("mult %[a], %[b] \t\n"
"nor %[tmp1],$zero,%[shift]\t\n"
"mflo %[res] \t\n"
"mfhi %[t] \t\n"
"srl %[res],%[res],%[shift] \t\n"
"sll %[tmp2],%[t],1 \t\n"
"sllv %[tmp2],%[tmp2],%[tmp1] \t\n"
"or %[tmp1],%[tmp2],%[res] \t\n"
"srav %[res],%[t],%[shift] \t\n"
"andi %[tmp2],%[shift],0x20\t\n"
"movz %[res],%[tmp1],%[tmp2]\t\n"
"subu %[res],%[res],%[c] \t\n"
: [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
: [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"I"(shift)
: "%hi","%lo"
);
}
} else {
// Run-time shift. Two candidates are built:
//   tmp1 = (LO >> shift) | (HI << 1 << ~shift)
//   res  = HI >> shift   (arithmetic, srav)
// movz replaces res with tmp1 when bit 5 of shift (shift & 0x20) is
// clear; otherwise the arithmetic shift of HI is kept. c is subtracted
// last.
asm ("mult %[a], %[b] \t\n"
"nor %[tmp1],$zero,%[shift]\t\n"
"mflo %[res] \t\n"
"mfhi %[t] \t\n"
"srl %[res],%[res],%[shift] \t\n"
"sll %[tmp2],%[t],1 \t\n"
"sllv %[tmp2],%[tmp2],%[tmp1] \t\n"
"or %[tmp1],%[tmp2],%[res] \t\n"
"srav %[res],%[t],%[shift] \t\n"
"andi %[tmp2],%[shift],0x20\t\n"
"movz %[res],%[tmp1],%[tmp2]\t\n"
"subu %[res],%[res],%[c] \t\n"
: [res]"=&r"(result),[t]"=&r"(t),[tmp1]"=&r"(tmp1),[tmp2]"=&r"(tmp2)
: [a]"r"(a),[b]"r"(b),[c]"r"(c),[shift]"r"(shift)
: "%hi","%lo"
);
}
return result;
}
435
/*
 * gglMulii (MIPS, pre-R6): full 32x32 -> 64-bit signed multiply.
 *
 * `mult` leaves the product in HI:LO; mfhi/mflo copy the two halves into
 * u.s.hi and u.s.lo, which the union overlays on the int64_t that is
 * returned. The order of `lo` and `hi` inside the struct is chosen by
 * __MIPSEL__ / __MIPSEB__ so that the overlay matches the target's byte
 * order; if neither macro is defined the struct has no members.
 */
inline int64_t gglMulii(int32_t x, int32_t y) CONST;
inline int64_t gglMulii(int32_t x, int32_t y) {
union {
struct {
#if defined(__MIPSEL__)
int32_t lo;
int32_t hi;
#elif defined(__MIPSEB__)
int32_t hi;
int32_t lo;
#endif
} s;
int64_t res;
}u;
// "%r" marks x and y as commutative; HI and LO are declared clobbered.
asm("mult %2, %3 \t\n"
"mfhi %1 \t\n"
"mflo %0 \t\n"
: "=r"(u.s.lo), "=&r"(u.s.hi)
: "%r"(x), "r"(y)
: "%hi","%lo"
);
return u.res;
}
459
460	#elif defined(__aarch64__)
461
462	// inline AArch64 implementations
463
/*
 * gglMulx (AArch64): rounded fixed-point multiply.
 *
 * Instruction by instruction:
 *   mov/lsl/lsr : round = (1 << shift) >> 1, computed in a 64-bit
 *                 register (this is 0 when shift is 0)
 *   smaddl      : result = x * y + round, as a 64-bit signed value
 *   lsr         : result >>= shift (logical)
 * The value left in `result` is returned.
 */
inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift) CONST;
inline GGLfixed gglMulx(GGLfixed x, GGLfixed y, int shift)
{
GGLfixed result;
GGLfixed round;

asm("mov %x[round], #1 \n"
"lsl %x[round], %x[round], %x[shift] \n"
"lsr %x[round], %x[round], #1 \n"
"smaddl %x[result], %w[x], %w[y],%x[round] \n"
"lsr %x[result], %x[result], %x[shift] \n"
: [round]"=&r"(round), [result]"=&r"(result) \
: [x]"r"(x), [y]"r"(y), [shift] "r"(shift) \
:
);
return result;
}
/*
 * gglMulAddx (AArch64): multiply-add on fixed-point operands.
 *
 *   smull : result = x * y as a 64-bit signed product
 *   lsr   : result >>= shift (logical, on the 64-bit register)
 *   add   : 32-bit add of `a` to the low word of the shifted product
 * No rounding term is added.
 */
inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
inline GGLfixed gglMulAddx(GGLfixed x, GGLfixed y, GGLfixed a, int shift)
{
GGLfixed result;
asm("smull %x[result], %w[x], %w[y] \n"
"lsr %x[result], %x[result], %x[shift] \n"
"add %w[result], %w[result], %w[a] \n"
: [result]"=&r"(result) \
: [x]"r"(x), [y]"r"(y), [a]"r"(a), [shift] "r"(shift) \
:
);
return result;
}
494
495	inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift) CONST;
496	inline GGLfixed gglMulSubx(GGLfixed x, GGLfixed y, GGLfixed a, int shift)
497	{
498
499	GGLfixed result;
500	int rshift;
501
502	asm("smull %x[result], %w[x], %w[y] \n"
503	"lsr %x[result], %x[result], %x[shift] \n"
504	"sub %w[result], %w[result], %w[a] \n"
505	: [result]"=&r"(result) \
506	: [x]"r"(x), [y]"r"(y), [a]"r"(a), [shift] "r"(shift) \
507	:
508	);
509	return result;
510	}
/*
 * gglMulii (AArch64): full 32x32 -> 64-bit signed multiply.
 *
 * A single smull takes the two 32-bit operands (%w1, %w2) and writes the
 * 64-bit product to the register holding `res` (%x0).
 */
inline int64_t gglMulii(int32_t x, int32_t y) CONST;
inline int64_t gglMulii(int32_t x, int32_t y)
{
int64_t res;
// "%r" marks x and y as commutative operands for the compiler.
asm("smull %x0, %w1, %w2 \n"
: "=r"(res)
: "%r"(x), "r"(y)
:
);
return res;
}
522
523	#else // ----------------------------------------------------------------------
524
525	inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) CONST;
526	inline GGLfixed gglMulx(GGLfixed a, GGLfixed b, int shift) {
527	return GGLfixed((int64_t(a)*b + (1<<(shift-1)))>>shift);
528	}
529	inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
530	inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
531	return GGLfixed((int64_t(a)*b)>>shift) + c;
532	}
533	inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) CONST;
534	inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c, int shift) {
535	return GGLfixed((int64_t(a)*b)>>shift) - c;
536	}
537	inline int64_t gglMulii(int32_t a, int32_t b) CONST;
538	inline int64_t gglMulii(int32_t a, int32_t b) {
539	return int64_t(a)*b;
540	}
541
542	#endif
543
544	// ------------------------------------------------------------------------
545
546	inline GGLfixed gglMulx(GGLfixed a, GGLfixed b) CONST;
547	inline GGLfixed gglMulx(GGLfixed a, GGLfixed b) {
548	return gglMulx(a, b, 16);
549	}
550	inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c) CONST;
551	inline GGLfixed gglMulAddx(GGLfixed a, GGLfixed b, GGLfixed c) {
552	return gglMulAddx(a, b, c, 16);
553	}
554	inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c) CONST;
555	inline GGLfixed gglMulSubx(GGLfixed a, GGLfixed b, GGLfixed c) {
556	return gglMulSubx(a, b, c, 16);
557	}
558
559	// ------------------------------------------------------------------------
560
561	inline int32_t gglClz(int32_t x) CONST;
562	inline int32_t gglClz(int32_t x)
563	{
564	#if (defined(__arm__) && !defined(__thumb__)) \|\| defined(__mips__) \|\| defined(__aarch64__)
565	return __builtin_clz(x);
566	#else
567	if (!x) return 32;
568	int32_t exp = 31;
569	if (x & 0xFFFF0000) { exp -=16; x >>= 16; }
570	if (x & 0x0000ff00) { exp -= 8; x >>= 8; }
571	if (x & 0x000000f0) { exp -= 4; x >>= 4; }
572	if (x & 0x0000000c) { exp -= 2; x >>= 2; }
573	if (x & 0x00000002) { exp -= 1; }
574	return exp;
575	#endif
576	}
577
578	// ------------------------------------------------------------------------
579
// Out-of-line division helper; only the prototype is visible in this header.
// NOTE(review): presumably returns n / d as a fixed-point value with `i`
// fractional bits -- confirm against the definition.
int32_t gglDivQ(GGLfixed n, GGLfixed d, int32_t i) CONST;
581
582	inline int32_t gglDivQ16(GGLfixed n, GGLfixed d) CONST;
583	inline int32_t gglDivQ16(GGLfixed n, GGLfixed d) {
584	return gglDivQ(n, d, 16);
585	}
586
587	inline int32_t gglDivx(GGLfixed n, GGLfixed d) CONST;
588	inline int32_t gglDivx(GGLfixed n, GGLfixed d) {
589	return gglDivQ(n, d, 16);
590	}
591
592	// ------------------------------------------------------------------------
593
594	inline GGLfixed gglRecipFast(GGLfixed x) CONST;
595	inline GGLfixed gglRecipFast(GGLfixed x)
596	{
597	// This is a really bad approximation of 1/x, but it's also
598	// very fast. x must be strictly positive.
599	// if x between [0.5, 1[ , then 1/x = 3-2*x
600	// (we use 2.30 fixed-point)
601	const int32_t lz = gglClz(x);
602	return (0xC0000000 - (x << (lz - 1))) >> (30-lz);
603	}
604
605	// ------------------------------------------------------------------------
606
/*
 * gglClampx: clamps c to the range [0, FIXED_ONE].
 *
 * Thumb builds use a branch-free sequence; all other builds first clamp
 * negative values to zero (one `bic` instruction on ARM and AArch64, the
 * equivalent C expression elsewhere) and then cap the value at FIXED_ONE
 * with a comparison.
 */
inline GGLfixed gglClampx(GGLfixed c) CONST;
inline GGLfixed gglClampx(GGLfixed c)
{
#if defined(__thumb__)
// clamp without branches
// c>>31 is used as an all-ones mask for negative c, so `c &= ~(c>>31)`
// zeroes negative values. Reflecting around FIXED_ONE (c = FIXED_ONE - c)
// turns "above FIXED_ONE" into "negative", so the second pass clamps the
// upper bound and reflects the value back.
c &= ~(c>>31); c = FIXED_ONE - c;
c &= ~(c>>31); c = FIXED_ONE - c;
#else
#if defined(__arm__)
// I don't know why gcc thinks it's smarter than me! The code below
// clamps to zero in one instruction, but gcc won't generate it and
// replaces it with a cmp + movlt (it's quite amazing actually).
// bic computes c & ~(c >> 31) with an arithmetic shift.
asm("bic %0, %1, %1, asr #31\n" : "=r"(c) : "r"(c));
#elif defined(__aarch64__)
// Same single-instruction clamp to zero, on the 32-bit register views.
asm("bic %w0, %w1, %w1, asr #31\n" : "=r"(c) : "r"(c));
#else
c &= ~(c>>31);
#endif
// Upper bound.
if (c>FIXED_ONE)
c = FIXED_ONE;
#endif
return c;
}
630
631	// ------------------------------------------------------------------------
632
633	#endif // ANDROID_GGL_FIXED_H