/*********************************************************************/ /* Copyright 2009, 2010 The University of Texas at Austin. */ /* All rights reserved. */ /* */ /* Redistribution and use in source and binary forms, with or */ /* without modification, are permitted provided that the following */ /* conditions are met: */ /* */ /* 1. Redistributions of source code must retain the above */ /* copyright notice, this list of conditions and the following */ /* disclaimer. */ /* */ /* 2. Redistributions in binary form must reproduce the above */ /* copyright notice, this list of conditions and the following */ /* disclaimer in the documentation and/or other materials */ /* provided with the distribution. */ /* */ /* THIS SOFTWARE IS PROVIDED BY THE UNIVERSITY OF TEXAS AT */ /* AUSTIN ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, */ /* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF */ /* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE */ /* DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY OF TEXAS AT */ /* AUSTIN OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, */ /* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES */ /* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE */ /* GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR */ /* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF */ /* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT */ /* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT */ /* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE */ /* POSSIBILITY OF SUCH DAMAGE. */ /* */ /* The views and conclusions contained in the software and */ /* documentation are those of the authors and should not be */ /* interpreted as representing official policies, either expressed */ /* or implied, of The University of Texas at Austin. */ /*********************************************************************/ #define ASSEMBLER #include "common.h" #define N $4 #define X $5 #define INCX $6 #define I $3 #define TEMP $7 #define a1 $f4 #define a2 $f5 #define a3 $f6 #define a4 $f7 #define a5 $f8 #define a6 $f9 #define a7 $f10 #define a8 $f11 #define t1 $f12 #define t2 $f13 #define t3 $f14 #define t4 $f15 #define s1 $f0 #define s2 $f1 #define s3 $f2 #define s4 $f3 #define x1 $2 #define x2 $8 #define x3 $9 #define x4 $10 PROLOGUE #ifdef F_INTERFACE LDINT N, 0(N) LDINT INCX, 0(INCX) #endif blez N, .L999 li x1, 0 blez INCX, .L999 dsll INCX, INCX, BASE_SHIFT LD a1, 0 * SIZE(X) daddiu N, N, -1 blez N, .L999 li x1, 1 FABS s1, a1 daddu X, X, INCX FABS s2, a1 li x2, 1 FABS s3, a1 dsra I, N, 3 FABS s4, a1 li x3, 1 li TEMP, 2 blez I, .L15 li x4, 1 LD a1, 0 * SIZE(X) daddu X, X, INCX LD a2, 0 * SIZE(X) daddu X, X, INCX LD a3, 0 * SIZE(X) daddu X, X, INCX LD a4, 0 * SIZE(X) daddu X, X, INCX LD a5, 0 * SIZE(X) daddu X, X, INCX LD a6, 0 * SIZE(X) daddu X, X, INCX LD a7, 0 * SIZE(X) daddu X, X, INCX LD a8, 0 * SIZE(X) daddiu I, I, -1 blez I, .L13 daddu X, X, INCX .align 3 .L12: FABS t1, a1 LD a1, 0 * SIZE(X) FABS t2, a2 daddu X, X, INCX FABS t3, a3 LD a2, 0 * SIZE(X) FABS t4, a4 daddu X, X, INCX CMPLT $fcc0, t1, s1 LD a3, 0 * SIZE(X) CMPLT $fcc1, t2, s2 daddu X, X, INCX CMPLT $fcc2, t3, s3 LD a4, 0 * SIZE(X) CMPLT $fcc3, t4, s4 daddu X, X, INCX CMOVT s1, t1, $fcc0 movt x1, TEMP, $fcc0 CMOVT s2, t2, $fcc1 movt x2, TEMP, $fcc1 CMOVT s3, t3, $fcc2 movt x3, TEMP, $fcc2 CMOVT s4, t4, $fcc3 movt x4, TEMP, $fcc3 daddiu TEMP, TEMP, 4 daddiu I, I, -1 FABS t1, a5 LD a5, 0 * SIZE(X) FABS t2, a6 daddu X, X, INCX FABS t3, a7 LD a6, 0 * SIZE(X) FABS t4, a8 daddu X, X, INCX CMPLT $fcc0, t1, s1 LD a7, 0 * SIZE(X) CMPLT $fcc1, t2, s2 daddu X, X, INCX CMPLT $fcc2, t3, s3 LD a8, 0 * SIZE(X) CMPLT $fcc3, t4, s4 daddu X, X, INCX CMOVT s1, t1, $fcc0 movt x1, TEMP, $fcc0 CMOVT s2, t2, $fcc1 movt x2, TEMP, $fcc1 CMOVT s3, t3, $fcc2 movt x3, TEMP, $fcc2 CMOVT s4, t4, $fcc3 movt x4, TEMP, $fcc3 bgtz I, .L12 daddiu TEMP, TEMP, 4 .align 3 .L13: FABS t1, a1 FABS t2, a2 FABS t3, a3 FABS t4, a4 CMPLT $fcc0, t1, s1 CMPLT $fcc1, t2, s2 CMPLT $fcc2, t3, s3 CMPLT $fcc3, t4, s4 CMOVT s1, t1, $fcc0 movt x1, TEMP, $fcc0 CMOVT s2, t2, $fcc1 movt x2, TEMP, $fcc1 CMOVT s3, t3, $fcc2 movt x3, TEMP, $fcc2 CMOVT s4, t4, $fcc3 movt x4, TEMP, $fcc3 FABS t1, a5 daddiu TEMP, TEMP, 4 FABS t2, a6 NOP FABS t3, a7 FABS t4, a8 CMPLT $fcc0, t1, s1 CMPLT $fcc1, t2, s2 CMPLT $fcc2, t3, s3 CMPLT $fcc3, t4, s4 CMOVT s1, t1, $fcc0 movt x1, TEMP, $fcc0 CMOVT s2, t2, $fcc1 movt x2, TEMP, $fcc1 CMOVT s3, t3, $fcc2 movt x3, TEMP, $fcc2 CMOVT s4, t4, $fcc3 movt x4, TEMP, $fcc3 daddiu TEMP, TEMP, 4 daddiu x2, x2, 1 daddiu x3, x3, 2 daddiu x4, x4, 3 .align 3 .L15: andi I, N, 7 blez I, .L998 NOP .align 3 .L16: LD a1, 0 * SIZE(X) daddu X, X, INCX FABS t1, a1 daddiu I, I, -1 CMPLT $fcc0, t1, s1 NOP CMOVT s1, t1, $fcc0 movt x1, TEMP, $fcc0 bgtz I, .L16 daddiu TEMP, TEMP, 1 .align 3 .L998: CMPLT $fcc0, s2, s1 CMPLT $fcc1, s4, s3 CMOVT s1, s2, $fcc0 movt x1, x2, $fcc0 CMOVT s3, s4, $fcc1 movt x3, x4, $fcc1 CMPLT $fcc0, s3, s1 CMOVT s1, s3, $fcc0 movt x1, x3, $fcc0 .align 3 .L999: j $31 NOP EPILOGUE