X-Git-Url: https://oss.titaniummirror.com/gitweb/?a=blobdiff_plain;f=gmp%2Fmpn%2Fpowerpc64%2Flogops_n.asm;fp=gmp%2Fmpn%2Fpowerpc64%2Flogops_n.asm;h=917b59f4557a32f1cc69a7c9cca90f2ed3da7e3a;hb=6fed43773c9b0ce596dca5686f37ac3fc0fa11c0;hp=0000000000000000000000000000000000000000;hpb=27b11d56b743098deb193d510b337ba22dc52e5c;p=msp430-gcc.git diff --git a/gmp/mpn/powerpc64/logops_n.asm b/gmp/mpn/powerpc64/logops_n.asm new file mode 100644 index 00000000..917b59f4 --- /dev/null +++ b/gmp/mpn/powerpc64/logops_n.asm @@ -0,0 +1,137 @@ +dnl PowerPC-64 mpn_and_n, mpn_andn_n, mpn_nand_n, mpn_ior_n, mpn_iorn_n, +dnl mpn_nior_n, mpn_xor_n, mpn_xnor_n -- mpn bitwise logical operations. + +dnl Copyright 2003, 2004, 2005 Free Software Foundation, Inc. + +dnl This file is part of the GNU MP Library. + +dnl The GNU MP Library is free software; you can redistribute it and/or modify +dnl it under the terms of the GNU Lesser General Public License as published +dnl by the Free Software Foundation; either version 3 of the License, or (at +dnl your option) any later version. + +dnl The GNU MP Library is distributed in the hope that it will be useful, but +dnl WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY +dnl or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public +dnl License for more details. + +dnl You should have received a copy of the GNU Lesser General Public License +dnl along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. + +include(`../config.m4') + +C cycles/limb +C POWER3/PPC630: 1.75 +C POWER4/PPC970: 2.10 + +C n POWER3/PPC630 POWER4/PPC970 +C 1 15.00 15.33 +C 2 7.50 7.99 +C 3 5.33 6.00 +C 4 4.50 4.74 +C 5 4.20 4.39 +C 6 3.50 3.99 +C 7 3.14 3.64 +C 8 3.00 3.36 +C 9 3.00 3.36 +C 10 2.70 3.25 +C 11 2.63 3.11 +C 12 2.58 3.00 +C 13 2.61 3.02 +C 14 2.42 2.82 +C 15 2.40 2.79 +C 50 2.08 2.67 +C 100 1.85 2.31 +C 200 1.80 2.18 +C 400 1.77 2.14 +C 1000 1.76 2.10# +C 2000 1.75# 2.13 +C 4000 2.30 2.57 +C 8000 2.62 2.58 +C 16000 2.52 4.25 +C 32000 2.49 16.25 +C 64000 2.66 18.76 + +ifdef(`OPERATION_and_n', +` define(`func',`mpn_and_n') + define(`logop', `and')') +ifdef(`OPERATION_andn_n', +` define(`func',`mpn_andn_n') + define(`logop', `andc')') +ifdef(`OPERATION_nand_n', +` define(`func',`mpn_nand_n') + define(`logop', `nand')') +ifdef(`OPERATION_ior_n', +` define(`func',`mpn_ior_n') + define(`logop', `or')') +ifdef(`OPERATION_iorn_n', +` define(`func',`mpn_iorn_n') + define(`logop', `orc')') +ifdef(`OPERATION_nior_n', +` define(`func',`mpn_nior_n') + define(`logop', `nor')') +ifdef(`OPERATION_xor_n', +` define(`func',`mpn_xor_n') + define(`logop', `xor')') +ifdef(`OPERATION_xnor_n', +` define(`func',`mpn_xnor_n') + define(`logop', `eqv')') + +C INPUT PARAMETERS +C rp r3 +C up r4 +C vp r5 +C n r6 + +MULFUNC_PROLOGUE(mpn_and_n mpn_andn_n mpn_nand_n mpn_ior_n mpn_iorn_n mpn_nior_n mpn_xor_n mpn_xnor_n) + +ASM_START() +PROLOGUE(func) + ld r8, 0(r4) C read lowest u limb + ld r9, 0(r5) C read lowest v limb + addi r6, r6, 3 C compute branch count (1) + rldic. r0, r6, 3, 59 C r0 = (n-1 & 3) << 3; cr0 = (n == 4(t+1))? + cmpldi cr6, r0, 16 C cr6 = (n cmp 4t + 3) + +ifdef(`HAVE_ABI_mode32', +` rldicl r6, r6, 62,34', C ...branch count +` rldicl r6, r6, 62, 2') C ...branch count + mtctr r6 + + ld r6, 0(r4) C read lowest u limb (again) + ld r7, 0(r5) C read lowest v limb (again) + + add r5, r5, r0 C offset vp + add r4, r4, r0 C offset up + add r3, r3, r0 C offset rp + + beq cr0, L(L01) + blt cr6, L(L10) + beq cr6, L(L11) + b L(L00) + +L(oop): ld r8, -24(r4) + ld r9, -24(r5) + logop r10, r6, r7 + std r10, -32(r3) +L(L00): ld r6, -16(r4) + ld r7, -16(r5) + logop r10, r8, r9 + std r10, -24(r3) +L(L11): ld r8, -8(r4) + ld r9, -8(r5) + logop r10, r6, r7 + std r10, -16(r3) +L(L10): ld r6, 0(r4) + ld r7, 0(r5) + logop r10, r8, r9 + std r10, -8(r3) +L(L01): addi r5, r5, 32 + addi r4, r4, 32 + addi r3, r3, 32 + bdnz L(oop) + + logop r10, r6, r7 + std r10, -32(r3) + blr +EPILOGUE()