6d685e5318
These are all functions which are invoked from elsewhere, so annotate them as global using the new SYM_FUNC_START and their ENDPROC's by SYM_FUNC_END. Now, ENTRY/ENDPROC can be forced to be undefined on X86, so do so. Signed-off-by: Jiri Slaby <jslaby@suse.cz> Signed-off-by: Borislav Petkov <bp@suse.de> Cc: Allison Randal <allison@lohutok.net> Cc: Andrey Ryabinin <aryabinin@virtuozzo.com> Cc: Andy Lutomirski <luto@kernel.org> Cc: Andy Shevchenko <andy@infradead.org> Cc: Ard Biesheuvel <ard.biesheuvel@linaro.org> Cc: Bill Metzenthen <billm@melbpc.org.au> Cc: Boris Ostrovsky <boris.ostrovsky@oracle.com> Cc: Darren Hart <dvhart@infradead.org> Cc: "David S. Miller" <davem@davemloft.net> Cc: Greg Kroah-Hartman <gregkh@linuxfoundation.org> Cc: Herbert Xu <herbert@gondor.apana.org.au> Cc: "H. Peter Anvin" <hpa@zytor.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: linux-arch@vger.kernel.org Cc: linux-crypto@vger.kernel.org Cc: linux-efi <linux-efi@vger.kernel.org> Cc: linux-efi@vger.kernel.org Cc: linux-pm@vger.kernel.org Cc: Mark Rutland <mark.rutland@arm.com> Cc: Matt Fleming <matt@codeblueprint.co.uk> Cc: Pavel Machek <pavel@ucw.cz> Cc: platform-driver-x86@vger.kernel.org Cc: "Rafael J. Wysocki" <rjw@rjwysocki.net> Cc: Thomas Gleixner <tglx@linutronix.de> Cc: Will Deacon <will@kernel.org> Cc: x86-ml <x86@kernel.org> Link: https://lkml.kernel.org/r/20191011115108.12392-28-jslaby@suse.cz
138 lines
4.0 KiB
ArmAsm
138 lines
4.0 KiB
ArmAsm
/* SPDX-License-Identifier: GPL-2.0 */
|
|
/*---------------------------------------------------------------------------+
|
|
| polynomial_Xsig.S |
|
|
| |
|
|
| Fixed point arithmetic polynomial evaluation. |
|
|
| |
|
|
| Copyright (C) 1992,1993,1994,1995 |
|
|
| W. Metzenthen, 22 Parker St, Ormond, Vic 3163, |
|
|
| Australia. E-mail billm@jacobi.maths.monash.edu.au |
|
|
| |
|
|
| Call from C as: |
|
|
| void polynomial_Xsig(Xsig *accum, unsigned long long x, |
|
|
| unsigned long long terms[], int n) |
|
|
| |
|
|
| Computes: |
|
|
| terms[0] + (terms[1] + (terms[2] + ... + (terms[n-1]*x)*x)*x)*x) ... )*x |
|
|
| and adds the result to the 12 byte Xsig. |
|
|
| The terms[] are each 8 bytes, but all computation is performed to 12 byte |
|
|
| precision. |
|
|
| |
|
|
| This function must be used carefully: most overflow of intermediate |
|
|
| results is controlled, but overflow of the result is not. |
|
|
| |
|
|
+---------------------------------------------------------------------------*/
|
|
.file "polynomial_Xsig.S"
|
|
|
|
#include "fpu_emu.h"
|
|
|
|
|
|
#define TERM_SIZE $8
|
|
#define SUM_MS -20(%ebp) /* sum ms long */
|
|
#define SUM_MIDDLE -24(%ebp) /* sum middle long */
|
|
#define SUM_LS -28(%ebp) /* sum ls long */
|
|
#define ACCUM_MS -4(%ebp) /* accum ms long */
|
|
#define ACCUM_MIDDLE -8(%ebp) /* accum middle long */
|
|
#define ACCUM_LS -12(%ebp) /* accum ls long */
|
|
#define OVERFLOWED -16(%ebp) /* addition overflow flag */
|
|
|
|
.text
|
|
SYM_FUNC_START(polynomial_Xsig)
|
|
pushl %ebp
|
|
movl %esp,%ebp
|
|
subl $32,%esp
|
|
pushl %esi
|
|
pushl %edi
|
|
pushl %ebx
|
|
|
|
movl PARAM2,%esi /* x */
|
|
movl PARAM3,%edi /* terms */
|
|
|
|
movl TERM_SIZE,%eax
|
|
mull PARAM4 /* n */
|
|
addl %eax,%edi
|
|
|
|
movl 4(%edi),%edx /* terms[n] */
|
|
movl %edx,SUM_MS
|
|
movl (%edi),%edx /* terms[n] */
|
|
movl %edx,SUM_MIDDLE
|
|
xor %eax,%eax
|
|
movl %eax,SUM_LS
|
|
movb %al,OVERFLOWED
|
|
|
|
subl TERM_SIZE,%edi
|
|
decl PARAM4
|
|
js L_accum_done
|
|
|
|
L_accum_loop:
|
|
xor %eax,%eax
|
|
movl %eax,ACCUM_MS
|
|
movl %eax,ACCUM_MIDDLE
|
|
|
|
movl SUM_MIDDLE,%eax
|
|
mull (%esi) /* x ls long */
|
|
movl %edx,ACCUM_LS
|
|
|
|
movl SUM_MIDDLE,%eax
|
|
mull 4(%esi) /* x ms long */
|
|
addl %eax,ACCUM_LS
|
|
adcl %edx,ACCUM_MIDDLE
|
|
adcl $0,ACCUM_MS
|
|
|
|
movl SUM_MS,%eax
|
|
mull (%esi) /* x ls long */
|
|
addl %eax,ACCUM_LS
|
|
adcl %edx,ACCUM_MIDDLE
|
|
adcl $0,ACCUM_MS
|
|
|
|
movl SUM_MS,%eax
|
|
mull 4(%esi) /* x ms long */
|
|
addl %eax,ACCUM_MIDDLE
|
|
adcl %edx,ACCUM_MS
|
|
|
|
testb $0xff,OVERFLOWED
|
|
jz L_no_overflow
|
|
|
|
movl (%esi),%eax
|
|
addl %eax,ACCUM_MIDDLE
|
|
movl 4(%esi),%eax
|
|
adcl %eax,ACCUM_MS /* This could overflow too */
|
|
|
|
L_no_overflow:
|
|
|
|
/*
|
|
* Now put the sum of next term and the accumulator
|
|
* into the sum register
|
|
*/
|
|
movl ACCUM_LS,%eax
|
|
addl (%edi),%eax /* term ls long */
|
|
movl %eax,SUM_LS
|
|
movl ACCUM_MIDDLE,%eax
|
|
adcl (%edi),%eax /* term ls long */
|
|
movl %eax,SUM_MIDDLE
|
|
movl ACCUM_MS,%eax
|
|
adcl 4(%edi),%eax /* term ms long */
|
|
movl %eax,SUM_MS
|
|
sbbb %al,%al
|
|
movb %al,OVERFLOWED /* Used in the next iteration */
|
|
|
|
subl TERM_SIZE,%edi
|
|
decl PARAM4
|
|
jns L_accum_loop
|
|
|
|
L_accum_done:
|
|
movl PARAM1,%edi /* accum */
|
|
movl SUM_LS,%eax
|
|
addl %eax,(%edi)
|
|
movl SUM_MIDDLE,%eax
|
|
adcl %eax,4(%edi)
|
|
movl SUM_MS,%eax
|
|
adcl %eax,8(%edi)
|
|
|
|
popl %ebx
|
|
popl %edi
|
|
popl %esi
|
|
leave
|
|
ret
|
|
SYM_FUNC_END(polynomial_Xsig)
|