mirror of
https://github.com/torvalds/linux.git
synced 2024-12-21 02:21:36 +00:00
e007c53397
Here we have another kind of deviation from the default case - a difference between exporting functions and non-functions. EXPORT_DATA_SYMBOL... is really different from EXPORT_SYMBOL... on ia64, and we need to use the right one when moving exports from *.c where C compiler has the required information to *.S, where we need to supply it manually. parisc64 will be another one like that. Tested-by: Tony Luck <tony.luck@intel.com> Signed-off-by: Al Viro <viro@zeniv.linux.org.uk>
79 lines
1.9 KiB
ArmAsm
79 lines
1.9 KiB
ArmAsm
/*
|
|
* Copyright (C) 1999-2002 Hewlett-Packard Co
|
|
* Stephane Eranian <eranian@hpl.hp.com>
|
|
* David Mosberger-Tang <davidm@hpl.hp.com>
|
|
* Copyright (C) 2002 Ken Chen <kenneth.w.chen@intel.com>
|
|
*
|
|
* 1/06/01 davidm Tuned for Itanium.
|
|
* 2/12/02 kchen Tuned for both Itanium and McKinley
|
|
* 3/08/02 davidm Some more tweaking
|
|
*/
|
|
|
|
#include <asm/asmmacro.h>
|
|
#include <asm/page.h>
|
|
#include <asm/export.h>
|
|
|
|
#ifdef CONFIG_ITANIUM
|
|
# define L3_LINE_SIZE 64 // Itanium L3 line size
|
|
# define PREFETCH_LINES 9 // magic number
|
|
#else
|
|
# define L3_LINE_SIZE 128 // McKinley L3 line size
|
|
# define PREFETCH_LINES 12 // magic number
|
|
#endif
|
|
|
|
#define saved_lc r2
|
|
#define dst_fetch r3
|
|
#define dst1 r8
|
|
#define dst2 r9
|
|
#define dst3 r10
|
|
#define dst4 r11
|
|
|
|
#define dst_last r31
|
|
|
|
GLOBAL_ENTRY(clear_page)
|
|
.prologue
|
|
.regstk 1,0,0,0
|
|
mov r16 = PAGE_SIZE/L3_LINE_SIZE-1 // main loop count, -1=repeat/until
|
|
.save ar.lc, saved_lc
|
|
mov saved_lc = ar.lc
|
|
|
|
.body
|
|
mov ar.lc = (PREFETCH_LINES - 1)
|
|
mov dst_fetch = in0
|
|
adds dst1 = 16, in0
|
|
adds dst2 = 32, in0
|
|
;;
|
|
.fetch: stf.spill.nta [dst_fetch] = f0, L3_LINE_SIZE
|
|
adds dst3 = 48, in0 // executing this multiple times is harmless
|
|
br.cloop.sptk.few .fetch
|
|
;;
|
|
addl dst_last = (PAGE_SIZE - PREFETCH_LINES*L3_LINE_SIZE), dst_fetch
|
|
mov ar.lc = r16 // one L3 line per iteration
|
|
adds dst4 = 64, in0
|
|
;;
|
|
#ifdef CONFIG_ITANIUM
|
|
// Optimized for Itanium
|
|
1: stf.spill.nta [dst1] = f0, 64
|
|
stf.spill.nta [dst2] = f0, 64
|
|
cmp.lt p8,p0=dst_fetch, dst_last
|
|
;;
|
|
#else
|
|
// Optimized for McKinley
|
|
1: stf.spill.nta [dst1] = f0, 64
|
|
stf.spill.nta [dst2] = f0, 64
|
|
stf.spill.nta [dst3] = f0, 64
|
|
stf.spill.nta [dst4] = f0, 128
|
|
cmp.lt p8,p0=dst_fetch, dst_last
|
|
;;
|
|
stf.spill.nta [dst1] = f0, 64
|
|
stf.spill.nta [dst2] = f0, 64
|
|
#endif
|
|
stf.spill.nta [dst3] = f0, 64
|
|
(p8) stf.spill.nta [dst_fetch] = f0, L3_LINE_SIZE
|
|
br.cloop.sptk.few 1b
|
|
;;
|
|
mov ar.lc = saved_lc // restore lc
|
|
br.ret.sptk.many rp
|
|
END(clear_page)
|
|
EXPORT_SYMBOL(clear_page)
|