Blame view

kernel/linux-rt-4.4.41/arch/ia64/lib/clear_page.S 1.86 KB
5113f6f70   김현기   kernel add
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
  /*
   * Copyright (C) 1999-2002 Hewlett-Packard Co
   *	Stephane Eranian <eranian@hpl.hp.com>
   *	David Mosberger-Tang <davidm@hpl.hp.com>
   * Copyright (C) 2002 Ken Chen <kenneth.w.chen@intel.com>
   *
   * 1/06/01 davidm	Tuned for Itanium.
   * 2/12/02 kchen	Tuned for both Itanium and McKinley
   * 3/08/02 davidm	Some more tweaking
   */
  
  #include <asm/asmmacro.h>
  #include <asm/page.h>
  
  /*
   * Per-CPU tuning constants.
   *
   * L3_LINE_SIZE   - stride in bytes between successive run-ahead stores made
   *                  through dst_fetch; clear_page also derives its main loop
   *                  count from it (PAGE_SIZE/L3_LINE_SIZE iterations).
   * PREFETCH_LINES - number of lines touched by the initial .fetch loop in
   *                  clear_page before the main loop starts. The value is a
   *                  tuning constant; it is not derived anywhere in this file.
   */
  #ifdef CONFIG_ITANIUM
  # define L3_LINE_SIZE	64	// Itanium L3 line size
  # define PREFETCH_LINES	9	// magic number
  #else
  # define L3_LINE_SIZE	128	// McKinley L3 line size
  # define PREFETCH_LINES	12	// magic number
  #endif
  
  /*
   * Register aliases used by clear_page (in0 = first byte of the page):
   *
   *   saved_lc  - copy of ar.lc taken on entry, written back before return
   *   dst_fetch - run-ahead store pointer, starts at in0 and advances by
   *               L3_LINE_SIZE per store
   *   dst1..4   - main-loop store pointers, initialised to in0+16, in0+32,
   *               in0+48 and in0+64 respectively (dst4 is only stored
   *               through in the non-CONFIG_ITANIUM loop body)
   *   dst_last  - upper bound for dst_fetch; evaluates to in0 + PAGE_SIZE
   */
  #define saved_lc	r2
  #define dst_fetch	r3
  #define dst1		r8
  #define dst2		r9
  #define dst3		r10
  #define dst4		r11
  
  #define dst_last	r31
  
  /*
   * clear_page - fill one page (PAGE_SIZE bytes) with zeros.
   *
   * In:	in0 = address of the page (the only stacked register declared by
   *	      ".regstk 1,0,0,0").
   *	      NOTE(review): presumably page-aligned; the 16-byte stf.spill
   *	      stores at in0+0/16/32/... rely on at least 16-byte alignment.
   * Out:	nothing is returned in a register.
   * Uses:	r2, r3, r8-r11, r16, r31, p8; ar.lc is saved in r2 and restored.
   *
   * Every store is "stf.spill.nta [ptr] = f0, incr": it writes the 16-byte
   * spill image of f0 (the IA-64 constant +0.0 register) and then
   * post-increments ptr by incr. ".nta" is the non-temporal locality hint.
   *
   * Structure:
   *   1. .fetch loop: one store at offset 0 of each of the first
   *      PREFETCH_LINES lines, so dst_fetch ends PREFETCH_LINES lines ahead
   *      (presumably to get those lines in flight early - the header calls
   *      this file "tuned").
   *   2. main loop: PAGE_SIZE/L3_LINE_SIZE iterations, one L3 line each.
   *      dst1..dst4 fill offsets 16.. of the current line while dst_fetch
   *      keeps writing offset 0 of a line further ahead, until it reaches
   *      the end of the page.
   */
  GLOBAL_ENTRY(clear_page)
  	.prologue
  	.regstk 1,0,0,0
  	mov r16 = PAGE_SIZE/L3_LINE_SIZE-1	// main loop count, -1=repeat/until
  	// unwind annotation: ar.lc is kept in saved_lc from here on
  	.save ar.lc, saved_lc
  	mov saved_lc = ar.lc
  
  	.body
  	// br.cloop runs the loop body ar.lc+1 times, hence the "- 1"
  	mov ar.lc = (PREFETCH_LINES - 1)
  	mov dst_fetch = in0
  	adds dst1 = 16, in0
  	adds dst2 = 32, in0
  	;;
  	// run-ahead loop: zero the first 16 bytes of PREFETCH_LINES lines
  .fetch:	stf.spill.nta [dst_fetch] = f0, L3_LINE_SIZE
  	adds dst3 = 48, in0		// executing this multiple times is harmless
  	br.cloop.sptk.few .fetch
  	;;
  	// dst_fetch is now in0 + PREFETCH_LINES*L3_LINE_SIZE, so the sum
  	// below is in0 + PAGE_SIZE: the first address past the page
  	addl dst_last = (PAGE_SIZE - PREFETCH_LINES*L3_LINE_SIZE), dst_fetch
  	mov ar.lc = r16			// one L3 line per iteration
  	adds dst4 = 64, in0
  	;;
  #ifdef CONFIG_ITANIUM
  	// Optimized for Itanium
  	// 64-byte line: dst1/dst2 here and dst3 below cover offsets 16, 32
  	// and 48; offset 0 is covered by the dst_fetch stores
  1:	stf.spill.nta [dst1] = f0, 64
  	stf.spill.nta [dst2] = f0, 64
  	// p8 = dst_fetch has not reached the end of the page yet
  	cmp.lt p8,p0=dst_fetch, dst_last
  	;;
  #else
  	// Optimized for McKinley
  	// 128-byte line, first half: offsets 16, 32, 48 and 64
  1:	stf.spill.nta [dst1] = f0, 64
  	stf.spill.nta [dst2] = f0, 64
  	stf.spill.nta [dst3] = f0, 64
  	// dst4 is stored through once per iteration, so it steps a full line
  	stf.spill.nta [dst4] = f0, 128
  	// p8 = dst_fetch has not reached the end of the page yet
  	cmp.lt p8,p0=dst_fetch, dst_last
  	;;
  	// second half: dst1/dst2 (already advanced by 64) hit offsets 80, 96
  	stf.spill.nta [dst1] = f0, 64
  	stf.spill.nta [dst2] = f0, 64
  #endif
  	// common tail of both variants: last dst3 store for this line
  	// (offset 48 on Itanium, offset 112 on McKinley)
  	stf.spill.nta [dst3] = f0, 64
  	// keep running ahead only while still inside the page; p8 was set in
  	// the previous instruction group (before the stop above)
  (p8)	stf.spill.nta [dst_fetch] = f0, L3_LINE_SIZE
  	br.cloop.sptk.few 1b
  	;;
  	mov ar.lc = saved_lc		// restore lc
  	br.ret.sptk.many rp
  END(clear_page)