Blame view

kernel/linux-rt-4.4.41/arch/arc/include/uapi/asm/swab.h 2.71 KB
5113f6f70   김현기   kernel add
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
  /*
   * Copyright (C) 2004, 2007-2010, 2011-2012 Synopsys, Inc. (www.synopsys.com)
   *
   * This program is free software; you can redistribute it and/or modify
   * it under the terms of the GNU General Public License version 2 as
   * published by the Free Software Foundation.
   *
   * vineetg: May 2011
   *  -Support single cycle endian-swap insn in ARC700 4.10
   *
   * vineetg: June 2009
   *  -Better htonl implementation (5 instead of 9 ALU instructions)
   *  -Hardware assisted single cycle bswap (Use Case of ARC custom instrn)
   */
  
  #ifndef __ASM_ARC_SWAB_H
  #define __ASM_ARC_SWAB_H
  
  #include <linux/types.h>
  
  /* Native single cycle endian swap insn */
  #ifdef CONFIG_ARC_HAS_SWAPE
  
  #define __arch_swab32(x)		\
  ({					\
  	unsigned int tmp = x;		\
  	__asm__(			\
  	"	swape	%0, %1	
  "	\
  	: "=r" (tmp)			\
  	: "r" (tmp));			\
  	tmp;				\
  })
  
  #else
  
  /* Several ways of Endian-Swap Emulation for ARC
   * 0: kernel generic
   * 1: ARC optimised "C"
   * 2: ARC Custom instruction
   */
  #define ARC_BSWAP_TYPE	1
  
  #if (ARC_BSWAP_TYPE == 1)		/******* Software only ********/
  
  /* The kernel default implementation of htonl is
   *		return  x<<24 | x>>24 |
   *		 (x & (__u32)0x0000ff00UL)<<8 | (x & (__u32)0x00ff0000UL)>>8;
   *
   * This generates 9 instructions on ARC (excluding the ld/st)
   *
   * 8051fd8c:	ld     r3,[r7,20]	; Mem op : Get the value to be swapped
   * 8051fd98:	asl    r5,r3,24		; get  3rd Byte
   * 8051fd9c:	lsr    r2,r3,24		; get  0th Byte
   * 8051fda0:	and    r4,r3,0xff00
   * 8051fda8:	asl    r4,r4,8		; get 1st Byte
   * 8051fdac:	and    r3,r3,0x00ff0000
   * 8051fdb4:	or     r2,r2,r5		; combine 0th and 3rd Bytes
   * 8051fdb8:	lsr    r3,r3,8		; 2nd Byte at correct place in Dst Reg
   * 8051fdbc:	or     r2,r2,r4		; combine 0,3 Bytes with 1st Byte
   * 8051fdc0:	or     r2,r2,r3		; combine 0,3,1 Bytes with 2nd Byte
   * 8051fdc4:	st     r2,[r1,20]	; Mem op : save result back to mem
   *
   * Joern suggested a better "C" algorithm which is great since
   * (1) It is portable to any architecure
   * (2) At the same time it takes advantage of ARC ISA (rotate intrns)
   */
  
  #define __arch_swab32(x)					\
  ({	unsigned long __in = (x), __tmp;			\
  	__tmp = __in << 8 | __in >> 24; /* ror tmp,in,24 */	\
  	__in = __in << 24 | __in >> 8; /* ror in,in,8 */	\
  	__tmp ^= __in;						\
  	__tmp &= 0xff00ff;					\
  	__tmp ^ __in;						\
  })
  
  #elif (ARC_BSWAP_TYPE == 2)	/* Custom single cycle bwap instruction */
  
  #define __arch_swab32(x)						\
  ({									\
  	unsigned int tmp = x;						\
  	__asm__(							\
  	"	.extInstruction	bswap, 7, 0x00, SUFFIX_NONE, SYNTAX_2OP	
  "\
  	"	bswap  %0, %1						
  "\
  	: "=r" (tmp)							\
  	: "r" (tmp));							\
  	tmp;								\
  })
  
  #endif /* ARC_BSWAP_TYPE=zzz */
  
  #endif /* CONFIG_ARC_HAS_SWAPE */
  
  #if !defined(__STRICT_ANSI__) || defined(__KERNEL__)
  #define __SWAB_64_THRU_32__
  #endif
  
  #endif