Blame view

kernel/linux-rt-4.4.41/arch/arm/lib/xor-neon.c 1.32 KB
5113f6f70   김현기   kernel add
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
  /*
   * linux/arch/arm/lib/xor-neon.c
   *
   * Copyright (C) 2013 Linaro Ltd <ard.biesheuvel@linaro.org>
   *
   * This program is free software; you can redistribute it and/or modify
   * it under the terms of the GNU General Public License version 2 as
   * published by the Free Software Foundation.
   */
  
  #include <linux/raid/xor.h>
  #include <linux/module.h>
  
  MODULE_LICENSE("GPL");
  
  #ifndef __ARM_NEON__
  #error You should compile this file with '-mfloat-abi=softfp -mfpu=neon'
  #endif
  
  /*
   * Pull in the reference implementations while instructing GCC (through
   * -ftree-vectorize) to attempt to exploit implicit parallelism and emit
   * NEON instructions.
   */
  #if __GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 6)
  #pragma GCC optimize "tree-vectorize"
  #else
  /*
   * While older versions of GCC do not generate incorrect code, they fail to
   * recognize the parallel nature of these functions, and emit plain ARM code,
   * which is known to be slower than the optimized ARM code in
   * arch/arm/include/asm/xor.h.
   */
  #warning This code requires at least version 4.6 of GCC
  #endif
  
  /*
   * The unused-variable diagnostic is switched off before the generic header
   * is included and stays off for the remainder of this file.
   * NOTE(review): presumably the header defines static objects that this file
   * never references -- confirm against <asm-generic/xor.h>.
   */
  #pragma GCC diagnostic ignored "-Wunused-variable"
  #include <asm-generic/xor.h>
  
  /*
   * Read-only XOR template exported to the rest of the kernel under the name
   * "__inner_neon__".  Its .do_2 through .do_5 handlers are the xor_8regs_*
   * routines made available by the include above, as compiled in this file
   * (see the vectorization pragma earlier in the file).
   */
  const struct xor_block_template xor_block_neon_inner = {
  	.name = "__inner_neon__",
  	.do_2 = xor_8regs_2,
  	.do_3 = xor_8regs_3,
  	.do_4 = xor_8regs_4,
  	.do_5 = xor_8regs_5,
  };
  EXPORT_SYMBOL(xor_block_neon_inner);