xor-neon.c 1.3 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647
  1. /*
  2. * linux/arch/arm/lib/xor-neon.c
  3. *
  4. * Copyright (C) 2013 Linaro Ltd <ard.biesheuvel@linaro.org>
  5. *
  6. * This program is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License version 2 as
  8. * published by the Free Software Foundation.
  9. */
  10. #include <linux/raid/xor.h>
  11. #include <linux/module.h>
  12. MODULE_LICENSE("GPL");
  13. #ifndef __ARM_NEON__
  14. #error You should compile this file with '-mfloat-abi=softfp -mfpu=neon'
  15. #endif
  16. /*
  17. * Pull in the reference implementations while instructing GCC (through
  18. * -ftree-vectorize) to attempt to exploit implicit parallelism and emit
  19. * NEON instructions.
  20. */
  21. #if __GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 6)
  22. #pragma GCC optimize "tree-vectorize"
  23. #else
  24. /*
  25. * While older versions of GCC do not generate incorrect code, they fail to
  26. * recognize the parallel nature of these functions, and emit plain ARM code,
  27. * which is known to be slower than the optimized ARM code in asm-arm/xor.h.
  28. */
  29. #warning This code requires at least version 4.6 of GCC
  30. #endif
  31. #pragma GCC diagnostic ignored "-Wunused-variable"
  32. #include <asm-generic/xor.h>
  33. struct xor_block_template const xor_block_neon_inner = {
  34. .name = "__inner_neon__",
  35. .do_2 = xor_8regs_2,
  36. .do_3 = xor_8regs_3,
  37. .do_4 = xor_8regs_4,
  38. .do_5 = xor_8regs_5,
  39. };
  40. EXPORT_SYMBOL(xor_block_neon_inner);