include/asm/xor_64.h

*4882a593Smuzhiyun/* SPDX-License-Identifier: GPL-2.0 */
*4882a593Smuzhiyun#ifndef _ASM_X86_XOR_64_H
*4882a593Smuzhiyun#define _ASM_X86_XOR_64_H
*4882a593Smuzhiyun/*
*4882a593Smuzhiyun * xor_block_sse: the xor_block_template instance labelled generic_sse.
*4882a593Smuzhiyun *
*4882a593Smuzhiyun * Its do_2 .. do_5 slots are bound to xor_sse_2 .. xor_sse_5.  Those
*4882a593Smuzhiyun * routines and struct xor_block_template are not defined in this header,
*4882a593Smuzhiyun * so they must already be in scope wherever it is included.  Presumably
*4882a593Smuzhiyun * do_N is the routine that XORs N buffers together; confirm against the
*4882a593Smuzhiyun * struct definition.
*4882a593Smuzhiyun *
*4882a593Smuzhiyun * The object has static storage and internal linkage, so each translation
*4882a593Smuzhiyun * unit that includes this header gets its own copy.  It is handed to
*4882a593Smuzhiyun * xor_speed() by the XOR_TRY_TEMPLATES macro further down in this file.
*4882a593Smuzhiyun */
*4882a593Smuzhiyunstatic struct xor_block_template xor_block_sse = {
*4882a593Smuzhiyun	.name = "generic_sse",
*4882a593Smuzhiyun	.do_2 = xor_sse_2,
*4882a593Smuzhiyun	.do_3 = xor_sse_3,
*4882a593Smuzhiyun	.do_4 = xor_sse_4,
*4882a593Smuzhiyun	.do_5 = xor_sse_5,
*4882a593Smuzhiyun};
*4882a593Smuzhiyun
*4882a593Smuzhiyun
*4882a593Smuzhiyun/* Also try the AVX routines */
*4882a593Smuzhiyun#include <asm/xor_avx.h>
*4882a593Smuzhiyun
*4882a593Smuzhiyun/*
*4882a593Smuzhiyun * XOR_TRY_TEMPLATES: list of XOR templates to try on this architecture.
*4882a593Smuzhiyun *
*4882a593Smuzhiyun * Any earlier definition is dropped with #undef and the macro is redefined
*4882a593Smuzhiyun * as a single do { } while (0) statement, so it can be used wherever one
*4882a593Smuzhiyun * statement is expected.  In order, it expands AVX_XOR_SPEED and then calls
*4882a593Smuzhiyun * xor_speed() on xor_block_sse_pf64 and on xor_block_sse.  AVX_XOR_SPEED
*4882a593Smuzhiyun * and xor_block_sse_pf64 are not defined in this header; AVX_XOR_SPEED
*4882a593Smuzhiyun * presumably comes from asm/xor_avx.h included just above (TODO confirm).
*4882a593Smuzhiyun *
*4882a593Smuzhiyun * Rationale as recorded by the original authors:
*4882a593Smuzhiyun * We force the use of the SSE xor block because it can write around L2.
*4882a593Smuzhiyun * We may also be able to load into the L1 only depending on how the cpu
*4882a593Smuzhiyun * deals with a load to a line that is being prefetched.
*4882a593Smuzhiyun *
*4882a593Smuzhiyun * NOTE(review): this macro only hands candidates to xor_speed(); where the
*4882a593Smuzhiyun * SSE block is actually forced is not visible from this file.  Verify
*4882a593Smuzhiyun * against the code that consumes the results before relying on the word
*4882a593Smuzhiyun * force above.
*4882a593Smuzhiyun */
*4882a593Smuzhiyun#undef XOR_TRY_TEMPLATES
*4882a593Smuzhiyun#define XOR_TRY_TEMPLATES			\
*4882a593Smuzhiyundo {						\
*4882a593Smuzhiyun	AVX_XOR_SPEED;				\
*4882a593Smuzhiyun	xor_speed(&xor_block_sse_pf64);		\
*4882a593Smuzhiyun	xor_speed(&xor_block_sse);		\
*4882a593Smuzhiyun} while (0)
*4882a593Smuzhiyun
*4882a593Smuzhiyun#endif /* _ASM_X86_XOR_64_H */