1*4882a593Smuzhiyun/* SPDX-License-Identifier: GPL-2.0 */ 2*4882a593Smuzhiyun/* GENmemcpy.S: Generic sparc64 memcpy. 3*4882a593Smuzhiyun * 4*4882a593Smuzhiyun * Copyright (C) 2007 David S. Miller (davem@davemloft.net) 5*4882a593Smuzhiyun */ 6*4882a593Smuzhiyun 7*4882a593Smuzhiyun#ifdef __KERNEL__ 8*4882a593Smuzhiyun#include <linux/linkage.h> 9*4882a593Smuzhiyun#define GLOBAL_SPARE %g7 10*4882a593Smuzhiyun#else 11*4882a593Smuzhiyun#define GLOBAL_SPARE %g5 12*4882a593Smuzhiyun#endif 13*4882a593Smuzhiyun 14*4882a593Smuzhiyun#ifndef EX_LD 15*4882a593Smuzhiyun#define EX_LD(x,y) x 16*4882a593Smuzhiyun#endif 17*4882a593Smuzhiyun 18*4882a593Smuzhiyun#ifndef EX_ST 19*4882a593Smuzhiyun#define EX_ST(x,y) x 20*4882a593Smuzhiyun#endif 21*4882a593Smuzhiyun 22*4882a593Smuzhiyun#ifndef LOAD 23*4882a593Smuzhiyun#define LOAD(type,addr,dest) type [addr], dest 24*4882a593Smuzhiyun#endif 25*4882a593Smuzhiyun 26*4882a593Smuzhiyun#ifndef STORE 27*4882a593Smuzhiyun#define STORE(type,src,addr) type src, [addr] 28*4882a593Smuzhiyun#endif 29*4882a593Smuzhiyun 30*4882a593Smuzhiyun#ifndef FUNC_NAME 31*4882a593Smuzhiyun#define FUNC_NAME GENmemcpy 32*4882a593Smuzhiyun#endif 33*4882a593Smuzhiyun 34*4882a593Smuzhiyun#ifndef PREAMBLE 35*4882a593Smuzhiyun#define PREAMBLE 36*4882a593Smuzhiyun#endif 37*4882a593Smuzhiyun 38*4882a593Smuzhiyun#ifndef XCC 39*4882a593Smuzhiyun#define XCC xcc 40*4882a593Smuzhiyun#endif 41*4882a593Smuzhiyun 42*4882a593Smuzhiyun .register %g2,#scratch 43*4882a593Smuzhiyun .register %g3,#scratch 44*4882a593Smuzhiyun 45*4882a593Smuzhiyun .text 46*4882a593Smuzhiyun 47*4882a593Smuzhiyun#ifndef EX_RETVAL 48*4882a593Smuzhiyun#define EX_RETVAL(x) x 49*4882a593SmuzhiyunENTRY(GEN_retl_o4_1) 50*4882a593Smuzhiyun add %o4, %o2, %o4 51*4882a593Smuzhiyun retl 52*4882a593Smuzhiyun add %o4, 1, %o0 53*4882a593SmuzhiyunENDPROC(GEN_retl_o4_1) 54*4882a593SmuzhiyunENTRY(GEN_retl_g1_8) 55*4882a593Smuzhiyun add %g1, %o2, %g1 56*4882a593Smuzhiyun retl 57*4882a593Smuzhiyun add %g1, 8, %o0 58*4882a593SmuzhiyunENDPROC(GEN_retl_g1_8) 59*4882a593SmuzhiyunENTRY(GEN_retl_o2_4) 60*4882a593Smuzhiyun retl 61*4882a593Smuzhiyun add %o2, 4, %o0 62*4882a593SmuzhiyunENDPROC(GEN_retl_o2_4) 63*4882a593SmuzhiyunENTRY(GEN_retl_o2_1) 64*4882a593Smuzhiyun retl 65*4882a593Smuzhiyun add %o2, 1, %o0 66*4882a593SmuzhiyunENDPROC(GEN_retl_o2_1) 67*4882a593Smuzhiyun#endif 68*4882a593Smuzhiyun 69*4882a593Smuzhiyun .align 64 70*4882a593Smuzhiyun 71*4882a593Smuzhiyun .globl FUNC_NAME 72*4882a593Smuzhiyun .type FUNC_NAME,#function 73*4882a593SmuzhiyunFUNC_NAME: /* %o0=dst, %o1=src, %o2=len */ 74*4882a593Smuzhiyun srlx %o2, 31, %g2 75*4882a593Smuzhiyun cmp %g2, 0 76*4882a593Smuzhiyun tne %XCC, 5 77*4882a593Smuzhiyun PREAMBLE 78*4882a593Smuzhiyun mov %o0, GLOBAL_SPARE 79*4882a593Smuzhiyun 80*4882a593Smuzhiyun cmp %o2, 0 81*4882a593Smuzhiyun be,pn %XCC, 85f 82*4882a593Smuzhiyun or %o0, %o1, %o3 83*4882a593Smuzhiyun cmp %o2, 16 84*4882a593Smuzhiyun blu,a,pn %XCC, 80f 85*4882a593Smuzhiyun or %o3, %o2, %o3 86*4882a593Smuzhiyun 87*4882a593Smuzhiyun xor %o0, %o1, %o4 88*4882a593Smuzhiyun andcc %o4, 0x7, %g0 89*4882a593Smuzhiyun bne,a,pn %XCC, 90f 90*4882a593Smuzhiyun sub %o0, %o1, %o3 91*4882a593Smuzhiyun 92*4882a593Smuzhiyun and %o0, 0x7, %o4 93*4882a593Smuzhiyun sub %o4, 0x8, %o4 94*4882a593Smuzhiyun sub %g0, %o4, %o4 95*4882a593Smuzhiyun sub %o2, %o4, %o2 96*4882a593Smuzhiyun1: subcc %o4, 1, %o4 97*4882a593Smuzhiyun EX_LD(LOAD(ldub, %o1, %g1),GEN_retl_o4_1) 98*4882a593Smuzhiyun EX_ST(STORE(stb, %g1, %o0),GEN_retl_o4_1) 99*4882a593Smuzhiyun add %o1, 1, %o1 100*4882a593Smuzhiyun bne,pt %XCC, 1b 101*4882a593Smuzhiyun add %o0, 1, %o0 102*4882a593Smuzhiyun 103*4882a593Smuzhiyun andn %o2, 0x7, %g1 104*4882a593Smuzhiyun sub %o2, %g1, %o2 105*4882a593Smuzhiyun1: subcc %g1, 0x8, %g1 106*4882a593Smuzhiyun EX_LD(LOAD(ldx, %o1, %g2),GEN_retl_g1_8) 107*4882a593Smuzhiyun EX_ST(STORE(stx, %g2, %o0),GEN_retl_g1_8) 108*4882a593Smuzhiyun add %o1, 0x8, %o1 109*4882a593Smuzhiyun bne,pt %XCC, 1b 110*4882a593Smuzhiyun add %o0, 0x8, %o0 111*4882a593Smuzhiyun 112*4882a593Smuzhiyun brz,pt %o2, 85f 113*4882a593Smuzhiyun sub %o0, %o1, %o3 114*4882a593Smuzhiyun ba,a,pt %XCC, 90f 115*4882a593Smuzhiyun 116*4882a593Smuzhiyun .align 64 117*4882a593Smuzhiyun80: /* 0 < len <= 16 */ 118*4882a593Smuzhiyun andcc %o3, 0x3, %g0 119*4882a593Smuzhiyun bne,pn %XCC, 90f 120*4882a593Smuzhiyun sub %o0, %o1, %o3 121*4882a593Smuzhiyun 122*4882a593Smuzhiyun1: 123*4882a593Smuzhiyun subcc %o2, 4, %o2 124*4882a593Smuzhiyun EX_LD(LOAD(lduw, %o1, %g1),GEN_retl_o2_4) 125*4882a593Smuzhiyun EX_ST(STORE(stw, %g1, %o1 + %o3),GEN_retl_o2_4) 126*4882a593Smuzhiyun bgu,pt %XCC, 1b 127*4882a593Smuzhiyun add %o1, 4, %o1 128*4882a593Smuzhiyun 129*4882a593Smuzhiyun85: retl 130*4882a593Smuzhiyun mov EX_RETVAL(GLOBAL_SPARE), %o0 131*4882a593Smuzhiyun 132*4882a593Smuzhiyun .align 32 133*4882a593Smuzhiyun90: 134*4882a593Smuzhiyun subcc %o2, 1, %o2 135*4882a593Smuzhiyun EX_LD(LOAD(ldub, %o1, %g1),GEN_retl_o2_1) 136*4882a593Smuzhiyun EX_ST(STORE(stb, %g1, %o1 + %o3),GEN_retl_o2_1) 137*4882a593Smuzhiyun bgu,pt %XCC, 90b 138*4882a593Smuzhiyun add %o1, 1, %o1 139*4882a593Smuzhiyun retl 140*4882a593Smuzhiyun mov EX_RETVAL(GLOBAL_SPARE), %o0 141*4882a593Smuzhiyun 142*4882a593Smuzhiyun .size FUNC_NAME, .-FUNC_NAME 143