/* SPDX-License-Identifier: GPL-2.0 */
// Copyright (C) 2018 Hangzhou C-SKY Microsystems co.,ltd.

#include <linux/linkage.h>
#include "sysdep.h"

/*
 * void *memmove(void *dest, const void *src, size_t len)
 *
 * In:   r0 = dest, r1 = src, r2 = len
 * Out:  r0 = dest
 *
 * If (dest - src), compared as an unsigned value, is >= len, the copy is
 * handed to memcpy (presumably because a forward copy cannot overwrite
 * source bytes that are still unread in that case).  Otherwise both
 * pointers are advanced to the end of their buffers and the data is
 * copied from the highest address downwards:
 *
 *   1. copy single bytes until the end of dest is 4-byte aligned,
 *   2. copy 16-byte chunks (len >> 4 of them),
 *   3. copy the remaining whole words (bits 3..2 of len),
 *   4. copy the remaining bytes (bits 1..0 of len).
 *
 * Registers written on the backward path:
 *   r0, r1    end-of-region cursors for dest / src, moving downwards
 *   r2        bytes still to copy (reduced only by the alignment step)
 *   r3        data scratch (r20-r23 as well in the non-CK860 chunk loop)
 *   r12       original dest, moved back into r0 before returning
 *   r13       misalignment of the dest end (0..3), then loop counter
 *   r18       loop counter for the chunk, word and byte loops
 *
 * LABLE_ALIGN, PRE_BNEZAD and BNEZAD are not defined in this file
 * (presumably they come from sysdep.h).  They are used here as a
 * "decrement the counter, loop while it is non-zero" pair; the CK860
 * chunk loop uses BNEZAD alone, so on that core BNEZAD is assumed to do
 * the decrement itself -- TODO confirm against sysdep.h.
 *
 * NOTE(review): cmplti looks like a signed compare, so a len with bit 31
 * set would be treated as "less than 4" -- confirm this cannot occur for
 * the callers of this routine.
 */
	.weak memmove
ENTRY(__memmove)
ENTRY(memmove)
	/* r3 = dest - src; unsigned r3 >= len means memcpy can do the job. */
	subu	r3, r0, r1
	cmphs	r3, r2
	bt	memcpy

	/* Keep the return value and point r0/r1 one past the last byte. */
	mov	r12, r0
	addu	r0, r0, r2
	addu	r1, r1, r2

	/* Fewer than 4 bytes in total: byte copy only. */
	cmplti	r2, 4
	bt	.L_copy_by_byte

	/* r13 = number of bytes by which the dest end is off a word boundary. */
	andi	r13, r0, 3
	bnez	r13, .L_dest_not_aligned
	/*
	 * src alignment is not checked: per the original author's note,
	 * hardware can handle unaligned access directly.
	 */
.L_dest_aligned:
	/* r18 = len >> 4, the number of 16-byte chunks. */
	zext	r18, r2, 31, 4
	/* No full chunk: go straight to the word loop. */
	bez	r18, .L_len_less_16bytes

	/* len >= 16 bytes: copy one 16-byte chunk per iteration. */
	LABLE_ALIGN
.L_len_larger_16bytes:
	subi	r1, 16
	subi	r0, 16
#if defined(__CK860__)
	/* Word by word, highest address first, through a single scratch reg. */
	ldw	r3, (r1, 12)
	stw	r3, (r0, 12)
	ldw	r3, (r1, 8)
	stw	r3, (r0, 8)
	ldw	r3, (r1, 4)
	stw	r3, (r0, 4)
	ldw	r3, (r1, 0)
	stw	r3, (r0, 0)
#else
	/* Load the whole chunk before storing any of it. */
	ldw	r20, (r1, 0)
	ldw	r21, (r1, 4)
	ldw	r22, (r1, 8)
	ldw	r23, (r1, 12)
	stw	r20, (r0, 0)
	stw	r21, (r0, 4)
	stw	r22, (r0, 8)
	stw	r23, (r0, 12)
	PRE_BNEZAD (r18)
#endif
	BNEZAD (r18, .L_len_larger_16bytes)

.L_len_less_16bytes:
	/* r18 = bits 3..2 of len, the number of whole words left (0..3). */
	zext	r18, r2, 3, 2
	bez	r18, .L_copy_by_byte
.L_len_less_16bytes_loop:
	subi	r1, 4
	subi	r0, 4
	ldw	r3, (r1, 0)
	PRE_BNEZAD (r18)
	stw	r3, (r0, 0)
	BNEZAD (r18, .L_len_less_16bytes_loop)

	/* Copy the trailing bytes: r18 = bits 1..0 of len (0..3). */
.L_copy_by_byte:
	zext	r18, r2, 1, 0
	bez	r18, .L_return
.L_copy_by_byte_loop:
	subi	r1, 1
	subi	r0, 1
	ldb	r3, (r1, 0)
	PRE_BNEZAD (r18)
	stb	r3, (r0, 0)
	BNEZAD (r18, .L_copy_by_byte_loop)

.L_return:
	/* Return the original dest pointer. */
	mov	r0, r12
	rts

	/*
	 * The dest end is not word aligned: copy r13 single bytes so that it
	 * becomes aligned, and take those bytes off the remaining length.
	 */
.L_dest_not_aligned:
	sub	r2, r13
.L_dest_not_aligned_loop:
	subi	r1, 1
	subi	r0, 1
	ldb	r3, (r1, 0)
	PRE_BNEZAD (r13)
	stb	r3, (r0, 0)
	BNEZAD (r13, .L_dest_not_aligned_loop)
	/* Fewer than 4 bytes left: finish with the byte loop. */
	cmplti	r2, 4
	bt	.L_copy_by_byte
	/* The dest end is now word aligned: continue with the word copy. */
	jbr	.L_dest_aligned
ENDPROC(memmove)
ENDPROC(__memmove)