^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 1) /* SPDX-License-Identifier: GPL-2.0 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 2) // Copyright (C) 2018 Hangzhou C-SKY Microsystems co.,ltd.
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 3)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 4) #include <linux/linkage.h>
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 5) #include "sysdep.h"
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 6)
/*
 * int memcmp(const void *s1, const void *s2, size_t len)
 *
 * In:   r0 = s1, r1 = s2, r2 = len
 * Out:  r0 = 0 when all len bytes match, otherwise the difference
 *       (s1 byte - s2 byte) of the first mismatching byte pair.
 *
 * Register use inside the routine:
 *   r3        walking s1 pointer (r0 is freed up to hold the result)
 *   r1        walking s2 pointer
 *   r2        remaining length; reduced by the alignment prologue
 *   r4        scratch for the s2 byte; the caller's value is parked in
 *             r12 on entry and put back at .L_return
 *   r13       number of leading bytes to compare until s1 is aligned
 *   r18       loop counter
 *   r19       constant 4
 *   r20, r21  words loaded from s1 / s2
 *
 * Only s1 is brought to a 4-byte boundary; s2 is read with ldw at
 * whatever alignment it has.
 */
ENTRY(memcmp)
	/* Free r0 for the result (0 = equal so far) and save r4. */
	mov	r3, r0
	movi	r0, 0
	mov	r12, r4

	/* Fewer than 4 bytes: compare them one at a time. */
	cmplti	r2, 4
	bt	.L_compare_by_byte

	/*
	 * r13 = s1 & 3.  The pointer lives in r3 now; r0 was just zeroed,
	 * so testing r0 here would always report "aligned".
	 */
	andi	r13, r3, 3
	movi	r19, 4

	/* Test if s1 is not 4 bytes aligned. */
	bnez	r13, .L_s1_not_aligned

	LABLE_ALIGN
.L_s1_aligned:
	/* r18 = len / 16: number of 4-word groups to compare. */
	zext	r18, r2, 31, 4
	/* Test if len less than 16 bytes. */
	bez	r18, .L_compare_by_word

.L_compare_by_4word:
	/* Compare four words per iteration; bail out on the first mismatch. */
	ldw	r20, (r3, 0)
	ldw	r21, (r1, 0)
	/* If s1[i] != s2[i], goto .L_byte_check. */
	cmpne	r20, r21
	bt	.L_byte_check

	ldw	r20, (r3, 4)
	ldw	r21, (r1, 4)
	cmpne	r20, r21
	bt	.L_byte_check

	ldw	r20, (r3, 8)
	ldw	r21, (r1, 8)
	cmpne	r20, r21
	bt	.L_byte_check

	ldw	r20, (r3, 12)
	ldw	r21, (r1, 12)
	cmpne	r20, r21
	bt	.L_byte_check

	PRE_BNEZAD (r18)
	addi	r3, 16
	addi	r1, 16

	BNEZAD (r18, .L_compare_by_4word)

.L_compare_by_word:
	/* r18 = bits 3..2 of len: whole words left after the 16-byte groups. */
	zext	r18, r2, 3, 2
	bez	r18, .L_compare_by_byte
.L_compare_by_word_loop:
	ldw	r20, (r3, 0)
	ldw	r21, (r1, 0)
	addi	r3, 4
	PRE_BNEZAD (r18)
	cmpne	r20, r21
	addi	r1, 4
	bt	.L_byte_check
	BNEZAD (r18, .L_compare_by_word_loop)

.L_compare_by_byte:
	/* r18 = bits 1..0 of len: trailing bytes. */
	zext	r18, r2, 1, 0
	bez	r18, .L_return
.L_compare_by_byte_loop:
	ldb	r0, (r3, 0)
	ldb	r4, (r1, 0)
	addi	r3, 1
	/* r0 = s1 byte - s2 byte; non-zero is the final result. */
	subu	r0, r4
	PRE_BNEZAD (r18)
	addi	r1, 1
	bnez	r0, .L_return
	BNEZAD (r18, .L_compare_by_byte_loop)

.L_return:
	/* Restore the caller's r4 and return with the result in r0. */
	mov	r4, r12
	rts

	/*
	 * r20 and r21 hold two words known to differ.  Compare them one byte
	 * at a time, in the order selected per endianness below, and return
	 * the difference of the first byte pair that does not match.
	 */
# ifdef __CSKYBE__
/* s1[i] != s2[i] in word, so we check byte 0. */
.L_byte_check:
	xtrb0	r0, r20
	xtrb0	r2, r21
	subu	r0, r2
	bnez	r0, .L_return

	/* check byte 1 */
	xtrb1	r0, r20
	xtrb1	r2, r21
	subu	r0, r2
	bnez	r0, .L_return

	/* check byte 2 */
	xtrb2	r0, r20
	xtrb2	r2, r21
	subu	r0, r2
	bnez	r0, .L_return

	/* check byte 3 */
	xtrb3	r0, r20
	xtrb3	r2, r21
	subu	r0, r2
	/* Must not fall through into .L_s1_not_aligned below. */
	br	.L_return
# else
/* s1[i] != s2[i] in word, so we check byte 3. */
.L_byte_check:
	xtrb3	r0, r20
	xtrb3	r2, r21
	subu	r0, r2
	bnez	r0, .L_return

	/* check byte 2 */
	xtrb2	r0, r20
	xtrb2	r2, r21
	subu	r0, r2
	bnez	r0, .L_return

	/* check byte 1 */
	xtrb1	r0, r20
	xtrb1	r2, r21
	subu	r0, r2
	bnez	r0, .L_return

	/* check byte 0 */
	xtrb0	r0, r20
	xtrb0	r2, r21
	subu	r0, r2
	br	.L_return
# endif /* !__CSKYBE__ */

/* Compare when s1 is not aligned. */
.L_s1_not_aligned:
	/*
	 * r13 = 4 - (s1 & 3): bytes up to the next word boundary.  Take them
	 * out of len first; len >= 4 here, so r2 cannot go negative.
	 */
	sub	r13, r19, r13
	sub	r2, r13
.L_s1_not_aligned_loop:
	ldb	r0, (r3, 0)
	ldb	r4, (r1, 0)
	addi	r3, 1
	subu	r0, r4
	PRE_BNEZAD (r13)
	addi	r1, 1
	bnez	r0, .L_return
	BNEZAD (r13, .L_s1_not_aligned_loop)
	/* s1 is word aligned now and r0 is still 0; continue word-wise. */
	br	.L_s1_aligned
ENDPROC(memcmp)