^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 1) /* SPDX-License-Identifier: GPL-2.0 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 2) /* linux/arch/sparc/lib/memset.S: Sparc optimized memset, bzero and clear_user code
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 3) * Copyright (C) 1991,1996 Free Software Foundation
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 4) * Copyright (C) 1996,1997 Jakub Jelinek (jj@sunsite.mff.cuni.cz)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 5) * Copyright (C) 1996 David S. Miller (davem@caip.rutgers.edu)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 6) *
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 7) * Calls to memset return the initial %o0. Calls to bzero return 0 on success,
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 8) * or the number of bytes not yet set if an exception occurs and we were
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 9) * called as clear_user.
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 10) */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 11)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 12) #include <asm/ptrace.h>
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 13) #include <asm/export.h>
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 14)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 15) /* Work around cpp -rob */
/* ALLOC and EXECINSTR hide the '#' of the #alloc / #execinstr section flags
 * behind object-like macros, so the flags can appear inside the
 * function-like macros below (presumably because cpp would otherwise read
 * '#' there as its stringify operator).
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 16) #define ALLOC #alloc
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 17) #define EXECINSTR #execinstr
/* EX(x,y,a,b): emit one store that is allowed to fault.
 *   x,y  - the store instruction; it is passed as two macro arguments only
 *          because the instruction itself contains a comma.
 *   a,b  - opcode plus first operand and the second operand of an
 *          instruction that is completed with ", %o0" as its destination.
 * Expansion:
 *   .text        98: the store itself.
 *   .fixup       99: "ba 30f" with "a, b, %o0" in its delay slot, so %o0
 *                    is computed on the way to label 30.
 *   __ex_table   the word pair (98b, 99b), tying the store to its stub.
 * Assembly continues in .text afterwards, so the macro contributes exactly
 * one instruction to the surrounding code and may sit in a delay slot.
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 18) #define EX(x,y,a,b) \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 19) 98: x,y; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 20) .section .fixup,ALLOC,EXECINSTR; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 21) .align 4; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 22) 99: ba 30f; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 23) a, b, %o0; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 24) .section __ex_table,ALLOC; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 25) .align 4; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 26) .word 98b, 99b; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 27) .text; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 28) .align 4
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 29)
/* EXT(start,end,handler): emit a four-word __ex_table entry
 * { start, 0, end, handler } and switch back to .text. No instruction is
 * added to the surrounding code.
 * NOTE(review): presumably the zero second word marks this as a range
 * entry, so that a fault at any instruction from start up to end is routed
 * to handler - confirm against the exception table lookup code.
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 30) #define EXT(start,end,handler) \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 31) .section __ex_table,ALLOC; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 32) .align 4; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 33) .word start, 0, end, handler; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 34) .text; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 35) .align 4
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 36)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 37) /* Please don't change these macros, unless you change the logic
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 38) * in the .fixup section below as well.
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 39) * Store 64 bytes at (BASE + OFFSET) using value SOURCE. */
/* ZERO_BIG_BLOCK(base, offset, source): eight std stores at ascending
 * displacements 0x00..0x38 from (base + offset). Each std writes one
 * 8-byte doubleword taken from the register pair that starts at source,
 * so one expansion is 8 instructions and fills 64 bytes.
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 40) #define ZERO_BIG_BLOCK(base, offset, source) \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 41) std source, [base + offset + 0x00]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 42) std source, [base + offset + 0x08]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 43) std source, [base + offset + 0x10]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 44) std source, [base + offset + 0x18]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 45) std source, [base + offset + 0x20]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 46) std source, [base + offset + 0x28]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 47) std source, [base + offset + 0x30]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 48) std source, [base + offset + 0x38];
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 49)
/* ZERO_LAST_BLOCKS(base, offset, source): eight std stores addressed
 * backwards from base, in ascending address order: the first doubleword is
 * at (base - offset - 0x38), the last at (base - offset). One expansion is
 * 8 instructions and fills 64 bytes.
 * This file expands it twice in a row with offsets 0x48 and 0x08, giving
 * 16 stores that fill the 128 bytes ending at base; the caller jumps into
 * the middle of that sequence so that only the last N doublewords before
 * base are written.
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 50) #define ZERO_LAST_BLOCKS(base, offset, source) \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 51) std source, [base - offset - 0x38]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 52) std source, [base - offset - 0x30]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 53) std source, [base - offset - 0x28]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 54) std source, [base - offset - 0x20]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 55) std source, [base - offset - 0x18]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 56) std source, [base - offset - 0x10]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 57) std source, [base - offset - 0x08]; \
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 58) std source, [base - offset - 0x00];
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 59)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 60) .text
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 61) .align 4
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 62)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 63) .globl __bzero_begin
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 64) __bzero_begin:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 65)
/* memset entry point.
 *   In:  %o0 = destination, %o1 = fill value (only the low 8 bits are
 *        used), %o2 = length in bytes.
 *   Out: %o0 = the destination as passed in (kept in %g1 and returned by
 *        the exit code at label 0).
 * Sets %g4 = 1 to mark the memset entry, replicates the fill byte into all
 * four bytes of %g3, moves the length into %o1 and joins the code shared
 * with __bzero at label 1.
 *
 * Labels 3 and 2 that follow are not part of the entry sequence: they are
 * reached from the shared code ("bne 3b") when the destination is not
 * word aligned, with %o2 = %o0 & 3 and a length greater than 7. They store
 * the 4 - %o2 leading bytes and re-enter the shared code at label 4.
 * Instructions written directly after a branch are its delay slot and
 * execute whether or not the branch is taken.
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 66) .globl __bzero
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 67) .type __bzero,#function
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 68) .globl memset
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 69) EXPORT_SYMBOL(__bzero)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 70) EXPORT_SYMBOL(memset)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 71) .globl __memset_start, __memset_end
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 72) __memset_start:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 73) memset:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 74) mov %o0, %g1 /* %g1 = destination to return */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 75) mov 1, %g4 /* %g4 = 1: entered as memset */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 76) and %o1, 0xff, %g3 /* %g3 = fill byte */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 77) sll %g3, 8, %g2
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 78) or %g3, %g2, %g3 /* byte copied into the low halfword */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 79) sll %g3, 16, %g2
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 80) or %g3, %g2, %g3 /* byte copied into all four bytes */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 81) b 1f
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 82) mov %o2, %o1 /* delay slot: %o1 = length */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 83) 3:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 84) cmp %o2, 3
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 85) be 2f /* misaligned by 3: one byte is enough */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 86) EX(stb %g3, [%o0], sub %o1, 0) /* delay slot: first byte, always stored */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 87)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 88) cmp %o2, 2
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 89) be 2f /* misaligned by 2: two bytes are enough */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 90) EX(stb %g3, [%o0 + 0x01], sub %o1, 1) /* delay slot: second byte */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 91)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 92) EX(stb %g3, [%o0 + 0x02], sub %o1, 2) /* third byte, only when %o2 == 1 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 93) 2:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 94) sub %o2, 4, %o2 /* %o2 = -(number of bytes just stored) */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 95) add %o1, %o2, %o1 /* length -= bytes stored */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 96) b 4f
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 97) sub %o0, %o2, %o0 /* delay slot: destination += bytes stored */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 98)
/* __bzero entry point and the fill code shared with memset.
 *   In:  %o0 = destination, %o1 = length in bytes.
 *   Out: %o0 = 0 when entered here (%g4 = 0); when entered through memset
 *        (%g4 = 1) the exit code returns %g1 instead.
 * Register use in the shared code:
 *   %g3 = 32-bit fill pattern, %g2 = copy of %g3 so that std can store the
 *   %g2/%g3 pair, %o1 = bytes still to set, %o2/%o3/%o4 = scratch.
 * Outline: lengths up to 7 go to label 7; otherwise the destination is
 * brought to 8-byte alignment, 128-byte blocks are stored in the loop at
 * label 10, the remaining whole doublewords by jumping into the store
 * sequence at label 12, and the last 0-7 bytes at label 13.
 * Every store is either wrapped in EX() or lies inside an EXT() range.
 * Instructions written directly after a branch are its delay slot.
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 99) __bzero:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 100) clr %g4 /* %g4 = 0: entered as __bzero */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 101) mov %g0, %g3 /* fill pattern = 0 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 102) 1:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 103) cmp %o1, 7
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 104) bleu 7f /* length <= 7 (unsigned): short path */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 105) andcc %o0, 3, %o2 /* delay slot: %o2 = word misalignment; flags used at 7 and by bne below */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 106)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 107) bne 3b /* not word aligned: store the leading bytes at label 3 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 108) 4:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 109) andcc %o0, 4, %g0 /* delay slot of bne above and target of "b 4f" */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 110)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 111) be 2f /* bit 2 clear: already 8-byte aligned */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 112) mov %g3, %g2 /* delay slot: %g2 = %g3, pair used by std */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 113)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 114) EX(st %g3, [%o0], sub %o1, 0) /* one word to reach 8-byte alignment */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 115) sub %o1, 4, %o1
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 116) add %o0, 4, %o0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 117) 2:
/* %o3 = length rounded down to a multiple of 128 (bytes for the loop at 10) */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 118) andcc %o1, 0xffffff80, %o3 ! Now everything is 8 aligned and o1 is len to run
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 119) be 9f /* no full 128-byte block */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 120) andcc %o1, 0x78, %o2 /* delay slot: %o2 = bytes in whole doublewords after the blocks; flags used at 9 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 121) 10:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 122) ZERO_BIG_BLOCK(%o0, 0x00, %g2)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 123) subcc %o3, 128, %o3 /* flags consumed by bne below */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 124) ZERO_BIG_BLOCK(%o0, 0x40, %g2)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 125) 11:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 126) EXT(10b, 11b, 20f) /* table entry only: range 10..11, handler 20 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 127) bne 10b
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 128) add %o0, 128, %o0 /* delay slot: advance past the block just stored */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 129)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 130) orcc %o2, %g0, %g0 /* re-test %o2: subcc replaced the flags set at 2 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 131) 9:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 132) be 13f /* no whole doublewords left */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 133) andcc %o1, 7, %o1 /* delay slot: %o1 = trailing bytes; flags tested at 13 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 134)
/* Computed jump into the 16 stores at label 12: each 4-byte std stores
 * 8 bytes, so %o2 bytes of data need %o2 / 2 bytes of instructions,
 * counted back from label 13. */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 135) srl %o2, 1, %o3
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 136) set 13f, %o4
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 137) sub %o4, %o3, %o4 /* %o4 = address of the first std to run */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 138) jmp %o4
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 139) add %o0, %o2, %o0 /* delay slot: the stores address backwards from the new %o0 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 140)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 141) 12:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 142) ZERO_LAST_BLOCKS(%o0, 0x48, %g2)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 143) ZERO_LAST_BLOCKS(%o0, 0x08, %g2)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 144) 13:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 145) EXT(12b, 13b, 21f) /* table entry only: range 12..13, handler 21 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 146) be 8f /* nothing left (flags from "andcc %o1, 7" or, via 7, from "orcc %o1") */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 147) andcc %o1, 4, %g0 /* delay slot */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 148)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 149) be 1f /* bit 2 clear: no word to store */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 150) andcc %o1, 2, %g0 /* delay slot */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 151)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 152) EX(st %g3, [%o0], and %o1, 7)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 153) add %o0, 4, %o0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 154) 1:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 155) be 1f /* bit 1 clear: no halfword to store */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 156) andcc %o1, 1, %g0 /* delay slot */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 157)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 158) EX(sth %g3, [%o0], and %o1, 3)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 159) add %o0, 2, %o0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 160) 1:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 161) bne,a 8f /* annulling branch: taken when bit 0 is set */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 162) EX(stb %g3, [%o0], and %o1, 1) /* delay slot: runs only when the branch is taken */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 163) 8:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 164) b 0f
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 165) nop
/* Short path: length <= 7, flags still from "andcc %o0, 3, %o2" */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 166) 7:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 167) be 13b /* word aligned: reuse the tail code at 13 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 168) orcc %o1, 0, %g0 /* delay slot: test length against zero */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 169)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 170) be 0f /* zero length: nothing to store */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 171) 8:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 172) add %o0, 1, %o0 /* delay slot of be above and head of the byte loop */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 173) subcc %o1, 1, %o1
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 174) bne 8b
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 175) EX(stb %g3, [%o0 - 1], add %o1, 1) /* delay slot: store; the fixup adds back the decrement */
/* Common exit: the return value depends on the entry point */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 176) 0:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 177) andcc %g4, 1, %g0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 178) be 5f /* %g4 = 0: entered as __bzero */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 179) nop
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 180) retl
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 181) mov %g1, %o0 /* delay slot: memset returns the saved destination */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 182) 5:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 183) retl
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 184) clr %o0 /* delay slot: __bzero returns 0 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 185) __memset_end:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 186)
/* Fault fixups. Labels 20 and 21 are the handlers named by the two EXT()
 * entries (ranges 10..11 and 12..13); label 30 is the common tail that the
 * EX() stubs also branch to. Each path computes a byte count into %o0
 * before reaching 30.
 * NOTE(review): %g2 is read here as a number, not as the fill pattern -
 * presumably the trap code overwrites it with the zero-based index of the
 * faulting instruction inside the EXT() range; confirm against the fault
 * handling code. The per-line notes below assume that reading.
 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 187) .section .fixup,#alloc,#execinstr
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 188) .align 4
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 189) 20:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 190) cmp %g2, 8
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 191) bleu 1f /* index 0..8: first 64-byte block, subcc not yet executed */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 192) and %o1, 0x7f, %o1 /* delay slot: bytes beyond the 128-byte blocks */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 193) sub %g2, 9, %g2 /* index within the second block (8 std + subcc precede it) */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 194) add %o3, 64, %o3 /* %o3 was already reduced by 128; the second block is still 64 bytes */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 195) 1:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 196) sll %g2, 3, %g2 /* 8 bytes per std */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 197) add %o3, %o1, %o0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 198) b 30f
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 199) sub %o0, %g2, %o0 /* delay slot: %o0 = %o3 + %o1 - 8 * %g2 */
/* NOTE(review): the range 12..13 holds 16 std instructions while the
 * computation below starts from 8 - confirm that 8 is the intended base. */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 200) 21:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 201) mov 8, %o0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 202) and %o1, 7, %o1
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 203) sub %o0, %g2, %o0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 204) sll %o0, 3, %o0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 205) b 30f
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 206) add %o0, %o1, %o0 /* delay slot: %o0 = (8 - %g2) * 8 + (%o1 & 7) */
/* Common tail: call lookup_fault(pc, return address, fault address) in a
 * new register window, then return to the caller of memset/__bzero. The
 * count computed in %o0 before this point is %i0 inside the new window and
 * becomes the caller-visible %o0 again after restore. */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 207) 30:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 208) /* %o4 is faulting address, %o5 is %pc where fault occurred */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 209) save %sp, -104, %sp /* new window: the previous %o registers are now %i */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 210) mov %i5, %o0 /* argument 0: %pc where the fault occurred */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 211) mov %i7, %o1 /* argument 1: %i7, the previous window's %o7 */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 212) call lookup_fault
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 213) mov %i4, %o2 /* delay slot: argument 2: faulting address */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 214) ret
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 215) restore /* delay slot: drop the window opened by save */
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 216)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 217) .globl __bzero_end
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 218) __bzero_end: