Merge tag 'drm-misc-next-2022-11-24' of git://anongit.freedesktop.org/drm/drm-misc...
[linux-block.git] / arch / xtensa / lib / strncpy_user.S
CommitLineData
249ac17e
CZ
1/*
2 * arch/xtensa/lib/strncpy_user.S
3 *
4 * This file is subject to the terms and conditions of the GNU General
5 * Public License. See the file "COPYING" in the main directory of
6 * this archive for more details.
7 *
8 * Returns: -EFAULT if exception before terminator, N if the entire
9 * buffer filled, else strlen.
10 *
11 * Copyright (C) 2002 Tensilica Inc.
12 */
13
249ac17e 14#include <linux/errno.h>
5cf97ebd 15#include <linux/linkage.h>
0013aceb 16#include <asm/asmmacro.h>
8f8d5745 17#include <asm/core.h>
249ac17e
CZ
18
19/*
20 * long __strncpy_user(char *dst, const char *src, size_t len)
21 *
   * Returns a count (or -EFAULT), not a pointer: see "Returns:" in the
   * file header.
   */
a0bb46ba
CZ
22
/*
 * Byte-lane masks used to test the individual bytes of a value held in
 * a register for NUL.  MASKn selects "byte n" as the copy code below
 * names it; the constants are mirrored between big-endian
 * (__XTENSA_EB__) and little-endian builds so that the same byte
 * number can be tested on either.
 */
#ifdef __XTENSA_EB__
# define MASK0 0xff000000
# define MASK1 0x00ff0000
# define MASK2 0x0000ff00
# define MASK3 0x000000ff
#else
# define MASK0 0x000000ff
# define MASK1 0x0000ff00
# define MASK2 0x00ff0000
# define MASK3 0xff000000
#endif
249ac17e
CZ
34
# Register use
#   a0/ return address
#   a1/ stack pointer
#   a2/ return value (holds the original dst until the final subtract)
#   a3/ src
#   a4/ len
#   a5/ mask0
#   a6/ mask1
#   a7/ mask2
#   a8/ mask3
#   a9/ tmp
#   a10/ tmp
#   a11/ dst

/*
 * __strncpy_user
 *
 * In:   a2 = dst, a3 = src, a4 = len
 * Out:  a2 = number of bytes stored before the NUL terminator, or len
 *            when len bytes were copied without meeting a NUL, or
 *            -EFAULT when a load (EX(11f)) or store (EX(10f)) is
 *            redirected to the fixup code.
 *
 * Every exit computes the result as (a11 - a2), where a11 is the
 * running dst pointer and a2 still holds the original dst.
 *
 * Strategy:
 *   1. Copy 1-3 leading bytes until src is word-aligned.
 *   2. If dst is then word-aligned too, copy a word at a time, testing
 *      each byte lane with MASK0..MASK3, followed by a halfword and a
 *      byte tail selected by bits 1 and 0 of the remaining len.
 *   3. Otherwise fall back to a plain byte loop.
 *
 * NOTE(review): EX(), abi_entry_default and abi_ret_default are macros
 * defined outside this file (presumably in asm/asmmacro.h); their exact
 * expansion is not visible here.
 */
.text
ENTRY(__strncpy_user)

	abi_entry_default
	# a2/ dst, a3/ src, a4/ len
	mov	a11, a2		# a11 = running dst; a2 keeps the original dst
	beqz	a4, .Lret	# if len is zero
	movi	a5, MASK0	# mask for byte 0
	movi	a6, MASK1	# mask for byte 1
	movi	a7, MASK2	# mask for byte 2
	movi	a8, MASK3	# mask for byte 3
	bbsi.l	a3, 0, .Lsrc1mod2 # if only  8-bit aligned
	bbsi.l	a3, 1, .Lsrc2mod4 # if only 16-bit aligned
.Lsrcaligned:	# return here when src is word-aligned
	srli	a10, a4, 2	# number of loop iterations with 4B per loop
	movi	a9, 3
	bnone	a11, a9, .Laligned # dst is word-aligned as well
	j	.Ldstunaligned

.Lsrc1mod2:	# src address is odd
EX(11f)	l8ui	a9, a3, 0	# get byte 0
	addi	a3, a3, 1	# advance src pointer
EX(10f)	s8i	a9, a11, 0	# store byte 0
	beqz	a9, .Lret	# if byte 0 is zero
	addi	a11, a11, 1	# advance dst pointer
	addi	a4, a4, -1	# decrement len
	beqz	a4, .Lret	# if len is zero
	bbci.l	a3, 1, .Lsrcaligned	# if src is now word-aligned

.Lsrc2mod4:	# src address is 2 mod 4
EX(11f)	l8ui	a9, a3, 0	# get byte 0
	/* 1-cycle interlock */
EX(10f)	s8i	a9, a11, 0	# store byte 0
	beqz	a9, .Lret	# if byte 0 is zero
	addi	a11, a11, 1	# advance dst pointer
	addi	a4, a4, -1	# decrement len
	beqz	a4, .Lret	# if len is zero
EX(11f)	l8ui	a9, a3, 1	# get byte 1
	addi	a3, a3, 2	# advance src pointer past both bytes
EX(10f)	s8i	a9, a11, 0	# store byte 1
	beqz	a9, .Lret	# if byte 1 is zero
	addi	a11, a11, 1	# advance dst pointer
	addi	a4, a4, -1	# decrement len
	bnez	a4, .Lsrcaligned	# if len is nonzero
.Lret:
	sub	a2, a11, a2	# compute strlen
	abi_ret_default

/*
 * dst is word-aligned, src is word-aligned
 */
	.align	4		# 1 mod 4 alignment for LOOPNEZ
	.byte	0		# (0 mod 4 alignment for LBEG)
.Laligned:
#if XCHAL_HAVE_LOOPS
	loopnez	a10, .Loop1done
#else
	beqz	a10, .Loop1done
	slli	a10, a10, 2
	add	a10, a10, a11	# a10 = end of last 4B chunk
#endif
.Loop1:
EX(11f)	l32i	a9, a3, 0	# get word from src
	addi	a3, a3, 4	# advance src pointer
	bnone	a9, a5, .Lz0	# if byte 0 is zero
	bnone	a9, a6, .Lz1	# if byte 1 is zero
	bnone	a9, a7, .Lz2	# if byte 2 is zero
EX(10f)	s32i	a9, a11, 0	# store word to dst
	bnone	a9, a8, .Lz3	# if byte 3 is zero
	addi	a11, a11, 4	# advance dst pointer
#if !XCHAL_HAVE_LOOPS
	blt	a11, a10, .Loop1
#endif

.Loop1done:
	bbci.l	a4, 1, .L100	# bit 1 of len clear: no halfword tail
	/* copy 2 bytes */
EX(11f)	l16ui	a9, a3, 0	# a9 = halfword, zero-extended to 32 bits
	addi	a3, a3, 2	# advance src pointer
#ifdef __XTENSA_EB__
	/*
	 * The halfword sits in bits 15..0 of a9, so its first byte is
	 * selected by MASK2 and its second byte by MASK3.  The second
	 * case must enter at .Lz1h: the extui at .Lz1 is only correct
	 * for a full word and would discard the first byte here.
	 */
	bnone	a9, a7, .Lz0	# if first byte of the halfword is zero
	bnone	a9, a8, .Lz1h	# if second byte of the halfword is zero
#else
	bnone	a9, a5, .Lz0	# if byte 0 is zero
	bnone	a9, a6, .Lz1	# if byte 1 is zero
#endif
EX(10f)	s16i	a9, a11, 0
	addi	a11, a11, 2	# advance dst pointer
.L100:
	bbci.l	a4, 0, .Lret	# bit 0 of len clear: no byte tail
EX(11f)	l8ui	a9, a3, 0
	/* slot */
EX(10f)	s8i	a9, a11, 0
	beqz	a9, .Lret	# if byte is zero
	addi	a11, a11, 1-3	# advance dst ptr 1, but also cancel
				# the effect of adding 3 in .Lz3 code
	/* fall thru to .Lz3 and return */

.Lz3:	# byte 3 is zero (the whole word has already been stored)
	addi	a11, a11, 3	# advance dst pointer
	sub	a2, a11, a2	# compute strlen
	abi_ret_default
.Lz0:	# byte 0 is zero
#ifdef __XTENSA_EB__
	movi	a9, 0		# low byte of a9 is not byte 0 on big-endian
#endif /* __XTENSA_EB__ */
EX(10f)	s8i	a9, a11, 0	# store the terminator only
	sub	a2, a11, a2	# compute strlen
	abi_ret_default
.Lz1:	# byte 1 is zero (a9 holds a full word)
#ifdef __XTENSA_EB__
	extui	a9, a9, 16, 16	# move bytes 0 and 1 into the low halfword
.Lz1h:	/* halfword-tail entry: bytes are already in the low halfword */
#endif /* __XTENSA_EB__ */
EX(10f)	s16i	a9, a11, 0	# store byte 0 and the terminator
	addi	a11, a11, 1	# advance dst pointer
	sub	a2, a11, a2	# compute strlen
	abi_ret_default
.Lz2:	# byte 2 is zero
#ifdef __XTENSA_EB__
	extui	a9, a9, 16, 16	# move bytes 0 and 1 into the low halfword
#endif /* __XTENSA_EB__ */
EX(10f)	s16i	a9, a11, 0	# store bytes 0 and 1
	movi	a9, 0
EX(10f)	s8i	a9, a11, 2	# store the terminator
	addi	a11, a11, 2	# advance dst pointer
	sub	a2, a11, a2	# compute strlen
	abi_ret_default

	.align	4		# 1 mod 4 alignment for LOOPNEZ
	.byte	0		# (0 mod 4 alignment for LBEG)
.Ldstunaligned:
/*
 * for now just use byte copy loop
 */
#if XCHAL_HAVE_LOOPS
	loopnez	a4, .Lunalignedend
#else
	beqz	a4, .Lunalignedend
	add	a10, a11, a4	# a10 = ending address
#endif /* XCHAL_HAVE_LOOPS */
.Lnextbyte:
EX(11f)	l8ui	a9, a3, 0
	addi	a3, a3, 1	# advance src pointer
EX(10f)	s8i	a9, a11, 0
	beqz	a9, .Lunalignedend # terminator stored, dst not advanced
	addi	a11, a11, 1	# advance dst pointer
#if !XCHAL_HAVE_LOOPS
	blt	a11, a10, .Lnextbyte
#endif

.Lunalignedend:
	sub	a2, a11, a2	# compute strlen
	abi_ret_default

ENDPROC(__strncpy_user)
249ac17e
CZ
204
/*
 * Fault handler for __strncpy_user.  The copy code tags every store
 * with EX(10f) and every load with EX(11f); both labels currently land
 * on the same code, which returns -EFAULT in a2.
 */
	.section .fixup, "ax"
	.align	4

	/* For now, just return -EFAULT.  Future implementations might
	 * like to clear remaining kernel space, like the fixup
	 * implementation in memset().  Thus, we differentiate between
	 * load/store fixups. */

10:	/* store fault */
11:	/* load fault */
	movi	a2, -EFAULT
	abi_ret_default