blob: 54f74de6d7f420e19ace3cc0cfd906e650367880 [file] [log] [blame]
The Android Open Source Project1dc9e472009-03-03 19:28:35 -08001/*
2 * Copyright (C) 2008 The Android Open Source Project
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * * Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in
12 * the documentation and/or other materials provided with the
13 * distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
18 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
19 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
21 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
22 * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
23 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
25 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 * SUCH DAMAGE.
27 */
The Android Open Source Project1dc9e472009-03-03 19:28:35 -080028
Henrik Smiding884e4f82010-11-05 15:07:53 +010029#include <machine/cpu-features.h>
Kenny Root420878c2011-02-16 11:55:58 -080030#include <machine/asm.h>
Henrik Smiding884e4f82010-11-05 15:07:53 +010031
        /*
         * Optimized memset() for ARM; bzero() is implemented on top of it.
         *
         * memset() returns its first argument.
         */
Henrik Smiding884e4f82010-11-05 15:07:53 +010037
38#if defined(__ARM_NEON__)
39 .fpu neon
40#endif
41
/*
 * bzero
 *
 * Moves the value found in r1 into r2 and loads r1 with zero, i.e. it
 * rearranges its arguments into the register layout consumed by the
 * memset code that follows (r1 = fill value, r2 = byte count).
 *
 * There is no return instruction here: execution runs off the end of
 * this routine into memset.
 * NOTE(review): this relies on ENTRY(memset) not emitting padding or
 * switching section between the two routines - confirm in machine/asm.h.
 */
ENTRY(bzero)
        mov         r2, r1                  /* byte count -> r2 */
        mov         r1, #0                  /* fill value = 0 */
        /* fall through into memset */
END(bzero)
The Android Open Source Project1dc9e472009-03-03 19:28:35 -080046
/*
 * memset
 *
 * In:   r0 = destination pointer
 *       r1 = fill value (only the low byte is used)
 *       r2 = number of bytes to fill (treated as unsigned)
 * Out:  r0 = the original destination pointer (saved on entry and
 *            reloaded just before returning)
 * Uses: r3, ip (r12) and the flags. The NEON path additionally uses
 *       q0/q1; the integer path additionally uses r4-r7 and lr, which it
 *       saves on entry and restores on exit.
 *
 * Flag idiom used throughout: "movs ip, rN, lsl #k" copies two bits of a
 * small count into N and C so that the following conditional stores can
 * emit 1/2/4/8/16 bytes without branches. MOVS with a shift does not
 * update V, so only conditions that ignore V (mi/pl/cs/cc) may be used on
 * the result.
 */
ENTRY(memset)
#if defined(__ARM_NEON__)

#ifdef NEON_MEMSET_DIVIDER
        /* fills larger than the divider use the integer-register path */
        cmp         r2, #NEON_MEMSET_DIVIDER
        bhi         .Lmemset_generic
#endif
        .save       {r0}
        stmfd       sp!, {r0}               /* keep dst for the return value */

        vdup.8      q0, r1                  /* q0 = fill byte in all 16 lanes */

#ifndef NEON_UNALIGNED_ACCESS
        /* do we have at least 16-bytes to write (needed for alignment below) */
        cmp         r2, #16
        blo         .Lmemset_neon_tail

        /* align destination to 16 bytes for the write-buffer */
        rsb         r3, r0, #0
        ands        r3, r3, #0xF            /* r3 = bytes needed to reach alignment */
        beq         .Lmemset_neon_aligned

        /* write up to 15-bytes (count in r3) */
        sub         r2, r2, r3
        movs        ip, r3, lsl #31         /* N = bit 0, C = bit 1 of r3 */
        strmib      r1, [r0], #1
        strcsb      r1, [r0], #1
        strcsb      r1, [r0], #1
        movs        ip, r3, lsl #29         /* N = bit 2, C = bit 3 of r3 */
        /*
         * bpl, not bge: V still holds the result of "cmp r2, #16" above and
         * must not take part in the decision.
         */
        bpl         .Lmemset_neon_align8

        // writes 4 bytes, 32-bits aligned
        vst1.32     {d0[0]}, [r0, :32]!
.Lmemset_neon_align8:
        bcc         .Lmemset_neon_aligned

        // writes 8 bytes, 64-bits aligned
        vst1.8      {d0}, [r0, :64]!
.Lmemset_neon_aligned:
#endif
        /* make sure we have at least 32 bytes to write */
        subs        r2, r2, #32
        blo         .Lmemset_neon_lt32
        vmov        q1, q0                  /* q0:q1 = 32 bytes of fill */

.Lmemset_neon_loop:
        /* The main loop writes 32 bytes at a time */
        subs        r2, r2, #32
#ifndef NEON_UNALIGNED_ACCESS
        vst1.8      {d0 - d3}, [r0, :128]!
#else
        vst1.8      {d0 - d3}, [r0]!
#endif
        bhs         .Lmemset_neon_loop

.Lmemset_neon_lt32:
        /* less than 32 left */
        add         r2, r2, #32             /* undo the bias: r2 = bytes remaining */
        tst         r2, #0x10
        beq         .Lmemset_neon_tail

        // writes 16 bytes, 128-bits aligned
#ifndef NEON_UNALIGNED_ACCESS
        vst1.8      {d0, d1}, [r0, :128]!
#else
        vst1.8      {d0, d1}, [r0]!
#endif
.Lmemset_neon_tail:
        /* write up to 15-bytes (count in r2) */
        movs        ip, r2, lsl #29         /* C = bit 3, N = bit 2 of r2 */
        bcc         .Lmemset_neon_tail4
        vst1.8      {d0}, [r0]!
.Lmemset_neon_tail4:
        bpl         .Lmemset_neon_tail3     /* V-independent, see header */
        vst1.32     {d0[0]}, [r0]!
.Lmemset_neon_tail3:
        movs        ip, r2, lsl #31         /* N = bit 0, C = bit 1 of r2 */
        strmib      r1, [r0], #1
        strcsb      r1, [r0], #1
        strcsb      r1, [r0], #1
        ldmfd       sp!, {r0}               /* return the original dst */
        bx          lr
.Lmemset_generic:
#endif

        /*
         * Integer-register implementation.
         *
         * compute the offset to align the destination to a word
         * offset = (4-(dst&3))&3 = -dst & 3
         */

        .save       {r0, r4-r7, lr}
        stmfd       sp!, {r0, r4-r7, lr}
        rsb         r3, r0, #0
        ands        r3, r3, #3
        cmp         r3, r2
        movhi       r3, r2                  /* never write more than r2 bytes */

        /* splat r1: replicate the low byte into all four bytes */
        mov         r1, r1, lsl #24
        orr         r1, r1, r1, lsr #8
        orr         r1, r1, r1, lsr #16

        movs        r12, r3, lsl #31        /* N = bit 0, C = bit 1 of r3 */
        strcsb      r1, [r0], #1            /* can't use strh (alignment unknown) */
        strcsb      r1, [r0], #1
        strmib      r1, [r0], #1
        subs        r2, r2, r3
        ldmlsfd     sp!, {r0, r4-r7, lr}    /* nothing left: return */
        bxls        lr

        /* align the destination to a cache-line */
        mov         r12, r1
        mov         lr, r1
        mov         r4, r1
        mov         r5, r1
        mov         r6, r1
        mov         r7, r1

        rsb         r3, r0, #0
        ands        r3, r3, #0x1C           /* r3 = bytes (whole words) to a 32-byte boundary */
        beq         .Lmemset_line_aligned
        cmp         r3, r2
        andhi       r3, r2, #0x1C           /* clamp to the whole words available */
        sub         r2, r2, r3

        /* conditionally writes 0 to 7 words (length in r3) */
        movs        r3, r3, lsl #28         /* C = bit 4, N = bit 3 of r3 */
        stmcsia     r0!, {r1, lr}
        stmcsia     r0!, {r1, lr}
        stmmiia     r0!, {r1, lr}
        movs        r3, r3, lsl #2          /* C = original bit 2 of r3 */
        strcs       r1, [r0], #4

.Lmemset_line_aligned:
        subs        r2, r2, #32
        mov         r3, r1                  /* plain mov: flags from subs survive */
        /*
         * blo, not bmi: r2 is an unsigned byte count, so test the borrow
         * (same convention as the bhs that closes the loop).
         */
        blo         .Lmemset_tail
.Lmemset_loop32:
        subs        r2, r2, #32
        stmia       r0!, {r1,r3,r4,r5,r6,r7,r12,lr}
        bhs         .Lmemset_loop32
.Lmemset_tail:
        add         r2, r2, #32             /* undo the bias: r2 = bytes remaining */

        /* conditionally stores 0 to 31 bytes */
        movs        r2, r2, lsl #28         /* C = bit 4, N = bit 3 of r2 */
        stmcsia     r0!, {r1,r3,r12,lr}
        stmmiia     r0!, {r1, lr}
        movs        r2, r2, lsl #2          /* C = original bit 2, N = original bit 1 */
        strcs       r1, [r0], #4
        strmih      r1, [r0], #2
        movs        r2, r2, lsl #2          /* C = original bit 0 */
        strcsb      r1, [r0]
        ldmfd       sp!, {r0, r4-r7, lr}    /* return the original dst */
        bx          lr
END(memset)