summaryrefslogtreecommitdiff
path: root/libc/string/xtensa/strlen.S
blob: 23c68f2d5d20776619be8d1401cf256e017b51d4 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
/* Optimized strlen for Xtensa.
   Copyright (C) 2001, 2007 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, write to the Free
   Software Foundation, Inc., 51 Franklin Street - Fifth Floor,
   Boston, MA 02110-1301, USA.  */

#include <sysdep.h>
#include <bits/xtensa-config.h>

/* Byte-select masks for a 32-bit word loaded from memory.  MASKn covers
   the byte at offset n from the word address (byte 0 is the lowest
   address), so the bit positions are mirrored between the big-endian
   (__XTENSA_EB__) and little-endian layouts.  The code below tests a
   loaded word against these masks to find which byte, if any, is zero.  */
#ifdef __XTENSA_EB__
#define	MASK0 0xff000000
#define	MASK1 0x00ff0000
#define	MASK2 0x0000ff00
#define	MASK3 0x000000ff
#else
#define	MASK0 0x000000ff
#define	MASK1 0x0000ff00
#define	MASK2 0x00ff0000
#define	MASK3 0xff000000
#endif

	.text
/* strlen: count the bytes of a zero-terminated string.

   In:   a2 = s, pointer to the first byte of the string.
   Out:  a2 = number of bytes before the first zero byte.

   Register roles inside the function:
     a3     = running pointer, kept 4 bytes BEHIND the next unread data
              so that the aligned loop can load from offset 4 and every
              .Lz<n> exit only has to add n before subtracting s.
     a4..a7 = MASK0..MASK3, selecting bytes 0..3 of a loaded word.
     a8     = most recently loaded byte or word (also the loop count).

   Strategy: consume zero to three leading bytes until the pointer is
   word-aligned, then scan one aligned 32-bit word per iteration and
   test its four bytes in memory order.

   Note that only aligned words are ever loaded, so the .L2mod4 path
   reads up to two bytes that precede the string and the main loop reads
   the bytes that follow the terminator within the same aligned word.

   NOTE(review): the function returns with retw, which presumes the
   windowed register calling convention; confirm that ENTRY in sysdep.h
   emits the matching prologue.  */
ENTRY (strlen)
	/* a2 = s */

	addi	a3, a2, -4	/* because we overincrement at the end */
	movi	a4, MASK0
	movi	a5, MASK1
	movi	a6, MASK2
	movi	a7, MASK3
	/* Dispatch on the low two address bits of s.  */
	bbsi.l	a2, 0, .L1mod2
	bbsi.l	a2, 1, .L2mod4
	j	.Laligned

.L1mod2: /* address is odd */
	l8ui	a8, a3, 4	/* get byte 0 */
	addi	a3, a3, 1	/* advance string pointer */
	/* a3 is now s - 3, so the "+ 3" done at .Lz3 yields exactly s and
	   the returned length is 0.  */
	beqz	a8, .Lz3	/* if byte 0 is zero */
	/* s was 3 mod 4 if bit 1 of a3 is clear: the next byte is aligned.
	   Otherwise s was 1 mod 4 and two more bytes must be checked.  */
	bbci.l	a3, 1, .Laligned /* if string pointer is now word-aligned */

.L2mod4: /* address is 2 mod 4 */
	/* After the add, a3 is the address of the aligned word whose bytes
	   2 and 3 are the next two unread string bytes; bytes 0 and 1 of
	   that word are either before the string or already checked.  */
	addi	a3, a3, 2	/* advance ptr for aligned access */
	l32i	a8, a3, 0	/* get word with first two bytes of string */
	bnone	a8, a6, .Lz2	/* if byte 2 (of word, not string) is zero */
	bany	a8, a7, .Laligned /* if byte 3 (of word, not string) is nonzero */

	/* Byte 3 is zero.  */
	addi	a3, a3, 3	/* point to zero byte */
	sub	a2, a3, a2	/* subtract to get length */
	retw


/* String is word-aligned.  */

	.align	4
	/* (2 mod 4) alignment for loop instruction */
	/* NOTE(review): the 2 mod 4 placement appears to rely on _movi.n
	   being a 2-byte encoding that directly follows the 4-byte aligned
	   label.  _movi.n looks like a narrow (code density) form; confirm
	   that every supported core configuration provides it.  */
.Laligned:
#if XCHAL_HAVE_LOOPS
	_movi.n	a8, 0		/* set up for the maximum loop count */
	/* The loop body ends at .Lz3.  The only ways out are the explicit
	   branches to .Lz0 .. .Lz3 taken when a zero byte is found.  */
	loop	a8, .Lz3	/* loop forever (almost anyway) */
#endif
1:	l32i	a8, a3, 4	/* get next word of string */
	addi	a3, a3, 4	/* advance string pointer */
	/* a3 now addresses the word just loaded; test its bytes in memory
	   order so that the first zero byte wins.  */
	bnone	a8, a4, .Lz0	/* if byte 0 is zero */
	bnone	a8, a5, .Lz1	/* if byte 1 is zero */
	bnone	a8, a6, .Lz2	/* if byte 2 is zero */
#if XCHAL_HAVE_LOOPS
	/* With the hardware loop, a non-taken branch here reaches the loop
	   end and the next iteration starts at 1: again (presumably via
	   the zero-overhead loop-back; see the ISA manual).  */
	bnone	a8, a7, .Lz3	/* if byte 3 is zero */
#else
	/* Without the loop option the back edge is an ordinary branch and
	   falling through means byte 3 is the terminator.  */
	bany	a8, a7, 1b	/* repeat if byte 3 is non-zero */
#endif

	/* Common exits: a3 addresses the word holding the terminator (or,
	   for the odd-address early exit, s - 3).  Each exit adds the byte
	   index and subtracts s to produce the length in a2.  */
.Lz3:	/* Byte 3 is zero.  */
	addi	a3, a3, 3	/* point to zero byte */
	/* Fall through....  */

.Lz0:	/* Byte 0 is zero.  */
	sub	a2, a3, a2	/* subtract to get length */
	retw

.Lz1:	/* Byte 1 is zero.  */
	addi	a3, a3, 1	/* point to zero byte */
	sub	a2, a3, a2	/* subtract to get length */
	retw

.Lz2:	/* Byte 2 is zero.  */
	addi	a3, a3, 2	/* point to zero byte */
	sub	a2, a3, a2	/* subtract to get length */
	retw

libc_hidden_def (strlen)