1 /* $NetBSD: strspn.c,v 1.16 2008/07/30 16:13:59 joerg Exp $ */
4 * Copyright (c) 2008 Joerg Sonnenberger
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
17 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19 * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
20 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
21 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
22 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
23 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
25 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#include <sys/cdefs.h>
__RCSID("$NetBSD: strspn.c,v 1.16 2008/07/30 16:13:59 joerg Exp $");

#include <assert.h>
#include <inttypes.h>
#include <limits.h>
#include <string.h>
36 #if ULONG_MAX != 0xffffffffffffffffull
#ifndef _DIAGASSERT
/* Fallback for systems whose <assert.h> does not provide _DIAGASSERT. */
#define _DIAGASSERT(e)	((void)0)
#endif

/*
 * strspn --
 *	Return the length of the initial segment of `s' that consists
 *	entirely of bytes that also occur in `charset'.
 *
 *	An empty `charset' yields 0.  A one-byte `charset' is handled by a
 *	direct comparison loop.  Otherwise a 256-bit membership bitmap
 *	(32 bytes, one bit per possible byte value) is built from `charset'
 *	and `s' is scanned against it.
 *
 *	Both arguments must be non-NULL, NUL-terminated strings.
 */
size_t
strspn(const char *s, const char *charset)
{
	/* idx[n] is the mask selecting bit n within one bitmap byte. */
	static const size_t idx[8] = { 1, 2, 4, 8, 16, 32, 64, 128 };
	uint8_t set[32];
	const char *t;
	/* Go through unsigned char so bytes >= 0x80 never index negatively. */
#define UC(a) ((unsigned int)(unsigned char)(a))

	_DIAGASSERT(s != NULL);
	_DIAGASSERT(charset != NULL);

	/* Nothing can match an empty set. */
	if (charset[0] == '\0')
		return 0;

	/* Single accepted byte: no bitmap needed. */
	if (charset[1] == '\0') {
		for (t = s; *t != '\0'; ++t) {
			if (*t != *charset)
				break;
		}
		return (size_t)(t - s);
	}

	(void)memset(set, 0, sizeof(set));

	/* Byte value v lives in bit (v & 7) of set[v >> 3]. */
	for (; *charset != '\0'; ++charset)
		set[UC(*charset) >> 3] |= idx[UC(*charset) & 7];

	/* Stop at the first byte of s whose bit is clear (or at the NUL). */
	for (t = s; *t != '\0'; ++t)
		if ((set[UC(*t) >> 3] & idx[UC(*t) & 7]) == 0)
			break;
	return (size_t)(t - s);
}
/* 64-bit system: use four 64-bit registers for the bitmask */
#ifndef __predict_true
/* Fallback for systems whose <sys/cdefs.h> lacks the branch hint. */
#define __predict_true(exp)	(exp)
#endif

/*
 * strspn_x --
 *	Common worker for strspn() and strcspn().
 *
 *	Counts the leading bytes of `s_s' whose bit is set in a 256-bit
 *	membership set built from `charset_s'.  The set is XORed with
 *	`invert' before scanning: pass 0 to count bytes that ARE in the
 *	charset, or ~0ul to count bytes that are NOT in it.
 *
 *	The set is held in four unsigned long words indexed by (ch & 0x3f),
 *	so this code is only valid where unsigned long is 64 bits wide.
 */
static size_t
strspn_x(const char *s_s, const char *charset_s, unsigned long invert)
{
	const unsigned char *s = (const unsigned char *)s_s;
	const unsigned char *charset = (const unsigned char *)charset_s;
	unsigned long m_0, m_4, m_8, m_c;
	unsigned char ch, next_ch;
	unsigned long bit;
	unsigned long check;
	size_t count;

	/*
	 * Four 64-bit registers have one bit for each character value:
	 * m_0 covers 0x00-0x3f, m_4 0x40-0x7f, m_8 0x80-0xbf, m_c 0xc0-0xff.
	 */
	m_0 = 0;
	m_4 = 0;
	m_8 = 0;
	m_c = 0;

	for (ch = *charset; ch != 0; ch = next_ch) {
		/* Load the next byte early; ch != 0, so it is in bounds. */
		next_ch = *++charset;
		bit = 1ul << (ch & 0x3f);
		if (__predict_true(ch < 0x80)) {
			if (ch < 0x40)
				m_0 |= bit;
			else
				m_4 |= bit;
		} else {
			if (ch < 0xc0)
				m_8 |= bit;
			else
				m_c |= bit;
		}
	}

	/* For strcspn() we just invert the validity set */
	m_0 ^= invert;
	m_4 ^= invert;
	m_8 ^= invert;
	m_c ^= invert;

	/*
	 * We could remove the lsb from m_0 to terminate at the
	 * end of the input string.
	 * However, prefetching the next char is beneficial and we must
	 * not read the byte after the \0 - as it might fault!
	 * So we take the 'hit' of the compare against 0.
	 */

	ch = *s++;
	for (count = 0; ch != 0; ch = next_ch) {
		/* s is one ahead, so s[count] is the byte following ch. */
		next_ch = s[count];
		if (__predict_true(ch < 0x80)) {
			check = m_0;
			if (ch >= 0x40)
				check = m_4;
		} else {
			check = m_8;
			if (ch >= 0xc0)
				check = m_c;
		}
		if (!((check >> (ch & 0x3f)) & 1))
			break;
		count++;
	}
	return count;
}
/*
 * strspn --
 *	Return the length of the initial segment of `s' made up only of
 *	bytes found in `charset'.  Delegates to strspn_x() with an
 *	un-inverted set (invert == 0).
 */
size_t
strspn(const char *s, const char *charset)
{
	return strspn_x(s, charset, 0);
}
/*
 * strcspn --
 *	Return the length of the initial segment of `s' made up only of
 *	bytes NOT found in `charset'.  Delegates to strspn_x() with the
 *	membership set inverted (invert == ~0ul).
 */
size_t
strcspn(const char *s, const char *charset)
{
	return strspn_x(s, charset, ~0ul);
}