-
Notifications
You must be signed in to change notification settings - Fork 14
/
Copy pathstring.cc
294 lines (253 loc) · 6.28 KB
/
string.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
#include "string.h"
#include "utf.h"
#include "likely.h"
#include "malloc.h"
#include "assert.h"
#if defined(__x86_64__) || defined(__i386__)
#define USE_REP_STRING
#endif
// Returns the number of characters that precede the terminating
// null character of src.
size_t strlen(char const *src)
{
    char const *end = src;
    // Walk forward until the terminator is reached
    while (*end)
        ++end;
    return (size_t)(end - src);
}
// Finds the first occurrence of ch (converted to char) in s.
// The terminating null character is considered to be a part
// of the string and can be found when searching for '\0'.
// Returns a pointer to the match, or nullptr when ch does not occur.
char *strchr(char const *s, int ch)
{
    char const wanted = (char)ch;
    while (*s != wanted) {
        // Hit the terminator without a match (and it was not the target)
        if (*s == 0)
            return nullptr;
        ++s;
    }
    return (char*)s;
}
// Compares two null-terminated strings lexicographically.
// Characters are compared as unsigned char, so bytes >= 0x80
// order after ASCII regardless of whether plain char is signed.
// Returns a negative value if lhs sorts before rhs, zero if they
// are equal, and a positive value if lhs sorts after rhs.
int strcmp(char const *lhs, char const *rhs)
{
    int cmp = 0;
    do {
        // Go through unsigned char: a plain (unsigned) cast would
        // sign-extend a negative char and invert the ordering
        cmp = (int)(unsigned char)*lhs -
                (int)(unsigned char)*rhs++;
        // Stop at the first difference or once the terminator was compared
    } while (cmp == 0 && *lhs++);
    return cmp;
}
// Compares at most count characters of two null-terminated strings.
// Characters are compared as unsigned char, so bytes >= 0x80
// order after ASCII regardless of whether plain char is signed.
// Returns a negative value, zero, or a positive value when the
// compared prefix of lhs sorts before, equal to, or after rhs.
// A count of zero always yields zero.
int strncmp(char const *lhs, char const *rhs, size_t count)
{
    int cmp = 0;
    if (count) {
        do {
            // Go through unsigned char: a plain (unsigned) cast would
            // sign-extend a negative char and invert the ordering
            cmp = (int)(unsigned char)*lhs -
                    (int)(unsigned char)*rhs++;
            // Stop when the budget is spent, on the first difference,
            // or once the terminator has been compared
        } while (--count && cmp == 0 && *lhs++);
    }
    return cmp;
}
// Copies the string src, including its terminating null
// character, into dest. Returns dest.
char *strcpy(char *dest, char const *src)
{
    for (size_t i = 0; ; ++i) {
        char const c = src[i];
        dest[i] = c;
        // The terminator is copied too, then we are done
        if (c == 0)
            break;
    }
    return dest;
}
// Writes exactly n bytes to dest: the characters of src up to
// (not including) its terminator, then zero padding.
// If src holds n or more characters, dest is NOT null-terminated.
// Returns dest.
char *strncpy(char *dest, char const *src, size_t n)
{
    char *out = dest;
    char *const limit = dest + n;

    // Copy characters until src ends or the budget is spent
    while (out != limit && *src)
        *out++ = *src++;

    // Pad whatever is left of the n bytes with zeros
    while (out != limit)
        *out++ = 0;

    return dest;
}
// Appends the string src (terminator included) to the end of
// the string already held in dest. Returns dest.
char *strcat(char *dest, char const *src)
{
    // The existing terminator of dest is where the copy begins
    char *tail = dest + strlen(dest);
    strcpy(tail, src);
    return dest;
}
// Appends at most n characters of src to the string in dest and
// always writes a terminating null character after them.
// Returns dest.
//
// The behavior is undefined if the destination array
// does not have enough space for the contents of both
// dest and the first count characters of src, plus the
// terminating null character. The behavior is undefined
// if the source and destination objects overlap. The
// behavior is undefined if either dest is not a pointer
// to a null-terminated byte string or src is not a
// pointer to a character array.
char *strncat(char * restrict dest, char const * restrict src, size_t n)
{
    char *out = dest;

    // Find the terminator of the existing string
    while (*out)
        ++out;

    // Append up to n characters, stopping early at the end of src
    for ( ; n && *src; --n)
        *out++ = *src++;

    // Unlike strncpy, the result is always terminated and never padded
    *out = 0;

    return dest;
}
// Scans the first count bytes of mem for ch (converted to char).
// Returns a pointer to the first matching byte, or nullptr if
// none of the count bytes match.
void *memchr(void const *mem, int ch, size_t count)
{
    char const *bytes = (char const *)mem;
    char const wanted = (char)ch;

    for (size_t i = 0; i != count; ++i) {
        if (bytes[i] == wanted)
            return (void *)(bytes + i);
    }

    return nullptr;
}
// Compares the first count bytes of lhs and rhs as unsigned char.
// Returns the difference of the first pair of bytes that differ
// (lhs byte minus rhs byte), or zero if all count bytes are equal.
int memcmp(void const *lhs, void const *rhs, size_t count)
{
    unsigned char const *a = (unsigned char const *)lhs;
    unsigned char const *b = (unsigned char const *)rhs;

    for (size_t i = 0; i < count; ++i) {
        int const diff = a[i] - b[i];
        if (diff != 0)
            return diff;
    }

    return 0;
}
// Finds the first occurrence of the string substr within str.
// Returns a pointer to the start of the match, str itself when
// substr is empty, or nullptr when there is no match.
char *strstr(char const *str, char const *substr)
{
    // An empty needle matches at the very beginning
    if (*substr == 0)
        return (char*)str;

    size_t const hay_len = strlen(str);
    size_t const needle_len = strlen(substr);

    // A needle longer than the haystack can never match
    if (needle_len > hay_len)
        return nullptr;

    // Last position at which the needle still fits inside str
    char const *const last = str + (hay_len - needle_len);

    // Try every candidate start position in order
    for (char const *pos = str; pos <= last; ++pos) {
        if (memcmp(pos, substr, needle_len) == 0)
            return (char*)pos;
    }

    return nullptr;
}
// Copies n bytes from src to dest starting at the highest address
// and working downward, so it is safe when the regions overlap
// with dest above src. Returns dest.
//
// When USE_REP_STRING is defined the copy is done with x86
// "rep movs" with the direction flag set; the direction flag is
// cleared again before returning. Otherwise a portable backward
// byte loop is used.
void *memcpy_rev(void *dest, void const *src, size_t n)
{
    // Nothing to copy; also avoids forming pointers before the buffers
    if (n == 0)
        return dest;

#ifdef USE_REP_STRING
    if ((n & 3) == 0) {
        // Whole number of dwords: with DF set, movsl transfers the
        // dword AT the pointer and then steps down by 4, so begin
        // at the last complete dword
        src = (char const*)src + n - 4;
        char *d = (char*)dest + n - 4;
        n >>= 2;
        __asm__ __volatile__ (
            "std\n\t"
            "rep movsl\n\t"
            "cld\n\t"
            : "+S" (src)
            , "+D" (d)
            , "+c" (n)
            :
            : "memory"
        );
    } else {
        // Byte granularity: begin at the last byte
        src = (char const*)src + n - 1;
        char *d = (char*)dest + n - 1;
        __asm__ __volatile__ (
            "std\n\t"
            "rep movsb\n\t"
            "cld\n\t"
            : "+S" (src)
            , "+D" (d)
            , "+c" (n)
            :
            : "memory"
        );
    }
#else
    // Portable path: walk both buffers from the end toward the start
    char *d = (char*)dest + n;
    char const *s = (char const *)src + n;
    while (n--)
        *--d = *--s;
#endif
    return dest;
}
// Copies n bytes from src to dest, giving the correct result even
// when the two regions overlap. Returns dest.
void *memmove(void *dest, void const *src, size_t n)
{
    char *to = (char*)dest;
    char const *from = (char const *)src;

    // Nothing to move
    if (!likely(n))
        return dest;

    // A forward copy is safe when dest lies below src, or when the
    // regions do not overlap at all
    if (to < from || from + n <= to)
        return memcpy(to, from, n);

    // Same address: the bytes are already in place
    if (to == from)
        return dest;

    // dest overlaps the tail of src: copy from the last byte downward
    size_t i = n;
    while (i) {
        --i;
        to[i] = from[i];
    }

    return dest;
}
// Fills the first n bytes of dest with the low 8 bits of c.
// Returns dest.
//
// When USE_REP_STRING is defined the fill uses x86 "rep stosl" for
// the whole dwords followed by "rep stosb" for the 0-3 leftover
// bytes; otherwise a portable byte loop is used.
void *memset(void *dest, int c, size_t n)
{
#ifdef USE_REP_STRING
    char *d = (char*)dest;
    size_t remainder = n & 3;
    n >>= 2;
    __asm__ __volatile__ (
        "cld\n\t"
        "rep stosl\n\t"
        "mov %[remainder],%[count]\n\t"
        "rep stosb\n\t"
        : "+D" (d)
        , [count] "+c" (n)
        // Replicate the byte into all four lanes of the dword. The
        // multiply is done in unsigned arithmetic: as a signed int it
        // overflows (undefined behavior) for byte values >= 0x80
        : "a" ((unsigned)(c & 0xFF) * 0x01010101U)
        , [remainder] "d" (remainder)
        : "memory"
    );
#else
    char *p = (char*)dest;
    while (n--)
        *p++ = (char)c;
#endif
    return dest;
}
#ifdef USE_REP_STRING
// Copies n bytes from src to dest in ascending address order using
// x86 string instructions: "rep movsl" moves the whole dwords and
// "rep movsb" moves the 0-3 bytes left over. Returns dest.
void *memcpy(void *dest, void const *src, size_t n)
{
    // The asm advances dest, so remember the value to hand back
    void *const original_dest = dest;
    size_t tail = n & 3;
    n >>= 2;
    __asm__ __volatile__ (
        "cld\n\t"
        "rep movsl\n\t"
        "mov %[tail],%[dwords]\n\t"
        "rep movsb\n\t"
        : "+D" (dest), "+S" (src), [dwords] "+c" (n)
        : [tail] "d" (tail)
        : "memory"
    );
    return original_dest;
}
#else
// Copies n bytes from src to dest one byte at a time in ascending
// address order. Returns dest.
void *memcpy(void *dest, void const *src, size_t n)
{
    char *to = (char*)dest;
    char const *from = (char const *)src;
    for (size_t i = 0; i != n; ++i)
        to[i] = from[i];
    return dest;
}
#endif
// Overload for char input: returns the argument unchanged.
// No copy or allocation is made, so the result aliases block.
char *utf8_from_tchar(char *block)
{
    char *const same_buffer = block;
    return same_buffer;
}
// Overload for char16_t input: builds a newly malloc'd, null-terminated
// char string from the zero-terminated sequence at block. Judging by
// the helper names this is a UTF-16 to UTF-8 conversion.
// Returns nullptr when block is null or the allocation fails.
// The result comes from malloc(); presumably the caller releases it
// (TODO confirm ownership against callers).
char *utf8_from_tchar(char16_t *block)
{
    if (unlikely(!block))
        return nullptr;

    size_t len = 0;
    char32_t codepoint;

    // Pass 1: measure the buffer size needed. ucs4_to_utf8 is called
    // with a null output pointer and only its return value is summed.
    // NOTE(review): utf16_to_ucs4_upd presumably advances `in`; confirm.
    for (char16_t const *in = block;
         (codepoint = utf16_to_ucs4_upd(in)) != 0;
         len += ucs4_to_utf8(nullptr, codepoint));

    // Allocate output buffer, with room for the terminator
    char *result = (char*)malloc(len + 1);
    if (unlikely(!result))
        return nullptr;

    char *out = result;

    // Pass 2: encode each code point into the output buffer
    if (likely(len)) {
        for (char16_t const *in = block;
             (codepoint = utf16_to_ucs4_upd(in)) != 0;
             out += ucs4_to_utf8(out, codepoint));
    }

    // Terminate explicitly instead of relying on ucs4_to_utf8 to
    // leave a null character behind the last encoded code point
    *out = 0;

    assert(result + len == out);
    assert(result[len] == 0);

    return result;
}