Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion libc/src/string/memchr.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,8 @@ namespace __llvm_libc {
// TODO: Look at performance benefits of comparing words.
LLVM_LIBC_FUNCTION(void *, memchr, (const void *src, int c, size_t n)) {
return internal::find_first_character(
reinterpret_cast<const unsigned char *>(src), c, n);
reinterpret_cast<const unsigned char *>(src),
static_cast<unsigned char>(c), n);
}

} // namespace __llvm_libc
8 changes: 4 additions & 4 deletions libc/src/string/memcpy.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -30,8 +30,8 @@ namespace __llvm_libc {
// implementation parameters.
// - As compilers and processors get better, the generated code is improved
// with little change on the code side.
static void memcpy_impl(char *__restrict dst, const char *__restrict src,
size_t count) {
static void memcpy_impl(unsigned char *__restrict dst,
const unsigned char *__restrict src, size_t count) {
// Use scalar strategies (_1, _2, _3 ...)
using namespace __llvm_libc::scalar;

Expand Down Expand Up @@ -61,8 +61,8 @@ static void memcpy_impl(char *__restrict dst, const char *__restrict src,
LLVM_LIBC_FUNCTION(void *, memcpy,
(void *__restrict dst, const void *__restrict src,
size_t size)) {
memcpy_impl(reinterpret_cast<char *>(dst),
reinterpret_cast<const char *>(src), size);
memcpy_impl(reinterpret_cast<unsigned char *>(dst),
reinterpret_cast<const unsigned char *>(src), size);
return dst;
}

Expand Down
12 changes: 5 additions & 7 deletions libc/src/string/memmove.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -15,22 +15,20 @@

namespace __llvm_libc {

static inline void move_byte_forward(char *dest_m, const char *src_m,
size_t count) {
static inline void move_byte_forward(unsigned char *dest_m, const unsigned char *src_m, size_t count) {
for (size_t offset = 0; count; --count, ++offset)
dest_m[offset] = src_m[offset];
}

static inline void move_byte_backward(char *dest_m, const char *src_m,
size_t count) {
static inline void move_byte_backward(unsigned char *dest_m, const unsigned char *src_m, size_t count) {
for (size_t offset = count - 1; count; --count, --offset)
dest_m[offset] = src_m[offset];
}

LLVM_LIBC_FUNCTION(void *, memmove,
(void *dest, const void *src, size_t count)) {
char *dest_c = reinterpret_cast<char *>(dest);
const char *src_c = reinterpret_cast<const char *>(src);
unsigned char *dest_c = reinterpret_cast<unsigned char *>(dest);
const unsigned char *src_c = reinterpret_cast<const unsigned char *>(src);

// If the distance between src_c and dest_c is equal to or greater
// than count (integerAbs(src_c - dest_c) >= count), they would not overlap.
Expand Down Expand Up @@ -58,7 +56,7 @@ LLVM_LIBC_FUNCTION(void *, memmove,
// TODO: Optimize `move_byte_xxx(...)` functions.
if (dest_c < src_c)
move_byte_forward(dest_c, src_c, count);
if (dest_c > src_c)
else if (dest_c > src_c)
move_byte_backward(dest_c, src_c, count);
return dest;
}
Expand Down
7 changes: 3 additions & 4 deletions libc/src/string/memrchr.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -14,11 +14,10 @@ namespace __llvm_libc {

LLVM_LIBC_FUNCTION(void *, memrchr, (const void *src, int c, size_t n)) {
const unsigned char *str = reinterpret_cast<const unsigned char *>(src);
const unsigned char ch = c;
const unsigned char ch = static_cast<unsigned char>(c);
for (; n != 0; --n) {
const unsigned char *s = str + n - 1;
if (*s == ch)
return const_cast<unsigned char *>(s);
if (*(--str) == ch)
return const_cast<unsigned char *>(str);
}
return nullptr;
}
Expand Down
12 changes: 6 additions & 6 deletions libc/src/string/strchr.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -14,12 +14,12 @@ namespace __llvm_libc {

// TODO: Look at performance benefits of comparing words.
LLVM_LIBC_FUNCTION(char *, strchr, (const char *src, int c)) {
unsigned char *str =
const_cast<unsigned char *>(reinterpret_cast<const unsigned char *>(src));
const unsigned char ch = c;
for (; *str && *str != ch; ++str)
;
return *str == ch ? reinterpret_cast<char *>(str) : nullptr;
const char ch = static_cast<char>(c);
for (; *src != ch; ++src)
if (*src == '\0')
return nullptr;

return const_cast<char *>(src);
}

} // namespace __llvm_libc
54 changes: 49 additions & 5 deletions libc/src/string/strcpy.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,17 +7,61 @@
//===----------------------------------------------------------------------===//

#include "src/string/strcpy.h"
#include "src/string/memcpy.h"
#include "src/string/string_utils.h"

#include "src/__support/common.h"
#include "src/string/memory_utils/elements.h"

namespace __llvm_libc {

// Design rationale
// ================
//
// Using a profiler to observe size distributions for calls into libc
// functions, it was found most operations act on a small number of bytes.
// This makes it important to favor small sizes.
//
// The tests for `count` are in ascending order so the cost of branching is
// proportional to the cost of copying.
//
// The function is written in C++ for several reasons:
// - The compiler can __see__ the code, this is useful when performing Profile
// Guided Optimization as the optimized code can take advantage of branching
// probabilities.
// - It also allows for easier customization and favors testing multiple
// implementation parameters.
// - As compilers and processors get better, the generated code is improved
// with little change on the code side.
static void strcpy_impl(char *__restrict dst, const char *__restrict src,
size_t count) {
// Use scalar strategies (_1, _2, _3 ...)
using namespace __llvm_libc::scalar;

if (count == 0)
return;
if (count == 1)
return Copy<_1>(dst, src);
if (count == 2)
return Copy<_2>(dst, src);
if (count == 3)
return Copy<_3>(dst, src);
if (count == 4)
return Copy<_4>(dst, src);
if (count < 8)
return Copy<HeadTail<_4>>(dst, src, count);
if (count < 16)
return Copy<HeadTail<_8>>(dst, src, count);
if (count < 32)
return Copy<HeadTail<_16>>(dst, src, count);
if (count < 64)
return Copy<HeadTail<_32>>(dst, src, count);
if (count < 128)
return Copy<HeadTail<_64>>(dst, src, count);
return Copy<Align<_32, Arg::Src>::Then<Loop<_32>>>(dst, src, count);
}

LLVM_LIBC_FUNCTION(char *, strcpy,
(char *__restrict dest, const char *__restrict src)) {
return reinterpret_cast<char *>(
__llvm_libc::memcpy(dest, src, internal::string_length(src) + 1));
strcpy_impl(dest, src, internal::string_length(src) + 1));
return dest;
}

} // namespace __llvm_libc
32 changes: 16 additions & 16 deletions libc/src/string/string_utils.h
Original file line number Diff line number Diff line change
Expand Up @@ -18,30 +18,31 @@ namespace internal {
// Returns the length of a string, denoted by the first occurrence
// of a null terminator.
static inline size_t string_length(const char *src) {
size_t length;
for (length = 0; *src; ++src, ++length)
const char *const initial = src;
for (; *src != '\0'; ++src)
;
return length;
return src - initial;
}

// Returns the first occurrence of 'ch' within the first 'n' characters of
// 'src'. If 'ch' is not found, returns nullptr.
static inline void *find_first_character(const unsigned char *src,
unsigned char ch, size_t n) {
for (; n && *src != ch; --n, ++src)
;
return n ? const_cast<unsigned char *>(src) : nullptr;
for (; n != 0; --n, ++src)
if (*src == ch)
return const_cast<unsigned char *>(src);
return nullptr;
}

// Returns the maximum length span that contains only characters not found in
// 'segment'. If no characters are found, returns the length of 'src'.
static inline size_t complementary_span(const char *src, const char *segment) {
const char *initial = src;
const char *const initial = src;
cpp::Bitset<256> bitset;

for (; *segment; ++segment)
for (; *segment != '\0'; ++segment)
bitset.set(*segment);
for (; *src && !bitset.test(*src); ++src)
for (; *src != '\0' && !bitset.test(*src); ++src)
;
return src - initial;
}
Expand All @@ -59,22 +60,21 @@ static inline char *string_token(char *__restrict src,
const char *__restrict delimiter_string,
char **__restrict saveptr) {
cpp::Bitset<256> delimiter_set;
for (; *delimiter_string; ++delimiter_string)
for (; *delimiter_string != '\0'; ++delimiter_string)
delimiter_set.set(*delimiter_string);

src = src ? src : *saveptr;
for (; *src && delimiter_set.test(*src); ++src)
for (; *src != '\0' && delimiter_set.test(*src); ++src)
;
if (!*src) {
if (*src == '\0') {
*saveptr = src;
return nullptr;
}
char *token = src;
for (; *src && !delimiter_set.test(*src); ++src)
for (; *src != '\0' && !delimiter_set.test(*src); ++src)
;
if (*src) {
*src = '\0';
++src;
if (*src != '\0') {
*src++ = '\0';
}
*saveptr = src;
return token;
Expand Down
4 changes: 2 additions & 2 deletions libc/src/string/strrchr.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -13,12 +13,12 @@
namespace __llvm_libc {

LLVM_LIBC_FUNCTION(char *, strrchr, (const char *src, int c)) {
const char ch = c;
const char ch = static_cast<char>(c);
char *last_occurrence = nullptr;
do {
if (*src == ch)
last_occurrence = const_cast<char *>(src);
} while (*src++);
} while (*src++ != '\0');
return last_occurrence;
}

Expand Down