diff --git a/libc/config/linux/aarch64/entrypoints.txt b/libc/config/linux/aarch64/entrypoints.txt --- a/libc/config/linux/aarch64/entrypoints.txt +++ b/libc/config/linux/aarch64/entrypoints.txt @@ -27,6 +27,7 @@ libc.src.string.strcpy libc.src.string.strlen libc.src.string.strnlen + libc.src.string.strpbrk libc.src.string.strrchr libc.src.string.strspn libc.src.string.strstr diff --git a/libc/config/linux/x86_64/entrypoints.txt b/libc/config/linux/x86_64/entrypoints.txt --- a/libc/config/linux/x86_64/entrypoints.txt +++ b/libc/config/linux/x86_64/entrypoints.txt @@ -45,6 +45,7 @@ libc.src.string.strcpy libc.src.string.strlen libc.src.string.strnlen + libc.src.string.strpbrk libc.src.string.strrchr libc.src.string.strspn libc.src.string.strstr diff --git a/libc/src/string/CMakeLists.txt b/libc/src/string/CMakeLists.txt --- a/libc/src/string/CMakeLists.txt +++ b/libc/src/string/CMakeLists.txt @@ -100,6 +100,18 @@ strspn.cpp HDRS strspn.h + DEPENDS + libc.utils.CPP.standalone_cpp +) + +add_entrypoint_object( + strpbrk + SRCS + strpbrk.cpp + HDRS + strpbrk.h + DEPENDS + libc.utils.CPP.standalone_cpp ) # Helper to define a function with multiple implementations diff --git a/libc/src/string/strpbrk.h b/libc/src/string/strpbrk.h new file mode 100644 --- /dev/null +++ b/libc/src/string/strpbrk.h @@ -0,0 +1,20 @@ +//===-- Implementation header for strpbrk -----------------------*- C++ -*-===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// + +#ifndef LLVM_LIBC_SRC_STRING_STRSPN_H +#define LLVM_LIBC_SRC_STRING_STRSPN_H + +#include + +namespace __llvm_libc { + +char *strpbrk(const char *src, const char *breakset); + +} // namespace __llvm_libc + +#endif // LLVM_LIBC_SRC_STRING_STRSPN_H diff --git a/libc/src/string/strspn.cpp b/libc/src/string/strpbrk.cpp copy from libc/src/string/strspn.cpp copy to libc/src/string/strpbrk.cpp --- a/libc/src/string/strspn.cpp +++ b/libc/src/string/strpbrk.cpp @@ -1,4 +1,4 @@ -//===-- Implementation of strspn ------------------------------------------===// +//===-- Implementation of strpbrk -----------------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. @@ -6,24 +6,22 @@ // //===----------------------------------------------------------------------===// -#include "src/string/strspn.h" +#include "src/string/strpbrk.h" #include "src/__support/common.h" #include "utils/CPP/Bitset.h" #include -#include namespace __llvm_libc { -size_t LLVM_LIBC_ENTRYPOINT(strspn)(const char *src, const char *segment) { - const char *initial = src; +char *LLVM_LIBC_ENTRYPOINT(strpbrk)(const char *src, const char *breakset) { cpp::Bitset<256> bitset; - for (; *segment; ++segment) - bitset.set(*segment); - for (; *src && bitset.test(*src); ++src) + for (; *breakset; ++breakset) + bitset.set(*breakset); + for (; *src && !bitset.test(*src); ++src) ; - return src - initial; + return *src ? const_cast(src) : nullptr; } } // namespace __llvm_libc diff --git a/libc/src/string/strspn.cpp b/libc/src/string/strspn.cpp --- a/libc/src/string/strspn.cpp +++ b/libc/src/string/strspn.cpp @@ -11,7 +11,6 @@ #include "src/__support/common.h" #include "utils/CPP/Bitset.h" #include -#include namespace __llvm_libc { diff --git a/libc/test/src/string/CMakeLists.txt b/libc/test/src/string/CMakeLists.txt --- a/libc/test/src/string/CMakeLists.txt +++ b/libc/test/src/string/CMakeLists.txt @@ -112,6 +112,15 @@ libc.src.string.strspn ) +add_libc_unittest( + strpbrk_test + SUITE + libc_string_unittests + SRCS + strpbrk_test.cpp + DEPENDS + libc.src.string.strpbrk +) # Tests all implementations that can run on the host. function(add_libc_multi_impl_test name) diff --git a/libc/test/src/string/strpbrk_test.cpp b/libc/test/src/string/strpbrk_test.cpp new file mode 100644 --- /dev/null +++ b/libc/test/src/string/strpbrk_test.cpp @@ -0,0 +1,62 @@ +//===-- Unittests for strpbrk ---------------------------------------------===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// + +#include "src/string/strpbrk.h" + +#include "utils/UnitTest/Test.h" + +TEST(StrPBrkTest, EmptyStringShouldReturnNullptr) { + // The search should not include the null terminator. + EXPECT_STREQ(__llvm_libc::strpbrk("", ""), nullptr); + EXPECT_STREQ(__llvm_libc::strpbrk("_", ""), nullptr); + EXPECT_STREQ(__llvm_libc::strpbrk("", "_"), nullptr); +} + +TEST(StrPBrkTest, ShouldNotFindAnythingAfterNullTerminator) { + const char src[4] = {'a', 'b', '\0', 'c'}; + EXPECT_STREQ(__llvm_libc::strpbrk(src, "c"), nullptr); +} + +TEST(StrPBrkTest, ShouldReturnNullptrIfNoCharactersFound) { + EXPECT_STREQ(__llvm_libc::strpbrk("12345", "abcdef"), nullptr); +} + +TEST(StrPBrkTest, FindsFirstCharacter) { + const char *src = "12345"; + EXPECT_STREQ(__llvm_libc::strpbrk(src, "1"), "12345"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "-1"), "12345"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "1_"), "12345"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "f1_"), "12345"); + ASSERT_STREQ(src, "12345"); +} + +TEST(StrPBrkTest, FindsMiddleCharacter) { + const char *src = "12345"; + EXPECT_STREQ(__llvm_libc::strpbrk(src, "3"), "345"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "?3"), "345"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "3F"), "345"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "z3_"), "345"); + ASSERT_STREQ(src, "12345"); +} + +TEST(StrPBrkTest, FindsLastCharacter) { + const char *src = "12345"; + EXPECT_STREQ(__llvm_libc::strpbrk(src, "5"), "5"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "r5"), "5"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "59"), "5"); + EXPECT_STREQ(__llvm_libc::strpbrk(src, "n5_"), "5"); + ASSERT_STREQ(src, "12345"); +} + +TEST(StrPBrkTest, FindsFirstOfRepeated) { + EXPECT_STREQ(__llvm_libc::strpbrk("A,B,C,D", ","), ",B,C,D"); +} + +TEST(StrPBrkTest, FindsFirstInBreakset) { + EXPECT_STREQ(__llvm_libc::strpbrk("12345", "34"), "345"); +}