123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481 |
- // Copyright 2017 The Abseil Authors.
- //
- // Licensed under the Apache License, Version 2.0 (the "License");
- // you may not use this file except in compliance with the License.
- // You may obtain a copy of the License at
- //
- // https://www.apache.org/licenses/LICENSE-2.0
- //
- // Unless required by applicable law or agreed to in writing, software
- // distributed under the License is distributed on an "AS IS" BASIS,
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- // See the License for the specific language governing permissions and
- // limitations under the License.
- //
- // This file declares INTERNAL parts of the Split API that are inline/templated
- // or otherwise need to be available at compile time. The main abstractions
- // defined in here are
- //
- // - ConvertibleToStringView
- // - SplitIterator<>
- // - Splitter<>
- //
- // DO NOT INCLUDE THIS FILE DIRECTLY. Use this file by including
- // absl/strings/str_split.h.
- //
- // IWYU pragma: private, include "absl/strings/str_split.h"
- #include <array>
- #include <initializer_list>
- #include <iterator>
- #include <tuple>
- #include <type_traits>
- #include <utility>
- #include <vector>
- #include "absl/base/macros.h"
- #include "absl/base/port.h"
- #include "absl/meta/type_traits.h"
- #include "absl/strings/string_view.h"
- #include "absl/strings/internal/stl_type_traits.h"
- #endif // _GLIBCXX_DEBUG
- namespace absl {
- namespace strings_internal {
- // This class is implicitly constructible from everything that absl::string_view
- // is implicitly constructible from, except for rvalue strings. This means it
- // can be used as a function parameter in places where passing a temporary
- // string might cause memory lifetime issues.
- class ConvertibleToStringView {
- public:
- ConvertibleToStringView(const char* s) // NOLINT(runtime/explicit)
- : value_(s) {}
- ConvertibleToStringView(char* s) : value_(s) {} // NOLINT(runtime/explicit)
- ConvertibleToStringView(absl::string_view s) // NOLINT(runtime/explicit)
- : value_(s) {}
- ConvertibleToStringView(const std::string& s) // NOLINT(runtime/explicit)
- : value_(s) {}
- // Disable conversion from rvalue strings.
- ConvertibleToStringView(std::string&& s) = delete;
- ConvertibleToStringView(const std::string&& s) = delete;
- absl::string_view value() const { return value_; }
- private:
- absl::string_view value_;
- };
- // An iterator that enumerates the parts of a string from a Splitter. The text
- // to be split, the Delimiter, and the Predicate are all taken from the given
- // Splitter object. Iterators may only be compared if they refer to the same
- // Splitter instance.
- //
- // This class is NOT part of the public splitting API.
- template <typename Splitter>
- class SplitIterator {
- public:
- using iterator_category = std::input_iterator_tag;
- using value_type = absl::string_view;
- using difference_type = ptrdiff_t;
- using pointer = const value_type*;
- using reference = const value_type&;
- enum State { kInitState, kLastState, kEndState };
- SplitIterator(State state, const Splitter* splitter)
- : pos_(0),
- state_(state),
- splitter_(splitter),
- delimiter_(splitter->delimiter()),
- predicate_(splitter->predicate()) {
- // Hack to maintain backward compatibility. This one block makes it so an
- // empty absl::string_view whose .data() happens to be nullptr behaves
- // *differently* from an otherwise empty absl::string_view whose .data() is
- // not nullptr. This is an undesirable difference in general, but this
- // behavior is maintained to avoid breaking existing code that happens to
- // depend on this old behavior/bug. Perhaps it will be fixed one day. The
- // difference in behavior is as follows:
- // Split(absl::string_view(""), '-'); // {""}
- // Split(absl::string_view(), '-'); // {}
- if (splitter_->text().data() == nullptr) {
- state_ = kEndState;
- pos_ = splitter_->text().size();
- return;
- }
- if (state_ == kEndState) {
- pos_ = splitter_->text().size();
- } else {
- ++(*this);
- }
- }
- bool at_end() const { return state_ == kEndState; }
- reference operator*() const { return curr_; }
- pointer operator->() const { return &curr_; }
- SplitIterator& operator++() {
- do {
- if (state_ == kLastState) {
- state_ = kEndState;
- return *this;
- }
- const absl::string_view text = splitter_->text();
- const absl::string_view d = delimiter_.Find(text, pos_);
- if (d.data() == text.data() + text.size()) state_ = kLastState;
- curr_ = text.substr(pos_,
- static_cast<size_t>(d.data() - (text.data() + pos_)));
- pos_ += curr_.size() + d.size();
- } while (!predicate_(curr_));
- return *this;
- }
- SplitIterator operator++(int) {
- SplitIterator old(*this);
- ++(*this);
- return old;
- }
- friend bool operator==(const SplitIterator& a, const SplitIterator& b) {
- return a.state_ == b.state_ && a.pos_ == b.pos_;
- }
- friend bool operator!=(const SplitIterator& a, const SplitIterator& b) {
- return !(a == b);
- }
- private:
- size_t pos_;
- State state_;
- absl::string_view curr_;
- const Splitter* splitter_;
- typename Splitter::DelimiterType delimiter_;
- typename Splitter::PredicateType predicate_;
- };
- // HasMappedType<T>::value is true iff there exists a type T::mapped_type.
- template <typename T, typename = void>
- struct HasMappedType : std::false_type {};
- template <typename T>
- struct HasMappedType<T, absl::void_t<typename T::mapped_type>>
- : std::true_type {};
- // HasValueType<T>::value is true iff there exists a type T::value_type.
- template <typename T, typename = void>
- struct HasValueType : std::false_type {};
- template <typename T>
- struct HasValueType<T, absl::void_t<typename T::value_type>> : std::true_type {
- };
- // HasConstIterator<T>::value is true iff there exists a type T::const_iterator.
- template <typename T, typename = void>
- struct HasConstIterator : std::false_type {};
- template <typename T>
- struct HasConstIterator<T, absl::void_t<typename T::const_iterator>>
- : std::true_type {};
- // HasEmplace<T>::value is true iff there exists a method T::emplace().
- template <typename T, typename = void>
- struct HasEmplace : std::false_type {};
- template <typename T>
- struct HasEmplace<T, absl::void_t<decltype(std::declval<T>().emplace())>>
- : std::true_type {};
// IsInitializerList<T>::value is true exactly when T is a specialization of
// std::initializer_list. The answer is obtained through overload resolution on
// a pointer to T: the template overload wins for std::initializer_list<U>*,
// every other pointer type falls through to the variadic catch-all. The two
// dispatch functions are declared only; they are used solely inside decltype.
std::false_type IsInitializerListDispatch(...);  // fallback: not a match

template <typename Element>
std::true_type IsInitializerListDispatch(std::initializer_list<Element>*);

template <typename T>
struct IsInitializerList
    : decltype(IsInitializerListDispatch(std::declval<T*>())) {};
- // A SplitterIsConvertibleTo<C>::type alias exists iff the specified condition
- // is true for type 'C'.
- //
- // Restricts conversion to container-like types (by testing for the presence of
- // a const_iterator member type) and also to disable conversion to an
- // std::initializer_list (which also has a const_iterator). Otherwise, code
- // compiled in C++11 will get an error due to ambiguous conversion paths (in
- // C++11 std::vector<T>::operator= is overloaded to take either a std::vector<T>
- // or an std::initializer_list<T>).
- template <typename C, bool has_value_type, bool has_mapped_type>
- struct SplitterIsConvertibleToImpl : std::false_type {};
- template <typename C>
- struct SplitterIsConvertibleToImpl<C, true, false>
- : std::is_constructible<typename C::value_type, absl::string_view> {};
- template <typename C>
- struct SplitterIsConvertibleToImpl<C, true, true>
- : absl::conjunction<
- std::is_constructible<typename C::key_type, absl::string_view>,
- std::is_constructible<typename C::mapped_type, absl::string_view>> {};
- template <typename C>
- struct SplitterIsConvertibleTo
- : SplitterIsConvertibleToImpl<
- C,
- !IsStrictlyBaseOfAndConvertibleToSTLContainer<C>::value &&
- #endif // _GLIBCXX_DEBUG
- !IsInitializerList<
- typename std::remove_reference<C>::type>::value &&
- HasValueType<C>::value && HasConstIterator<C>::value,
- HasMappedType<C>::value> {
- };
- template <typename StringType, typename Container, typename = void>
- struct ShouldUseLifetimeBound : std::false_type {};
- template <typename StringType, typename Container>
- struct ShouldUseLifetimeBound<
- StringType, Container,
- std::enable_if_t<
- std::is_same<StringType, std::string>::value &&
- std::is_same<typename Container::value_type, absl::string_view>::value>>
- : std::true_type {};
- template <typename StringType, typename First, typename Second>
- using ShouldUseLifetimeBoundForPair = std::integral_constant<
- bool, std::is_same<StringType, std::string>::value &&
- (std::is_same<First, absl::string_view>::value ||
- std::is_same<Second, absl::string_view>::value)>;
- // This class implements the range that is returned by absl::StrSplit(). This
- // class has templated conversion operators that allow it to be implicitly
- // converted to a variety of types that the caller may have specified on the
- // left-hand side of an assignment.
- //
- // The main interface for interacting with this class is through its implicit
- // conversion operators. However, this class may also be used like a container
- // in that it has .begin() and .end() member functions. It may also be used
- // within a range-for loop.
- //
- // Output containers can be collections of any type that is constructible from
- // an absl::string_view.
- //
- // An Predicate functor may be supplied. This predicate will be used to filter
- // the split strings: only strings for which the predicate returns true will be
- // kept. A Predicate object is any unary functor that takes an absl::string_view
- // and returns bool.
- //
- // The StringType parameter can be either string_view or string, depending on
- // whether the Splitter refers to a string stored elsewhere, or if the string
- // resides inside the Splitter itself.
- template <typename Delimiter, typename Predicate, typename StringType>
- class Splitter {
- public:
- using DelimiterType = Delimiter;
- using PredicateType = Predicate;
- using const_iterator = strings_internal::SplitIterator<Splitter>;
- using value_type = typename std::iterator_traits<const_iterator>::value_type;
- Splitter(StringType input_text, Delimiter d, Predicate p)
- : text_(std::move(input_text)),
- delimiter_(std::move(d)),
- predicate_(std::move(p)) {}
- absl::string_view text() const { return text_; }
- const Delimiter& delimiter() const { return delimiter_; }
- const Predicate& predicate() const { return predicate_; }
- // Range functions that iterate the split substrings as absl::string_view
- // objects. These methods enable a Splitter to be used in a range-based for
- // loop.
- const_iterator begin() const { return {const_iterator::kInitState, this}; }
- const_iterator end() const { return {const_iterator::kEndState, this}; }
- // An implicit conversion operator that is restricted to only those containers
- // that the splitter is convertible to.
- template <
- typename Container,
- std::enable_if_t<ShouldUseLifetimeBound<StringType, Container>::value &&
- SplitterIsConvertibleTo<Container>::value,
- std::nullptr_t> = nullptr>
- // NOLINTNEXTLINE(google-explicit-constructor)
- operator Container() const ABSL_ATTRIBUTE_LIFETIME_BOUND {
- return ConvertToContainer<Container, typename Container::value_type,
- HasMappedType<Container>::value>()(*this);
- }
- template <
- typename Container,
- std::enable_if_t<!ShouldUseLifetimeBound<StringType, Container>::value &&
- SplitterIsConvertibleTo<Container>::value,
- std::nullptr_t> = nullptr>
- // NOLINTNEXTLINE(google-explicit-constructor)
- operator Container() const {
- return ConvertToContainer<Container, typename Container::value_type,
- HasMappedType<Container>::value>()(*this);
- }
- // Returns a pair with its .first and .second members set to the first two
- // strings returned by the begin() iterator. Either/both of .first and .second
- // will be constructed with empty strings if the iterator doesn't have a
- // corresponding value.
- template <typename First, typename Second,
- std::enable_if_t<
- ShouldUseLifetimeBoundForPair<StringType, First, Second>::value,
- std::nullptr_t> = nullptr>
- // NOLINTNEXTLINE(google-explicit-constructor)
- operator std::pair<First, Second>() const ABSL_ATTRIBUTE_LIFETIME_BOUND {
- return ConvertToPair<First, Second>();
- }
- template <typename First, typename Second,
- std::enable_if_t<!ShouldUseLifetimeBoundForPair<StringType, First,
- Second>::value,
- std::nullptr_t> = nullptr>
- // NOLINTNEXTLINE(google-explicit-constructor)
- operator std::pair<First, Second>() const {
- return ConvertToPair<First, Second>();
- }
- private:
- template <typename First, typename Second>
- std::pair<First, Second> ConvertToPair() const {
- absl::string_view first, second;
- auto it = begin();
- if (it != end()) {
- first = *it;
- if (++it != end()) {
- second = *it;
- }
- }
- return {First(first), Second(second)};
- }
- // ConvertToContainer is a functor converting a Splitter to the requested
- // Container of ValueType. It is specialized below to optimize splitting to
- // certain combinations of Container and ValueType.
- //
- // This base template handles the generic case of storing the split results in
- // the requested non-map-like container and converting the split substrings to
- // the requested type.
- template <typename Container, typename ValueType, bool is_map = false>
- struct ConvertToContainer {
- Container operator()(const Splitter& splitter) const {
- Container c;
- auto it = std::inserter(c, c.end());
- for (const auto& sp : splitter) {
- *it++ = ValueType(sp);
- }
- return c;
- }
- };
- // Partial specialization for a std::vector<absl::string_view>.
- //
- // Optimized for the common case of splitting to a
- // std::vector<absl::string_view>. In this case we first split the results to
- // a small array of absl::string_view on the stack, to reduce reallocations.
- template <typename A>
- struct ConvertToContainer<std::vector<absl::string_view, A>,
- absl::string_view, false> {
- std::vector<absl::string_view, A> operator()(
- const Splitter& splitter) const {
- struct raw_view {
- const char* data;
- size_t size;
- operator absl::string_view() const { // NOLINT(runtime/explicit)
- return {data, size};
- }
- };
- std::vector<absl::string_view, A> v;
- std::array<raw_view, 16> ar;
- for (auto it = splitter.begin(); !it.at_end();) {
- size_t index = 0;
- do {
- ar[index].data = it->data();
- ar[index].size = it->size();
- ++it;
- } while (++index != ar.size() && !it.at_end());
- v.insert(v.end(), ar.begin(), ar.begin() + index);
- }
- return v;
- }
- };
- // Partial specialization for a std::vector<std::string>.
- //
- // Optimized for the common case of splitting to a std::vector<std::string>.
- // In this case we first split the results to a std::vector<absl::string_view>
- // so the returned std::vector<std::string> can have space reserved to avoid
- // std::string moves.
- template <typename A>
- struct ConvertToContainer<std::vector<std::string, A>, std::string, false> {
- std::vector<std::string, A> operator()(const Splitter& splitter) const {
- const std::vector<absl::string_view> v = splitter;
- return std::vector<std::string, A>(v.begin(), v.end());
- }
- };
- // Partial specialization for containers of pairs (e.g., maps).
- //
- // The algorithm is to insert a new pair into the map for each even-numbered
- // item, with the even-numbered item as the key with a default-constructed
- // value. Each odd-numbered item will then be assigned to the last pair's
- // value.
- template <typename Container, typename First, typename Second>
- struct ConvertToContainer<Container, std::pair<const First, Second>, true> {
- using iterator = typename Container::iterator;
- Container operator()(const Splitter& splitter) const {
- Container m;
- iterator it;
- bool insert = true;
- for (const absl::string_view sv : splitter) {
- if (insert) {
- it = InsertOrEmplace(&m, sv);
- } else {
- it->second = Second(sv);
- }
- insert = !insert;
- }
- return m;
- }
- // Inserts the key and an empty value into the map, returning an iterator to
- // the inserted item. We use emplace() if available, otherwise insert().
- template <typename M>
- static absl::enable_if_t<HasEmplace<M>::value, iterator> InsertOrEmplace(
- M* m, absl::string_view key) {
- // Use piecewise_construct to support old versions of gcc in which pair
- // constructor can't otherwise construct string from string_view.
- return ToIter(m->emplace(std::piecewise_construct, std::make_tuple(key),
- std::tuple<>()));
- }
- template <typename M>
- static absl::enable_if_t<!HasEmplace<M>::value, iterator> InsertOrEmplace(
- M* m, absl::string_view key) {
- return ToIter(m->insert(std::make_pair(First(key), Second(""))));
- }
- static iterator ToIter(std::pair<iterator, bool> pair) {
- return pair.first;
- }
- static iterator ToIter(iterator iter) { return iter; }
- };
- StringType text_;
- Delimiter delimiter_;
- Predicate predicate_;
- };
- } // namespace strings_internal
- } // namespace absl