2011-08-12 00:25:59 +10:00
|
|
|
/*
|
2015-04-13 18:05:28 +10:00
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
2011-08-12 00:25:59 +10:00
|
|
|
*
|
2015-04-13 18:05:28 +10:00
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
2011-08-12 00:25:59 +10:00
|
|
|
*
|
2015-04-13 18:05:28 +10:00
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
2011-08-12 00:25:59 +10:00
|
|
|
*
|
2016-03-17 18:13:19 +11:00
|
|
|
* Copyright 2011-2016 Danny Robson <danny@nerdcruft.net>
|
2011-08-12 00:25:59 +10:00
|
|
|
*/
|
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
#ifndef CRUFT_UTIL_STRING_HPP
|
|
|
|
#define CRUFT_UTIL_STRING_HPP
|
2011-08-12 00:25:59 +10:00
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
#include "debug.hpp"
|
2017-11-22 16:49:37 +11:00
|
|
|
#include "view.hpp"
|
2016-03-17 18:13:19 +11:00
|
|
|
|
|
|
|
|
2016-11-22 21:48:57 +11:00
|
|
|
namespace util {
|
|
|
|
std::string to_utf8 (const wchar_t*);
|
|
|
|
std::string to_utf8 (const std::wstring&);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2011-08-12 00:25:59 +10:00
|
|
|
bool
|
|
|
|
strbegins(const char *restrict str,
|
|
|
|
const char *restrict prefix);
|
|
|
|
|
2016-03-17 18:13:19 +11:00
|
|
|
|
|
|
|
namespace util {
|
2016-03-18 11:08:12 +11:00
|
|
|
template <typename Iterator>
|
2016-03-17 18:13:19 +11:00
|
|
|
struct tokeniser {
|
|
|
|
public:
|
2016-03-18 11:08:12 +11:00
|
|
|
using value_type = typename std::iterator_traits<Iterator>::value_type;
|
|
|
|
using range_type = view<Iterator>;
|
2016-03-17 18:13:19 +11:00
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
tokeniser (util::view<Iterator,Iterator> _range, value_type _separator):
|
|
|
|
m_range (_range),
|
|
|
|
m_separator (_separator)
|
|
|
|
{ ; }
|
2016-03-17 18:13:19 +11:00
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
tokeniser (const char *_range, char _separator):
|
|
|
|
m_range (_range),
|
|
|
|
m_separator (_separator)
|
2017-09-15 15:22:29 +10:00
|
|
|
{ ; }
|
|
|
|
|
|
|
|
struct iterator : public std::iterator<
|
|
|
|
std::forward_iterator_tag,
|
|
|
|
range_type,
|
|
|
|
std::size_t
|
|
|
|
> {
|
2016-03-17 18:13:19 +11:00
|
|
|
public:
|
2018-01-30 11:31:40 +11:00
|
|
|
iterator operator++ (int)
|
|
|
|
{
|
|
|
|
iterator res(*this);
|
|
|
|
++*this;
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
iterator& operator++ (void)&
|
|
|
|
{
|
|
|
|
auto newend = m_range.cend ();
|
|
|
|
if (newend != m_end) {
|
|
|
|
CHECK_EQ (*m_range.cend (), m_separator);
|
|
|
|
newend++;
|
|
|
|
}
|
|
|
|
|
|
|
|
m_range = {
|
|
|
|
newend,
|
|
|
|
std::find (newend, m_end, m_separator)
|
|
|
|
};
|
|
|
|
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2018-04-01 14:46:32 +10:00
|
|
|
iterator operator+ (int count)
|
|
|
|
{
|
|
|
|
auto next = *this;
|
|
|
|
std::advance (next, count);
|
|
|
|
return next;
|
|
|
|
}
|
|
|
|
|
2018-03-27 16:05:46 +11:00
|
|
|
const range_type& operator* (void) const
|
2018-01-30 11:31:40 +11:00
|
|
|
{
|
|
|
|
return m_range;
|
|
|
|
}
|
|
|
|
|
2018-04-01 14:44:43 +10:00
|
|
|
const range_type* operator-> (void) const
|
|
|
|
{
|
|
|
|
return &m_range;
|
|
|
|
}
|
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
bool operator== (const iterator &rhs) const
|
|
|
|
{
|
|
|
|
return m_range == rhs.m_range && m_separator == rhs.m_separator;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool operator!= (const iterator &rhs) const
|
|
|
|
{
|
|
|
|
return !(*this == rhs);
|
|
|
|
}
|
2016-03-17 18:13:19 +11:00
|
|
|
|
|
|
|
private:
|
2018-01-30 11:31:40 +11:00
|
|
|
iterator (range_type _range, value_type _separator):
|
|
|
|
m_separator (_separator),
|
|
|
|
m_range (_range.cbegin (),
|
|
|
|
std::find (_range.cbegin (),
|
|
|
|
_range.cend (),
|
|
|
|
_separator)
|
|
|
|
),
|
|
|
|
m_end (_range.cend ())
|
|
|
|
{ ; }
|
2016-03-18 11:08:12 +11:00
|
|
|
|
2018-04-01 14:47:33 +10:00
|
|
|
value_type m_separator;
|
2016-03-17 18:13:19 +11:00
|
|
|
range_type m_range;
|
2016-03-18 11:08:12 +11:00
|
|
|
Iterator m_end;
|
|
|
|
|
|
|
|
friend tokeniser;
|
2016-03-17 18:13:19 +11:00
|
|
|
};
|
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
iterator cbegin (void) const { return { m_range, m_separator }; }
|
|
|
|
iterator begin (void) const { return { m_range, m_separator }; }
|
2016-03-17 18:13:19 +11:00
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
iterator cend (void) const { return { { m_range.cend (), m_range.cend () }, m_separator }; }
|
|
|
|
iterator end (void) const { return { { m_range.cend (), m_range.cend () }, m_separator }; }
|
2016-03-17 18:13:19 +11:00
|
|
|
|
|
|
|
private:
|
2016-03-18 11:08:12 +11:00
|
|
|
const range_type m_range;
|
2016-03-17 18:13:19 +11:00
|
|
|
const value_type m_separator;
|
|
|
|
};
|
2016-03-18 11:08:12 +11:00
|
|
|
|
2017-09-15 15:22:29 +10:00
|
|
|
|
2018-01-30 11:31:40 +11:00
|
|
|
template <typename ContainerT>
|
|
|
|
tokeniser (ContainerT&, typename ContainerT::value_type) -> tokeniser<typename ContainerT::iterator>;
|
|
|
|
|
|
|
|
tokeniser (const char*,char) -> tokeniser<const char*>;
|
|
|
|
|
2017-09-15 15:22:29 +10:00
|
|
|
///////////////////////////////////////////////////////////////////////////
|
|
|
|
template <typename CharT, std::size_t LengthV>
|
|
|
|
auto
|
|
|
|
make_tokeniser (CharT (&data)[LengthV], CharT separator)
|
|
|
|
{
|
|
|
|
return tokeniser { std::begin (data), std::end (data), separator };
|
|
|
|
}
|
2016-03-17 18:13:19 +11:00
|
|
|
}
|
|
|
|
|
2011-08-12 00:25:59 +10:00
|
|
|
#endif // __UTIL_STRING_HPP
|
|
|
|
|