159 lines
4.4 KiB
C++
159 lines
4.4 KiB
C++
/*
 * Copyright (c) 2003-2014, John Wiegley. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met:
 *
 * - Redistributions of source code must retain the above copyright
 *   notice, this list of conditions and the following disclaimer.
 *
 * - Redistributions in binary form must reproduce the above copyright
 *   notice, this list of conditions and the following disclaimer in the
 *   documentation and/or other materials provided with the distribution.
 *
 * - Neither the name of New Artisans LLC nor the names of its
 *   contributors may be used to endorse or promote products derived from
 *   this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
|
|
|
|
/**
 * @addtogroup utils
 */

/**
 * @file   unistring.h
 * @author John Wiegley
 *
 * @ingroup utils
 */
|
|
#ifndef _UNISTRING_H
|
|
#define _UNISTRING_H
|
|
|
|
namespace ledger {
|
|
|
|
// Declared here and defined elsewhere: takes one 32-bit code point and returns
// an int, which unistring::width() sums over a string to obtain its width.
// NOTE(review): presumably the terminal column count of `ucs` in the style of
// Markus Kuhn's wcwidth(), which may be negative for non-printable input --
// confirm against the definition.
int mk_wcwidth(boost::uint32_t ucs);
|
|
|
|
/**
|
|
* @class unistring
|
|
*
|
|
* @brief Abstract working with UTF-32 encoded Unicode strings
|
|
*
|
|
* The input to the string is a UTF8 encoded ledger::string, which can
|
|
* then have its true length be taken, or characters extracted.
|
|
*/
|
|
class unistring
|
|
{
|
|
public:
|
|
static const std::size_t npos = static_cast<std::size_t>(-1);
|
|
|
|
std::vector<boost::uint32_t> utf32chars;
|
|
|
|
unistring() {
|
|
TRACE_CTOR(unistring, "");
|
|
}
|
|
unistring(const std::string& input)
|
|
{
|
|
const char * p = input.c_str();
|
|
std::size_t len = input.length();
|
|
|
|
assert(len < 1024);
|
|
VERIFY(utf8::is_valid(p, p + len));
|
|
utf8::unchecked::utf8to32(p, p + len, std::back_inserter(utf32chars));
|
|
|
|
TRACE_CTOR(unistring, "std::string");
|
|
}
|
|
~unistring() {
|
|
TRACE_DTOR(unistring);
|
|
}
|
|
|
|
std::size_t length() const {
|
|
return utf32chars.size();
|
|
}
|
|
|
|
std::size_t width() const {
|
|
std::size_t width = 0;
|
|
foreach (const boost::uint32_t& ch, utf32chars) {
|
|
width += mk_wcwidth(ch);
|
|
}
|
|
return width;
|
|
}
|
|
|
|
std::string extract(const std::string::size_type begin = 0,
|
|
const std::string::size_type len = 0) const
|
|
{
|
|
std::string utf8result;
|
|
std::string::size_type this_len = length();
|
|
|
|
assert(begin <= this_len);
|
|
assert(begin + len <= this_len);
|
|
|
|
if (this_len)
|
|
utf8::unchecked::utf32to8
|
|
(utf32chars.begin() + static_cast<std::string::difference_type>(begin),
|
|
utf32chars.begin() + static_cast<std::string::difference_type>(begin) +
|
|
static_cast<std::string::difference_type>
|
|
(len ? (len > this_len ? this_len : len) : this_len),
|
|
std::back_inserter(utf8result));
|
|
|
|
return utf8result;
|
|
}
|
|
|
|
std::size_t find(const boost::uint32_t __s, std::size_t __pos = 0) const {
|
|
std::size_t idx = 0;
|
|
foreach (const boost::uint32_t& ch, utf32chars) {
|
|
if (idx >= __pos && ch == __s)
|
|
return idx;
|
|
idx++;
|
|
}
|
|
return npos;
|
|
}
|
|
|
|
boost::uint32_t& operator[](const std::size_t index) {
|
|
return utf32chars[index];
|
|
}
|
|
const boost::uint32_t& operator[](const std::size_t index) const {
|
|
return utf32chars[index];
|
|
}
|
|
};
|
|
|
|
inline void justify(std::ostream& out,
|
|
const std::string& str,
|
|
int width,
|
|
bool right = false,
|
|
bool redden = false)
|
|
{
|
|
if (! right) {
|
|
if (redden) out << "\033[31m";
|
|
out << str;
|
|
if (redden) out << "\033[0m";
|
|
}
|
|
|
|
unistring temp(str);
|
|
|
|
int spacing = width - int(temp.width());
|
|
while (spacing-- > 0)
|
|
out << ' ';
|
|
|
|
if (right) {
|
|
if (redden) out << "\033[31m";
|
|
out << str;
|
|
if (redden) out << "\033[0m";
|
|
}
|
|
}
|
|
|
|
} // namespace ledger
|
|
|
|
#endif // _UNISTRING_H
|