diff options
Diffstat (limited to 'src/unistring.h')
-rw-r--r-- | src/unistring.h | 128 |
1 files changed, 128 insertions, 0 deletions
diff --git a/src/unistring.h b/src/unistring.h new file mode 100644 index 00000000..7c433d9d --- /dev/null +++ b/src/unistring.h @@ -0,0 +1,128 @@ +/* + * Copyright (c) 2003-2009, John Wiegley. All rights reserved. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions are + * met: + * + * - Redistributions of source code must retain the above copyright + * notice, this list of conditions and the following disclaimer. + * + * - Redistributions in binary form must reproduce the above copyright + * notice, this list of conditions and the following disclaimer in the + * documentation and/or other materials provided with the distribution. + * + * - Neither the name of New Artisans LLC nor the names of its + * contributors may be used to endorse or promote products derived from + * this software without specific prior written permission. + * + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS + * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT + * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR + * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT + * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, + * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT + * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, + * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY + * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT + * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE + * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + */ + +/** + * @addtogroup utils + */ + +/** + * @file unistring.h + * @author John Wiegley + * + * @ingroup utils + */ +#ifndef _UNISTRING_H +#define _UNISTRING_H + +namespace ledger { + +/** + * @class unistring + * + * @brief Abstract working with UTF-32 encoded Unicode strings + * + * The input to the string is a UTF8 encoded ledger::string, which can + * then have its true length be taken, or characters extracted. + */ +class unistring +{ +public: + std::vector<boost::uint32_t> utf32chars; + + unistring() { + TRACE_CTOR(unistring, ""); + } + unistring(const std::string& input) + { + TRACE_CTOR(unistring, "std::string"); + + const char * p = input.c_str(); + std::size_t len = input.length(); + + VERIFY(utf8::is_valid(p, p + len)); + utf8::unchecked::utf8to32(p, p + len, std::back_inserter(utf32chars)); + } + ~unistring() { + TRACE_DTOR(unistring); + } + + std::size_t length() const { + return utf32chars.size(); + } + + std::string extract(const std::string::size_type begin = 0, + const std::string::size_type len = 0) const + { + std::string utf8result; + std::string::size_type this_len = length(); + + assert(begin <= this_len); + assert(begin + len <= this_len); + + if (this_len) + utf8::unchecked::utf32to8 + (utf32chars.begin() + begin, + utf32chars.begin() + begin + + (len ? (len > this_len ? this_len : len) : this_len), + std::back_inserter(utf8result)); + + return utf8result; + } +}; + +inline void justify(std::ostream& out, + const std::string& str, + int width, + bool right = false, + bool redden = false) +{ + if (! right) { + if (redden) out << "\033[31m"; + out << str; + if (redden) out << "\033[0m"; + } + + unistring temp(str); + + int spacing = width - int(temp.length()); + while (spacing-- > 0) + out << ' '; + + if (right) { + if (redden) out << "\033[31m"; + out << str; + if (redden) out << "\033[0m"; + } +} + +} // namespace ledger + +#endif // _UNISTRING_H |