| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380 | ////  Copyright (c) 2009-2011 Artyom Beilis (Tonkikh)////  Distributed under the Boost Software License, Version 1.0. (See//  accompanying file LICENSE_1_0.txt or copy at//  http://www.boost.org/LICENSE_1_0.txt)//#ifndef BOOST_LOCALE_CONVERTER_HPP_INCLUDED#define BOOST_LOCALE_CONVERTER_HPP_INCLUDED#include <boost/locale/config.hpp>#ifdef BOOST_MSVC#  pragma warning(push)#  pragma warning(disable : 4275 4251 4231 4660)#endif#include <locale>namespace boost {    namespace locale {                ///        /// \defgroup convert Text Conversions         ///        ///  This module provides various function for string manipulation like Unicode normalization, case conversion etc.        /// @{        ///                ///        /// \brief This class provides base flags for text manipulation. It is used as base for converter facet.        ///        class converter_base {        public:            ///            /// The flag used for facet - the type of operation to perform            ///            typedef enum {                normalization,  ///< Apply Unicode normalization on the text                upper_case,     ///< Convert text to upper case                lower_case,     ///< Convert text to lower case                case_folding,   ///< Fold case in the text                title_case      ///< Convert text to title case            } conversion_type;        };        template<typename CharType>        class converter;        #ifdef BOOST_LOCALE_DOXYGEN        ///        /// \brief The facet that implements text manipulation        ///        /// It is used to performs text conversion operations defined by \ref conversion_type. It is specialized        /// for four types of characters \c char, \c wchar_t, \c char16_t, \c char32_t        ///        template<typename Char>        class BOOST_LOCALE_DECL converter: public converter_base, public std::locale::facet {        public:            /// Locale identification            static std::locale::id id;            /// Standard constructor            converter(size_t refs = 0) : std::locale::facet(refs)            {            }            ///            /// Convert text in range [\a begin, \a end) according to conversion method \a how. Parameter            /// \a flags is used for specification of normalization method like nfd, nfc etc.            ///            virtual std::basic_string<Char> convert(conversion_type how,Char const *begin,Char const *end,int flags = 0) const = 0;#if defined (__SUNPRO_CC) && defined (_RWSTD_VER)            std::locale::id& __get_id (void) const { return id; }#endif        };        #else        template<>        class BOOST_LOCALE_DECL converter<char> : public converter_base, public std::locale::facet {        public:            static std::locale::id id;            converter(size_t refs = 0) : std::locale::facet(refs)            {            }            virtual std::string convert(conversion_type how,char const *begin,char const *end,int flags = 0) const = 0;#if defined (__SUNPRO_CC) && defined (_RWSTD_VER)            std::locale::id& __get_id (void) const { return id; }#endif        };        template<>        class BOOST_LOCALE_DECL converter<wchar_t> : public converter_base, public std::locale::facet {        public:            static std::locale::id id;            converter(size_t refs = 0) : std::locale::facet(refs)            {            }             virtual std::wstring convert(conversion_type how,wchar_t const *begin,wchar_t const *end,int flags = 0) const = 0;#if defined (__SUNPRO_CC) && defined (_RWSTD_VER)            std::locale::id& __get_id (void) const { return id; }#endif        };        #ifdef BOOST_HAS_CHAR16_T        template<>        class BOOST_LOCALE_DECL converter<char16_t> : public converter_base, public std::locale::facet {        public:            static std::locale::id id;            converter(size_t refs = 0) : std::locale::facet(refs)            {            }            virtual std::u16string convert(conversion_type how,char16_t const *begin,char16_t const *end,int flags = 0) const = 0; #if defined (__SUNPRO_CC) && defined (_RWSTD_VER)            std::locale::id& __get_id (void) const { return id; }#endif        };        #endif        #ifdef BOOST_HAS_CHAR32_T        template<>        class BOOST_LOCALE_DECL converter<char32_t> : public converter_base, public std::locale::facet {        public:            static std::locale::id id;            converter(size_t refs = 0) : std::locale::facet(refs)            {            }            virtual std::u32string convert(conversion_type how,char32_t const *begin,char32_t const *end,int flags = 0) const = 0;#if defined (__SUNPRO_CC) && defined (_RWSTD_VER)            std::locale::id& __get_id (void) const { return id; }#endif        };        #endif        #endif        ///        /// The type that defined <a href="http://unicode.org/reports/tr15/#Norm_Forms">normalization form</a>        ///        typedef enum {            norm_nfd,   ///< Canonical decomposition            norm_nfc,   ///< Canonical decomposition followed by canonical composition            norm_nfkd,  ///< Compatibility decomposition            norm_nfkc,  ///< Compatibility decomposition followed by canonical composition.            norm_default = norm_nfc, ///< Default normalization - canonical decomposition followed by canonical composition        } norm_type;               ///        /// Normalize Unicode string \a str according to \ref norm_type "normalization form" \a n        ///        /// Note: This function receives only Unicode strings, i.e.: UTF-8, UTF-16 or UTF-32. It does not take        /// in account the locale encoding, because Unicode decomposition and composition are meaningless outside         /// of a Unicode character set.        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> normalize(std::basic_string<CharType> const &str,norm_type n=norm_default,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::normalization,str.data(),str.data() + str.size(),n);        }        ///        /// Normalize NUL terminated Unicode string \a str according to \ref norm_type "normalization form" \a n        ///        /// Note: This function receives only Unicode strings, i.e.: UTF-8, UTF-16 or UTF-32. It does not take        /// in account the locale encoding, because Unicode decomposition and composition are meaningless outside         /// of a Unicode character set.        ///         /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> normalize(CharType const *str,norm_type n=norm_default,std::locale const &loc=std::locale())        {            CharType const *end=str;            while(*end)                end++;            return std::use_facet<converter<CharType> >(loc).convert(converter_base::normalization,str,end,n);        }                ///        /// Normalize Unicode string in range [begin,end) according to \ref norm_type "normalization form" \a n        ///        /// Note: This function receives only Unicode strings, i.e.: UTF-8, UTF-16 or UTF-32. It does not take        /// in account the locale encoding, because Unicode decomposition and composition are meaningless outside         /// of a Unicode character set.        ///         /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> normalize(  CharType const *begin,                                                CharType const *end,                                                norm_type n=norm_default,                                                std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::normalization,begin,end,n);        }        ///////////////////////////////////////////////////                ///        /// Convert a string \a str to upper case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_upper(std::basic_string<CharType> const &str,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::upper_case,str.data(),str.data()+str.size());        }                ///        /// Convert a NUL terminated string \a str to upper case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_upper(CharType const *str,std::locale const &loc=std::locale())        {            CharType const *end=str;            while(*end)                end++;            return std::use_facet<converter<CharType> >(loc).convert(converter_base::upper_case,str,end);        }                ///        /// Convert a string in range [begin,end) to upper case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_upper(CharType const *begin,CharType const *end,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::upper_case,begin,end);        }        ///////////////////////////////////////////////////                ///        /// Convert a string \a str to lower case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_lower(std::basic_string<CharType> const &str,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::lower_case,str.data(),str.data()+str.size());        }                ///        /// Convert a NUL terminated string \a str to lower case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_lower(CharType const *str,std::locale const &loc=std::locale())        {            CharType const *end=str;            while(*end)                end++;            return std::use_facet<converter<CharType> >(loc).convert(converter_base::lower_case,str,end);        }                ///        /// Convert a string in range [begin,end) to lower case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_lower(CharType const *begin,CharType const *end,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::lower_case,begin,end);        }        ///////////////////////////////////////////////////                ///        /// Convert a string \a str to title case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_title(std::basic_string<CharType> const &str,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::title_case,str.data(),str.data()+str.size());        }                ///        /// Convert a NUL terminated string \a str to title case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_title(CharType const *str,std::locale const &loc=std::locale())        {            CharType const *end=str;            while(*end)                end++;            return std::use_facet<converter<CharType> >(loc).convert(converter_base::title_case,str,end);        }                ///        /// Convert a string in range [begin,end) to title case according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> to_title(CharType const *begin,CharType const *end,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::title_case,begin,end);        }        ///////////////////////////////////////////////////                ///        /// Fold case of a string \a str according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> fold_case(std::basic_string<CharType> const &str,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::case_folding,str.data(),str.data()+str.size());        }                ///        /// Fold case of a NUL terminated string \a str according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> fold_case(CharType const *str,std::locale const &loc=std::locale())        {            CharType const *end=str;            while(*end)                end++;            return std::use_facet<converter<CharType> >(loc).convert(converter_base::case_folding,str,end);        }                ///        /// Fold case of a string in range [begin,end) according to locale \a loc        ///        /// \note throws std::bad_cast if loc does not have \ref converter facet installed        ///         template<typename CharType>        std::basic_string<CharType> fold_case(CharType const *begin,CharType const *end,std::locale const &loc=std::locale())        {            return std::use_facet<converter<CharType> >(loc).convert(converter_base::case_folding,begin,end);        }        ///        ///@}        ///    } // locale} // boost#ifdef BOOST_MSVC#pragma warning(pop)#endif#endif////// \example conversions.cpp////// Example of using various text conversion functions.////// \example wconversions.cpp////// Example of using various text conversion functions with wide strings.///// vim: tabstop=4 expandtab shiftwidth=4 softtabstop=4
 |