wxWidgets/include/wx/stringops.h

///////////////////////////////////////////////////////////////////////////////
// Name:        wx/stringops.h
// Purpose:     implementation of wxString primitive operations
// Author:      Vaclav Slavik
// Modified by:
// Created:     2007-04-16
// Copyright:   (c) 2007 REA Elektronik GmbH
// Licence:     wxWindows licence
///////////////////////////////////////////////////////////////////////////////

#ifndef _WX_WXSTRINGOPS_H__
#define _WX_WXSTRINGOPS_H__

#include "wx/chartype.h"
#include "wx/stringimpl.h"
#include "wx/unichar.h"
#include "wx/buffer.h"

// This header contains wxStringOperations "namespace" class that implements
// elementary operations on string data as static methods; wxString methods and
// iterators are implemented in terms of it. Two implementations are available,
// one for UTF-8 encoded char* string and one for "raw" wchar_t* strings (or
// char* in ANSI build).

// FIXME-UTF8: only wchar after we remove ANSI build
#if wxUSE_UNICODE_WCHAR || !wxUSE_UNICODE
struct WXDLLIMPEXP_BASE wxStringOperationsWchar
{
    // All iterator helpers below are thin wrappers over the iterator's own
    // arithmetic: this implementation advances element by element of the
    // underlying sequence.

    // advances the iterator by one position
    template <typename Iterator>
    static void IncIter(Iterator& i)
    {
        ++i;
    }

    // moves the iterator back by one position
    template <typename Iterator>
    static void DecIter(Iterator& i)
    {
        --i;
    }

    // returns a copy of the iterator offset by n positions (n may be
    // negative); the argument itself is not modified
    template <typename Iterator>
    static Iterator AddToIter(const Iterator& i, ptrdiff_t n)
    {
        return i + n;
    }

    // returns i1 - i2, i.e. the signed distance between the two iterators
    template <typename Iterator>
    static ptrdiff_t DiffIters(const Iterator& i1, const Iterator& i2)
    {
        return i1 - i2;
    }

#if wxUSE_UNICODE_UTF16
    // Small fixed-size buffer holding the UTF-16 encoding of one character.
    struct Utf16CharBuffer
    {
        // The array is intentionally left uninitialized here: EncodeChar()
        // is the only function creating objects of this class and it is
        // responsible for filling the data in.

        wchar_t data[3];

        operator const wchar_t*() const { return data; }
    };

    // encodes the character as UTF-16 (defined out of line)
    static Utf16CharBuffer EncodeChar(const wxUniChar& ch);

    // returns a buffer for n copies of ch (defined out of line)
    static wxWCharBuffer EncodeNChars(size_t n, const wxUniChar& ch);

    // true unless ch is a supplementary character
    static bool IsSingleCodeUnitCharacter(const wxUniChar& ch)
    {
        return !ch.IsSupplementary();
    }
#else
    // Small fixed-size buffer holding one character in the internal
    // representation, followed by the terminating NUL.
    struct SingleCharBuffer
    {
        wxChar data[2];

        operator const wxChar*() const { return data; }
    };

    // converts the character to the form used in the internal
    // representation: a single wxChar followed by NUL
    static SingleCharBuffer EncodeChar(const wxUniChar& ch)
    {
        SingleCharBuffer encoded;

        encoded.data[0] = (wxChar)ch;
        encoded.data[1] = 0;    // NUL-terminate

        return encoded;
    }

    // returns a buffer for n copies of ch (defined out of line)
    static wxWxCharBuffer EncodeNChars(size_t n, const wxUniChar& ch);

    // in this configuration every character is reported as a single code unit
    static bool IsSingleCodeUnitCharacter(const wxUniChar&)
    {
        return true;
    }
#endif

    // returns the character at the given position of the string data
    static wxUniChar DecodeChar(const wxStringImpl::const_iterator& i)
    {
        return *i;
    }
};
#endif // wxUSE_UNICODE_WCHAR || !wxUSE_UNICODE


#if wxUSE_UNICODE_UTF8
struct WXDLLIMPEXP_BASE wxStringOperationsUtf8
{
    // checks correctness of UTF-8 sequence
    static bool IsValidUtf8String(const char *c,
                                  size_t len = wxStringImpl::npos);
    static bool IsValidUtf8LeadByte(unsigned char c)
    {
        return (c <= 0x7F) || (c >= 0xC2 && c <= 0xF4);
    }

    // table of offsets to skip forward when iterating over UTF-8 sequence
    static const unsigned char ms_utf8IterTable[256];


    template<typename Iterator>
    static void IncIter(Iterator& i)
    {
        wxASSERT( IsValidUtf8LeadByte(*i) );
        i += ms_utf8IterTable[(unsigned char)*i];
    }

    template<typename Iterator>
    static void DecIter(Iterator& i)
    {
        // Non-lead bytes are all in the 0x80..0xBF range (i.e. 10xxxxxx in
        // binary), so we just have to go back until we hit a byte that is
        // either < 0x80 (i.e. 0xxxxxxx in binary) or 0xC0..0xFF (11xxxxxx in
        // binary; this includes some invalid values, but we can ignore it
        // here, because we assume valid UTF-8 input for the purpose of
        // efficient implementation).
        --i;
        while ( ((*i) & 0xC0) == 0x80 /* 2 highest bits are '10' */ )
            --i;
    }

    template<typename Iterator>
    static Iterator AddToIter(const Iterator& i, ptrdiff_t n)
    {
        Iterator out(i);

        if ( n > 0 )
        {
            for ( ptrdiff_t j = 0; j < n; ++j )
                IncIter(out);
        }
        else if ( n < 0 )
        {
            for ( ptrdiff_t j = 0; j > n; --j )
                DecIter(out);
        }

        return out;
    }

    template<typename Iterator>
    static ptrdiff_t DiffIters(Iterator i1, Iterator i2)
    {
        ptrdiff_t dist = 0;

        if ( i1 < i2 )
        {
            while ( i1 != i2 )
            {
                IncIter(i1);
                dist--;
            }
        }
        else if ( i2 < i1 )
        {
            while ( i2 != i1 )
            {
                IncIter(i2);
                dist++;
            }
        }

        return dist;
    }

    static bool IsSingleCodeUnitCharacter(const wxUniChar& ch)
        { return ch.IsAscii(); }

    // encodes the character as UTF-8:
    typedef wxUniChar::Utf8CharBuffer Utf8CharBuffer;
    static Utf8CharBuffer EncodeChar(const wxUniChar& ch)
        { return ch.AsUTF8(); }

    // returns n copies of ch encoded in UTF-8 string
    static wxCharBuffer EncodeNChars(size_t n, const wxUniChar& ch);

    // returns the length of UTF-8 encoding of the character with lead byte 'c'
    static size_t GetUtf8CharLength(char c)
    {
        wxASSERT( IsValidUtf8LeadByte(c) );
        return ms_utf8IterTable[(unsigned char)c];
    }

    // decodes single UTF-8 character from UTF-8 string
    static wxUniChar DecodeChar(wxStringImpl::const_iterator i)
    {
        if ( (unsigned char)*i < 0x80 )
            return (int)*i;
        return DecodeNonAsciiChar(i);
    }

private:
    static wxUniChar DecodeNonAsciiChar(wxStringImpl::const_iterator i);
};
#endif // wxUSE_UNICODE_UTF8


// wxStringOperations is the name the rest of the code uses: it aliases the
// UTF-8 implementation when wxUSE_UNICODE_UTF8 is set and the wchar_t/ANSI
// one otherwise.
#if wxUSE_UNICODE_UTF8
typedef wxStringOperationsUtf8 wxStringOperations;
#else
typedef wxStringOperationsWchar wxStringOperations;
#endif

#endif  // _WX_WXSTRINGOPS_H__
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`///////////////////////////////////////////////////////////////////////////////`
			`// Name: wx/stringops.h`
			`// Purpose: implementation of wxString primitive operations`
			`// Author: Vaclav Slavik`
			`// Modified by:`
			`// Created: 2007-04-16`
			`// Copyright: (c) 2007 REA Elektronik GmbH`
			`// Licence: wxWindows licence`
			`///////////////////////////////////////////////////////////////////////////////`

			`#ifndef _WX_WXSTRINGOPS_H__`
			`#define _WX_WXSTRINGOPS_H__`

			`#include "wx/chartype.h"`
			`#include "wx/stringimpl.h"`
			`#include "wx/unichar.h"`
added missing #include "wx/buffer.h" git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45704 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-28 03:56:45 -04:00			`#include "wx/buffer.h"`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00
			`// This header contains wxStringOperations "namespace" class that implements`
			`// elementary operations on string data as static methods; wxString methods and`
			`// iterators are implemented in terms of it. Two implementations are available,`
			`// one for UTF-8 encoded char* string and one for "raw" wchar_t* strings (or`
			`// char* in ANSI build).`

			`// FIXME-UTF8: only wchar after we remove ANSI build`
			`#if wxUSE_UNICODE_WCHAR || !wxUSE_UNICODE`
			`struct WXDLLIMPEXP_BASE wxStringOperationsWchar`
			`{`
			`// moves the iterator to the next Unicode character`
make wxStringOperationsWchar methods templates too to be able to reuse them with char pointers (and for consistency with wxStringOperationsUtf8) git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@59795 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2009-03-23 19:11:55 -04:00			`template <typename Iterator>`
			`static void IncIter(Iterator& i) { ++i; }`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00
			`// moves the iterator to the previous Unicode character`
make wxStringOperationsWchar methods templates too to be able to reuse them with char pointers (and for consistency with wxStringOperationsUtf8) git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@59795 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2009-03-23 19:11:55 -04:00			`template <typename Iterator>`
			`static void DecIter(Iterator& i) { --i; }`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00
			`// moves the iterator by n Unicode characters`
make wxStringOperationsWchar methods templates too to be able to reuse them with char pointers (and for consistency with wxStringOperationsUtf8) git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@59795 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2009-03-23 19:11:55 -04:00			`template <typename Iterator>`
			`static Iterator AddToIter(const Iterator& i, ptrdiff_t n)`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`{ return i + n; }`

			`// returns distance of the two iterators in Unicode characters`
make wxStringOperationsWchar methods templates too to be able to reuse them with char pointers (and for consistency with wxStringOperationsUtf8) git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@59795 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2009-03-23 19:11:55 -04:00			`template <typename Iterator>`
			`static ptrdiff_t DiffIters(const Iterator& i1, const Iterator& i2)`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`{ return i1 - i2; }`

Better handling of supplementary wxUniChar values in some of wxString methods On MSW, the Unicode code point is now properly encoded as UTF-16 when assigned or appended to a wxString. Closes #11827 2017-04-20 15:32:32 -04:00			`#if wxUSE_UNICODE_UTF16`
No changes, just fix a typo in a recently added comment 2017-06-21 13:07:13 -04:00			`// encodes the characters as UTF-16:`
Better handling of supplementary wxUniChar values in some of wxString methods On MSW, the Unicode code point is now properly encoded as UTF-16 when assigned or appended to a wxString. Closes #11827 2017-04-20 15:32:32 -04:00			`struct Utf16CharBuffer`
			`{`
Fix initialization of SingleCharBuffer and Utf16CharBuffer data Don't do it at all in the ctor, initializing just the first element of the array is useless as it's overwritten by EncodeChar() anyhow, so just leave the task of NUL-terminating the data to this function as well. It might be even better to just have a ctor taking wxUniChar in these classes instead and make EncodeChar() a trivial wrapper around it, but for now just apply the minimal fix to repair the test breakage after the last commit. See https://github.com/wxWidgets/wxWidgets/pull/467#issuecomment-310384946 2017-06-22 09:51:49 -04:00			`// Notice that data is left uninitialized, it is filled by EncodeChar()`
			`// which is the only function creating objects of this class.`
Avoid MSVC warning about correctly default-initializing arrays Don't rely on default array initialization, not only it may not work with some really old compilers (which is actually not that important as we don't seem to rely on these arrays being initialized, in fact), but it results in warnings about working correctly (sic) from MSVC in versions from 9 up to 12 inclusive. See https://github.com/wxWidgets/wxWidgets/pull/467#issuecomment-310193867 2017-06-21 19:47:59 -04:00
Better handling of supplementary wxUniChar values in some of wxString methods On MSW, the Unicode code point is now properly encoded as UTF-16 when assigned or appended to a wxString. Closes #11827 2017-04-20 15:32:32 -04:00			`wchar_t data[3];`
			`operator const wchar_t*() const { return data; }`
			`};`
			`static Utf16CharBuffer EncodeChar(const wxUniChar& ch);`
			`static wxWCharBuffer EncodeNChars(size_t n, const wxUniChar& ch);`
			`static bool IsSingleCodeUnitCharacter(const wxUniChar& ch)`
			`{ return !ch.IsSupplementary(); }`
			`#else`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`// encodes the character to a form used to represent it in internal`
Better handling of supplementary wxUniChar values in some of wxString methods On MSW, the Unicode code point is now properly encoded as UTF-16 when assigned or appended to a wxString. Closes #11827 2017-04-20 15:32:32 -04:00			`// representation`
			`struct SingleCharBuffer`
			`{`
			`wxChar data[2];`
			`operator const wxChar*() const { return data; }`
			`};`
			`static SingleCharBuffer EncodeChar(const wxUniChar& ch)`
			`{`
			`SingleCharBuffer buf;`
			`buf.data[0] = (wxChar)ch;`
Fix initialization of SingleCharBuffer and Utf16CharBuffer data Don't do it at all in the ctor, initializing just the first element of the array is useless as it's overwritten by EncodeChar() anyhow, so just leave the task of NUL-terminating the data to this function as well. It might be even better to just have a ctor taking wxUniChar in these classes instead and make EncodeChar() a trivial wrapper around it, but for now just apply the minimal fix to repair the test breakage after the last commit. See https://github.com/wxWidgets/wxWidgets/pull/467#issuecomment-310384946 2017-06-22 09:51:49 -04:00			`buf.data[1] = 0;`
Better handling of supplementary wxUniChar values in some of wxString methods On MSW, the Unicode code point is now properly encoded as UTF-16 when assigned or appended to a wxString. Closes #11827 2017-04-20 15:32:32 -04:00			`return buf;`
			`}`
			`static wxWxCharBuffer EncodeNChars(size_t n, const wxUniChar& ch);`
			`static bool IsSingleCodeUnitCharacter(const wxUniChar&) { return true; }`
			`#endif`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00
			`static wxUniChar DecodeChar(const wxStringImpl::const_iterator& i)`
			`{ return *i; }`
			`};`
			`#endif // wxUSE_UNICODE_WCHAR || !wxUSE_UNICODE`


			`#if wxUSE_UNICODE_UTF8`
			`struct WXDLLIMPEXP_BASE wxStringOperationsUtf8`
			`{`
			`// checks correctness of UTF-8 sequence`
added code for optimized handling of UTF-8 locales: some string operations are more efficient under it and it's possible to completely compile-out support for other locales if the target system is known to only use UTF-8 locales git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45782 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-05-03 07:05:04 -04:00			`static bool IsValidUtf8String(const char *c,`
			`size_t len = wxStringImpl::npos);`
first round of debug/release merge: introduce wxDEBUG_LEVEL, for now defined as 1 if __WXDEBUG__ is defined, i.e. no real changes; don't use __WXDEBUG__ in the headers to keep debug and release builds ABI-compatible; add functions to customize or disable asserts handling git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@59711 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2009-03-21 19:36:37 -04:00			`static bool IsValidUtf8LeadByte(unsigned char c)`
			`{`
			`return (c <= 0x7F) || (c >= 0xC2 && c <= 0xF4);`
			`}`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00
			`// table of offsets to skip forward when iterating over UTF-8 sequence`
made UTF-8 tables const git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@48322 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-08-22 05:30:40 -04:00			`static const unsigned char ms_utf8IterTable[256];`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00

			`template<typename Iterator>`
			`static void IncIter(Iterator& i)`
			`{`
			`wxASSERT( IsValidUtf8LeadByte(*i) );`
			`i += ms_utf8IterTable[(unsigned char)*i];`
			`}`

			`template<typename Iterator>`
			`static void DecIter(Iterator& i)`
			`{`
			`// Non-lead bytes are all in the 0x80..0xBF range (i.e. 10xxxxxx in`
			`// binary), so we just have to go back until we hit a byte that is`
			`// either < 0x80 (i.e. 0xxxxxxx in binary) or 0xC0..0xFF (11xxxxxx in`
			`// binary; this includes some invalid values, but we can ignore it`
			`// here, because we assume valid UTF-8 input for the purpose of`
			`// efficient implementation).`
			`--i;`
			`while ( ((*i) & 0xC0) == 0x80 /* 2 highest bits are '10' */ )`
			`--i;`
			`}`

			`template<typename Iterator>`
only provide ptrdiff_t versions of verious operator+/- working with iterators instead of overloads for both int and size_t: this seems to be enough and the existing overloads were not enough for 64 bit builds where expressions such as iter+(ptr2-ptr1) didn't compile without extra casts git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@51053 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2008-01-06 17:27:01 -05:00			`static Iterator AddToIter(const Iterator& i, ptrdiff_t n)`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`{`
			`Iterator out(i);`

			`if ( n > 0 )`
			`{`
only provide ptrdiff_t versions of verious operator+/- working with iterators instead of overloads for both int and size_t: this seems to be enough and the existing overloads were not enough for 64 bit builds where expressions such as iter+(ptr2-ptr1) didn't compile without extra casts git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@51053 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2008-01-06 17:27:01 -05:00			`for ( ptrdiff_t j = 0; j < n; ++j )`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`IncIter(out);`
			`}`
			`else if ( n < 0 )`
			`{`
only provide ptrdiff_t versions of verious operator+/- working with iterators instead of overloads for both int and size_t: this seems to be enough and the existing overloads were not enough for 64 bit builds where expressions such as iter+(ptr2-ptr1) didn't compile without extra casts git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@51053 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2008-01-06 17:27:01 -05:00			`for ( ptrdiff_t j = 0; j > n; --j )`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`DecIter(out);`
			`}`

			`return out;`
			`}`

			`template<typename Iterator>`
only provide ptrdiff_t versions of verious operator+/- working with iterators instead of overloads for both int and size_t: this seems to be enough and the existing overloads were not enough for 64 bit builds where expressions such as iter+(ptr2-ptr1) didn't compile without extra casts git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@51053 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2008-01-06 17:27:01 -05:00			`static ptrdiff_t DiffIters(Iterator i1, Iterator i2)`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`{`
only provide ptrdiff_t versions of verious operator+/- working with iterators instead of overloads for both int and size_t: this seems to be enough and the existing overloads were not enough for 64 bit builds where expressions such as iter+(ptr2-ptr1) didn't compile without extra casts git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@51053 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2008-01-06 17:27:01 -05:00			`ptrdiff_t dist = 0;`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00
			`if ( i1 < i2 )`
			`{`
			`while ( i1 != i2 )`
			`{`
			`IncIter(i1);`
			`dist--;`
			`}`
			`}`
			`else if ( i2 < i1 )`
			`{`
			`while ( i2 != i1 )`
			`{`
			`IncIter(i2);`
			`dist++;`
			`}`
			`}`

			`return dist;`
			`}`

Better handling of supplementary wxUniChar values in some of wxString methods On MSW, the Unicode code point is now properly encoded as UTF-16 when assigned or appended to a wxString. Closes #11827 2017-04-20 15:32:32 -04:00			`static bool IsSingleCodeUnitCharacter(const wxUniChar& ch)`
			`{ return ch.IsAscii(); }`

moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`// encodes the character as UTF-8:`
added wxUniChar::AsUTF8() for easy conversion in UTF8 build git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@46376 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-06-08 16:17:34 -04:00			`typedef wxUniChar::Utf8CharBuffer Utf8CharBuffer;`
			`static Utf8CharBuffer EncodeChar(const wxUniChar& ch)`
			`{ return ch.AsUTF8(); }`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00
			`// returns n copies of ch encoded in UTF-8 string`
			`static wxCharBuffer EncodeNChars(size_t n, const wxUniChar& ch);`

			`// returns the length of UTF-8 encoding of the character with lead byte 'c'`
			`static size_t GetUtf8CharLength(char c)`
			`{`
			`wxASSERT( IsValidUtf8LeadByte(c) );`
			`return ms_utf8IterTable[(unsigned char)c];`
			`}`

			`// decodes single UTF-8 character from UTF-8 string`
optimize wxStringOperationsUtf8::DecodeChar() for the ASCII case git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@48321 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-08-22 05:24:56 -04:00			`static wxUniChar DecodeChar(wxStringImpl::const_iterator i)`
			`{`
			`if ( (unsigned char)*i < 0x80 )`
			`return (int)*i;`
			`return DecodeNonAsciiChar(i);`
			`}`

			`private:`
			`static wxUniChar DecodeNonAsciiChar(wxStringImpl::const_iterator i);`
moved primitive string and string iterators operations to stringops.h/cpp files to make wxString code easier to read git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45533 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775 2007-04-19 06:05:55 -04:00			`};`
			`#endif // wxUSE_UNICODE_UTF8`


			`#if wxUSE_UNICODE_UTF8`
			`typedef wxStringOperationsUtf8 wxStringOperations;`
			`#else`
			`typedef wxStringOperationsWchar wxStringOperations;`
			`#endif`

			`#endif // _WX_WXSTRINGOPS_H_`