//%2005//////////////////////////////////////////////////////////////////////// // // Copyright (c) 2000, 2001, 2002 BMC Software; Hewlett-Packard Development // Company, L.P.; IBM Corp.; The Open Group; Tivoli Systems. // Copyright (c) 2003 BMC Software; Hewlett-Packard Development Company, L.P.; // IBM Corp.; EMC Corporation, The Open Group. // Copyright (c) 2004 BMC Software; Hewlett-Packard Development Company, L.P.; // IBM Corp.; EMC Corporation; VERITAS Software Corporation; The Open Group. // Copyright (c) 2005 Hewlett-Packard Development Company, L.P.; IBM Corp.; // EMC Corporation; VERITAS Software Corporation; The Open Group. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to // deal in the Software without restriction, including without limitation the // rights to use, copy, modify, merge, publish, distribute, sublicense, and/or // sell copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // THE ABOVE COPYRIGHT NOTICE AND THIS PERMISSION NOTICE SHALL BE INCLUDED IN // ALL COPIES OR SUBSTANTIAL PORTIONS OF THE SOFTWARE. THE SOFTWARE IS PROVIDED // "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT // LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR // PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT // HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN // ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION // WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. // //============================================================================== // // Author: Dave Rosckes (rosckes@us.ibm.com) // // Modified By: Yi Zhou Hewlett-Packard Company (yi.zhou@hp.com) // //%///////////////////////////////////////////////////////////////////////////// #ifndef Pegasus_CommonUTF_h #define Pegasus_CommonUTF_h #include #include #include #include #ifdef PEGASUS_USE_EXPERIMENTAL_INTERFACES PEGASUS_NAMESPACE_BEGIN #define FIRST_HIGH_SURROGATE (Uint32)0xD800 #define LAST_HIGH_SURROGATE (Uint32)0xDBFF #define FIRST_LOW_SURROGATE (Uint32)0xDC00 #define LAST_LOW_SURROGATE (Uint32)0xDFFF #define REPLACEMENT_CHARACTER (Uint32)0x0000FFFD #define MAX_BYTE (Uint32)0x0000FFFF #define MAX_UTF16 (Uint32)0x0010FFFF static const Uint32 halfBase = 0x0010000UL; static const Uint32 halfMask = 0x3FFUL; static const int halfShift = 10; static const Uint8 firstByteMark[7] = { 0x00, 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC }; static const Uint32 offsetsFromUTF8[6] = { 0x00000000UL, 0x00003080UL, 0x000E2080UL, 0x03C82080UL, 0xFA082080UL, 0x82082080UL }; static const char trailingBytesForUTF8[256] = { 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, 3,3,3,3,3,3,3,3,4,4,4,4,5,5,5,5 }; #define UTF_8_COUNT_TRAIL_BYTES(leadByte) (trailingBytesForUTF8[(Uint8)leadByte]) #define UTF8_NEXT(s, i) { \ (i)=((i) + UTF_8_COUNT_TRAIL_BYTES((s)[(i)]) + 1); \ } PEGASUS_COMMON_LINKAGE Boolean isValid_U8(const Uint8 *src,int size); PEGASUS_COMMON_LINKAGE int UTF16toUTF8( const Uint16** srcHead, const Uint16* srcEnd, Uint8** tgtHead, Uint8* tgtEnd); PEGASUS_COMMON_LINKAGE int UTF8toUTF16( const Uint8** srcHead, const Uint8* srcEnd, Uint16** tgtHead, Uint16* tgtEnd); PEGASUS_COMMON_LINKAGE Boolean isUTF8Aux(const char*); inline Boolean isUTF8(const char* c) { return (unsigned int)c[0] < 128 || isUTF8Aux(c); } PEGASUS_COMMON_LINKAGE Boolean isUTF8Str(const char*); /** Escape all characters above 7-bit ASCII. @param String: The string to be escaped Insert text here. @return String: The escaped string. */ PEGASUS_COMMON_LINKAGE String escapeStringEncoder(const String& Str); /** decode string returned from escapeString Encoder. @param String: The string to be decoded. @return String: The decoded string. Prereq: Only the return string from the escapeStringEncoder can be used as input. */ PEGASUS_COMMON_LINKAGE String escapeStringDecoder(const String& Str); /** The InitializeICU class loads and initializes data items that are required internally by various ICU functions. It makes sure that ICU function u_init is only called once by a process. A module which is using ICU APIs needs to call InitializeICU::initICUSuccessful first before it calls other ICU APIs. If InitializeICU::initICUSuccessful is failed, the module should not call other ICU APIs. */ #ifdef PEGASUS_HAS_ICU class PEGASUS_COMMON_LINKAGE InitializeICU { public: /** Determines if ICU initialization is successful. @return true, if u_init is called and success false otherwise */ static Boolean initICUSuccessful(); private: static Boolean _initAttempted; static Boolean _initSuccessful; static Mutex _initMutex; }; #endif PEGASUS_NAMESPACE_END #endif // PEGASUS_USE_EXPERIMENTAL_INTERFACES #endif