version 1.1.2.1, 2003/08/13 19:39:50
|
version 1.18, 2006/11/07 21:30:36
|
|
|
//%///////////////////////////////////////////////////////////////////////////// |
//%2006//////////////////////////////////////////////////////////////////////// |
// | // |
// Copyright (c) 2003 BMC Software, Hewlett-Packard Company, IBM, |
// Copyright (c) 2000, 2001, 2002 BMC Software; Hewlett-Packard Development |
// The Open Group, Tivoli Systems |
// Company, L.P.; IBM Corp.; The Open Group; Tivoli Systems. |
|
// Copyright (c) 2003 BMC Software; Hewlett-Packard Development Company, L.P.; |
|
// IBM Corp.; EMC Corporation, The Open Group. |
|
// Copyright (c) 2004 BMC Software; Hewlett-Packard Development Company, L.P.; |
|
// IBM Corp.; EMC Corporation; VERITAS Software Corporation; The Open Group. |
|
// Copyright (c) 2005 Hewlett-Packard Development Company, L.P.; IBM Corp.; |
|
// EMC Corporation; VERITAS Software Corporation; The Open Group. |
|
// Copyright (c) 2006 Hewlett-Packard Development Company, L.P.; IBM Corp.; |
|
// EMC Corporation; Symantec Corporation; The Open Group. |
// | // |
// Permission is hereby granted, free of charge, to any person obtaining a copy | // Permission is hereby granted, free of charge, to any person obtaining a copy |
// of this software and associated documentation files (the "Software"), to | // of this software and associated documentation files (the "Software"), to |
|
|
// | // |
//============================================================================== | //============================================================================== |
// | // |
// Author: Dave Rosckes (rosckes@us.ibm.com) |
|
// |
|
// |
|
//%///////////////////////////////////////////////////////////////////////////// | //%///////////////////////////////////////////////////////////////////////////// |
| |
#ifndef Pegasus_CommonUTF_h | #ifndef Pegasus_CommonUTF_h |
#define Pegasus_CommonUTF_h | #define Pegasus_CommonUTF_h |
#include <Pegasus/Common/Config.h> | #include <Pegasus/Common/Config.h> |
|
#include <Pegasus/Common/Linkage.h> |
|
#include <Pegasus/Common/String.h> |
|
#include <Pegasus/Common/Mutex.h> |
| |
PEGASUS_NAMESPACE_BEGIN | PEGASUS_NAMESPACE_BEGIN |
| |
|
|
#define MAX_BYTE (Uint32)0x0000FFFF | #define MAX_BYTE (Uint32)0x0000FFFF |
#define MAX_UTF16 (Uint32)0x0010FFFF | #define MAX_UTF16 (Uint32)0x0010FFFF |
| |
static const Uint32 halfBase = 0x0010000UL; |
PEGASUS_COMMON_LINKAGE extern const Uint32 halfBase; |
static const Uint32 halfMask = 0x3FFUL; |
PEGASUS_COMMON_LINKAGE extern const Uint32 halfMask; |
static const int halfShift = 10; |
PEGASUS_COMMON_LINKAGE extern const int halfShift; |
static const Uint8 firstByteMark[7] = { 0x00, 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC }; |
PEGASUS_COMMON_LINKAGE extern const Uint8 firstByteMark[]; |
|
|
static const Uint32 offsetsFromUTF8[6] = { 0x00000000UL, 0x00003080UL, 0x000E2080UL, |
PEGASUS_COMMON_LINKAGE extern const Uint32 offsetsFromUTF8[]; |
0x03C82080UL, 0xFA082080UL, 0x82082080UL }; |
|
|
|
static const char trailingBytesForUTF8[256] = { |
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
|
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, |
|
2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, 3,3,3,3,3,3,3,3,4,4,4,4,5,5,5,5 |
|
}; |
|
| |
#define UTF_8_COUNT_TRAIL_BYTES(leadByte) (trailingBytesForUTF8[(Uint8)leadByte]) |
PEGASUS_COMMON_LINKAGE extern const char trailingBytesForUTF8[]; |
| |
#define UTF_8_MASK_LEAD_BYTE(leadByte, countTrailBytes) ((leadByte)&=(1<<(6-(countTrailBytes)))-1) |
#define UTF_8_COUNT_TRAIL_BYTES(leadByte) \ |
|
(trailingBytesForUTF8[(Uint8)leadByte]) |
| |
#define UTF8_NEXT(s, i, c) { \ |
#define UTF8_NEXT(s, i) { \ |
(c)=(s)[(i)++]; \ |
(i)=((i) + UTF_8_COUNT_TRAIL_BYTES((s)[(i)]) + 1); \ |
if((Uint8)((c)-0xc0)<0x35) { \ |
|
Uint8 __count=UTF_8_COUNT_TRAIL_BYTES(c); \ |
|
UTF_8_MASK_LEAD_BYTE(c, __count); \ |
|
switch(__count) { \ |
|
case 3: \ |
|
(c)=((c)<<6)|((s)[(i)++]&0x3f); \ |
|
case 2: \ |
|
(c)=((c)<<6)|((s)[(i)++]&0x3f); \ |
|
case 1: \ |
|
(c)=((c)<<6)|((s)[(i)++]&0x3f); \ |
|
break; \ |
|
} \ |
|
} \ |
|
} | } |
| |
int isValid_U8(const Uint8 *src,int size); |
PEGASUS_COMMON_LINKAGE Boolean isValid_U8(const Uint8 *src,int size); |
int UTF16toUTF8(const Uint16** srcHead, |
|
|
PEGASUS_COMMON_LINKAGE int UTF16toUTF8( |
|
const Uint16** srcHead, |
const Uint16* srcEnd, | const Uint16* srcEnd, |
Uint8** tgtHead, | Uint8** tgtHead, |
Uint8* tgtEnd); | Uint8* tgtEnd); |
| |
int UTF8toUTF16 (const Uint8** srcHead, |
PEGASUS_COMMON_LINKAGE int UTF8toUTF16( |
|
const Uint8** srcHead, |
const Uint8* srcEnd, | const Uint8* srcEnd, |
Uint16** tgtHead, | Uint16** tgtHead, |
Uint16* tgtEnd); | Uint16* tgtEnd); |
| |
|
PEGASUS_COMMON_LINKAGE Boolean isUTF8Aux(const char*); |
|
|
|
inline Boolean isUTF8(const char* c) |
|
{ |
|
return (unsigned int)c[0] < 128 || isUTF8Aux(c); |
|
} |
|
|
|
PEGASUS_COMMON_LINKAGE Boolean isUTF8Str(const char*); |
|
|
|
/** Escape all characters above 7-bit ASCII. |
|
@param String: The string to be escaped Insert text here. |
|
@return String: The escaped string. |
|
*/ |
|
PEGASUS_COMMON_LINKAGE String escapeStringEncoder(const String& Str); |
|
|
|
/** decode string returned from escapeString Encoder. |
|
@param String: The string to be decoded. |
|
@return String: The decoded string. |
|
|
|
Prereq: Only the return string from the escapeStringEncoder can be used |
|
as input. |
|
*/ |
|
PEGASUS_COMMON_LINKAGE String escapeStringDecoder(const String& Str); |
|
|
|
/** |
|
The InitializeICU class loads and initializes data items that are required |
|
internally by various ICU functions. It makes sure that ICU function u_init |
|
is only called once by a process. A module which is using ICU APIs needs |
|
to call InitializeICU::initICUSuccessful first before it calls other ICU |
|
APIs. If InitializeICU::initICUSuccessful is failed, the module should not |
|
call other ICU APIs. |
|
*/ |
|
|
|
#ifdef PEGASUS_HAS_ICU |
|
class PEGASUS_COMMON_LINKAGE InitializeICU |
|
{ |
|
public: |
|
|
|
/** |
|
Determines if ICU initialization is successful. |
|
|
|
@return true, if u_init is called and success |
|
false otherwise |
|
*/ |
|
|
|
static Boolean initICUSuccessful(); |
|
|
|
private: |
|
static Boolean _initAttempted; |
|
static Boolean _initSuccessful; |
|
|
|
static Mutex _initMutex; |
|
}; |
|
|
|
#endif |
|
|
|
|
PEGASUS_NAMESPACE_END | PEGASUS_NAMESPACE_END |
|
|
#endif | #endif |