version 1.68, 2003/04/30 13:50:44
|
version 1.95, 2004/06/15 18:38:24
|
|
|
//%///////////////////////////////////////////////////////////////////////////// |
//%2003//////////////////////////////////////////////////////////////////////// |
// | // |
// Copyright (c) 2000, 2001, 2002 BMC Software, Hewlett-Packard Company, IBM, |
// Copyright (c) 2000, 2001, 2002 BMC Software, Hewlett-Packard Development |
// The Open Group, Tivoli Systems |
// Company, L. P., IBM Corp., The Open Group, Tivoli Systems. |
|
// Copyright (c) 2003 BMC Software; Hewlett-Packard Development Company, L. P.; |
|
// IBM Corp.; EMC Corporation, The Open Group. |
// | // |
// Permission is hereby granted, free of charge, to any person obtaining a copy | // Permission is hereby granted, free of charge, to any person obtaining a copy |
// of this software and associated documentation files (the "Software"), to | // of this software and associated documentation files (the "Software"), to |
|
|
#include "InternalException.h" | #include "InternalException.h" |
#include <iostream> | #include <iostream> |
#include <fstream> | #include <fstream> |
#ifndef PEGASUS_REMOVE_DEPRECATED |
|
#include "System.h" // for strcasecmp |
#include "CommonUTF.h" |
|
|
|
#ifdef PEGASUS_HAS_ICU |
|
#include <unicode/unistr.h> |
#endif | #endif |
| |
PEGASUS_USING_STD; | PEGASUS_USING_STD; |
|
|
| |
// Copy constructor. Starts with a null _rep and, only when the source CString
// holds a buffer, allocates strlen()+1 chars and copies the NUL-terminated
// contents into the new buffer.
CString::CString(const CString& cstr) | CString::CString(const CString& cstr) |
{ | { |

_rep = 0;



// A source without a buffer yields a CString without a buffer.
if (cstr._rep)

{
_rep = (void*)new char[strlen((char*)cstr._rep)+1]; | _rep = (void*)new char[strlen((char*)cstr._rep)+1]; |
strcpy((char*)_rep, (char*)cstr._rep); | strcpy((char*)_rep, (char*)cstr._rep); |
} | } |

}
| |
CString::CString(char* cstr) | CString::CString(char* cstr) |
: _rep(cstr) | : _rep(cstr) |
|
|
// Destructor. Releases the character buffer held in _rep with delete[] when
// one is present.
CString::~CString() | CString::~CString() |
{ | { |
if (_rep) | if (_rep) |

{
delete [] (char*)_rep; | delete [] (char*)_rep; |
} | } |

}
| |
// Copy assignment. Does nothing on self-assignment; otherwise frees any buffer
// currently held, then duplicates the source's NUL-terminated buffer (if it
// has one) into freshly allocated storage. Returns *this.
CString& CString::operator=(const CString& cstr) | CString& CString::operator=(const CString& cstr) |
{ | { |

if (&cstr != this)

{

// Drop the old contents first; _rep stays null if the source is empty.
if (_rep)

{

delete [] (char*)_rep;

_rep = 0;

}

if (cstr._rep)

{
_rep = (char*)new char[strlen((char*)cstr._rep)+1]; | _rep = (char*)new char[strlen((char*)cstr._rep)+1]; |
strcpy((char*)_rep, (char*)cstr._rep); | strcpy((char*)_rep, (char*)cstr._rep); |

}

}
return *this; | return *this; |
} | } |
| |
|
|
| |
/**
    Copy assignment operator.

    @param str  The String whose contents are copied into this object.
    @return     A reference to this String.
*/
String& String::operator=(const String& str)
{
    // Assigning an object to itself must leave it untouched, so the copy is
    // skipped in that case.
    if (&str != this)
    {
        assign(str);
    }

    return *this;
}
| |
String& String::assign(const String& str) | String& String::assign(const String& str) |
|
|
return *this; | return *this; |
} | } |
| |
/**
    Replaces the contents of this String with the characters of a
    NUL-terminated C string.

    Every byte of the input, including the terminating NUL, is converted
    through Uint8 and appended to the internal character array.

    @param str  NUL-terminated source string (passed straight to strlen()).
    @return     A reference to this String.
*/
String& String::assign(const char* str)
{
    _rep->c16a.clear();

    // Count includes the trailing NUL, which is stored in the array as well.
    const Uint32 total = strlen(str) + 1;
    _rep->c16a.reserveCapacity(total);

    for (Uint32 i = 0; i < total; i++)
    {
        _rep->c16a.append(Uint8(str[i]));
    }

    return *this;
}
|
|
|
/**
    Replaces the contents of this String with at most the first n bytes of
    a C string.

    The bytes are copied into a zero-filled temporary buffer of n+1 chars so
    that the result is always NUL-terminated, and that buffer is then handed
    to assign(const char*), which performs the actual conversion and
    terminates the internal array.

    @param str  Source characters; copying stops at a NUL or after n bytes,
                whichever comes first (strncpy semantics).
    @param n    Maximum number of bytes to take from str.
    @return     A reference to this String.
*/
String& String::assign(const char* str, Uint32 n)
{
    char* tmpStr = new char[n + 1];
    memset(tmpStr, 0x00, n + 1);
    strncpy(tmpStr, str, n);

    try
    {
        assign(tmpStr);
    }
    catch (...)
    {
        // Do not leak the temporary if the conversion throws.
        delete [] tmpStr;
        throw;
    }

    // Allocated with new[], so it must be released with delete[].
    delete [] tmpStr;

    return *this;
}
|
|
return _rep->c16a.getData(); | return _rep->c16a.getData(); |
} | } |
| |
/**
    Builds an 8-bit copy of this String.

    Allocates size()+1 chars and fills them by narrowing each 16-bit
    character (terminator included) to char. No check is made for
    characters that do not fit in a char.

    @return  A CString constructed from the newly allocated buffer.
*/
CString String::getCString() const
{
    const Uint32 count = size() + 1;
    char* buffer = new char[count];
    const Char16* source = getChar16Data();

    for (Uint32 k = 0; k < count; k++)
    {
        Uint16 unit = source[k];
        buffer[k] = char(unit);
    }

    return CString(buffer);
}
|
|
|
Char16& String::operator[](Uint32 index) | Char16& String::operator[](Uint32 index) |
{ | { |
if (index > size()) | if (index > size()) |
|
|
Uint32 i = 1; | Uint32 i = 1; |
for (; i < subStrLen; i++) | for (; i < subStrLen; i++) |
if (*pStr++ != *p++ ) | if (*pStr++ != *p++ ) |
{pStr--; break;} // break from loop |
{pStr-=i; break;} // break from loop |
if (i == subStrLen) | if (i == subStrLen) |
return loc; | return loc; |
} | } |
|
|
return PEG_NOT_FOUND; | return PEG_NOT_FOUND; |
} | } |
| |
// ATTN-RK-P3-20020509: Define case-sensitivity for non-English characters |
|
// Lower-cases this String without naming a locale: forwards a null locale
// pointer to toLower(const char*).
void String::toLower() | void String::toLower() |
{ | { |

const char * noLocale = NULL;

String::toLower(noLocale);

}
|
// Lower-cases this String in place.
//
// strLocale: locale name to use for the conversion, or NULL for none.
//
// With PEGASUS_HAS_ICU the internal character data is wrapped in an ICU
// UnicodeString, lower-cased (with the Locale built from strLocale when one
// is given), and assigned back. An InvalidNameException carrying the locale
// name is thrown when Locale::isBogus() reports the locale as invalid.
// Without ICU only characters <= PEGASUS_MAX_PRINTABLE_CHAR are passed
// through tolower(); strLocale is not used in that branch.
void String::toLower(const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr((const UChar *)_rep->c16a.getData());

if(strLocale == NULL)

{

UniStr.toLower();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr.toLower(loc);

}

// Presumably added so the buffer passed to assign() below is NUL-terminated.
UniStr.append((UChar)'\0');



assign((Char16*)UniStr.getBuffer());

#else
// Walk the character array up to its terminating zero.
for (Char16* p = &_rep->c16a[0]; *p; p++) | for (Char16* p = &_rep->c16a[0]; *p; p++) |
{ | { |
if (*p <= PEGASUS_MAX_PRINTABLE_CHAR) | if (*p <= PEGASUS_MAX_PRINTABLE_CHAR) |
*p = tolower(*p); | *p = tolower(*p); |
} | } |

#endif

}
|
|
|
// Upper-cases this String in place.
//
// strLocale: locale name to use for the conversion, or NULL for none.
//
// With PEGASUS_HAS_ICU the internal character data is wrapped in an ICU
// UnicodeString, upper-cased (with the Locale built from strLocale when one
// is given), and assigned back. An InvalidNameException carrying the locale
// name is thrown when Locale::isBogus() reports the locale as invalid.
// Without ICU only characters <= PEGASUS_MAX_PRINTABLE_CHAR are passed
// through toupper(); strLocale is not used in that branch.
void String::toUpper(const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr((const UChar *)_rep->c16a.getData());

if(strLocale == NULL)

{

UniStr.toUpper();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr.toUpper(loc);

}

// Presumably added so the buffer passed to assign() below is NUL-terminated.
UniStr.append((UChar)'\0');



assign((Char16*)UniStr.getBuffer());

#else

// Walk the character array up to its terminating zero.
for (Char16* p = &_rep->c16a[0]; *p; p++)

{

if (*p <= PEGASUS_MAX_PRINTABLE_CHAR)

*p = toupper(*p);

}

#endif
} | } |
| |
int String::compare(const String& s1, const String& s2, Uint32 n) | int String::compare(const String& s1, const String& s2, Uint32 n) |
|
|
| |
// Case-insensitive comparison without naming a locale: forwards a null locale
// pointer to the three-argument compareNoCase() and returns its result.
int String::compareNoCase(const String& s1, const String& s2) | int String::compareNoCase(const String& s1, const String& s2) |
{ | { |

const char * noLocale = NULL;

return String::compareNoCase(s1, s2, noLocale);

}
|
|
|
// Case-insensitive comparison of s1 and s2.
//
// strLocale: locale name used for case folding, or NULL for none.
//
// With PEGASUS_HAS_ICU both strings are copied into ICU UnicodeStrings,
// lower-cased (with the Locale built from strLocale when one is given) and
// compared with UnicodeString::compare(); that result is returned. An
// InvalidNameException carrying the locale name is thrown when
// Locale::isBogus() reports the locale as invalid.
//
// NOTE(review): the non-ICU branch below appears to be missing lines in this
// view (only its first two declarations and two return statements are
// visible); confirm against the complete source before relying on it.
int String::compareNoCase(const String& s1, const String& s2,const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr1((const UChar *)s1.getChar16Data(), (int32_t)s1.size());

UnicodeString UniStr2((const UChar *)s2.getChar16Data(), (int32_t)s2.size());

if(strLocale == NULL)

{

UniStr1.toLower();

UniStr2.toLower();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr1.toLower(loc);

UniStr2.toLower(loc);

}

// Note: the ICU 2.6.1 documentation for UnicodeString::compare( ) is

// backwards! The API actually returns +1 if this is greater than text.

// This is why the line below appears wrong based on the 2.6.1 docs.

// (ref. bugzilla 1207)

return (UniStr1.compare(UniStr2));

#else
const Char16* _s1 = s1.getChar16Data(); | const Char16* _s1 = s1.getChar16Data(); |
const Char16* _s2 = s2.getChar16Data(); | const Char16* _s2 = s2.getChar16Data(); |
| |


return 1; | return 1; |
| |
return 0; | return 0; |

#endif
} | } |
| |
Boolean String::equal(const String& str1, const String& str2) | Boolean String::equal(const String& str1, const String& str2) |
|
|
| |
// Case-insensitive equality test without naming a locale: forwards a null
// locale pointer to the three-argument equalNoCase() and returns its result.
Boolean String::equalNoCase(const String& str1, const String& str2) | Boolean String::equalNoCase(const String& str1, const String& str2) |
{ | { |

const char * noLocale = NULL;

return String::equalNoCase(str1, str2, noLocale);

}
|
|
|
// Case-insensitive equality test of str1 and str2.
//
// strLocale: locale name used for case folding, or NULL for none.
//
// With PEGASUS_HAS_ICU both strings are copied into ICU UnicodeStrings,
// lower-cased (with the Locale built from strLocale when one is given) and
// compared with operator==. An InvalidNameException carrying the locale name
// is thrown when Locale::isBogus() reports the locale as invalid.
//
// NOTE(review): the non-ICU branch below appears to be missing lines in this
// view (only the size check and the final return are visible); confirm
// against the complete source before relying on it.
Boolean String::equalNoCase(const String& str1, const String& str2,const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr1((const UChar *)str1.getChar16Data(), (int32_t)str1.size());

UnicodeString UniStr2((const UChar *)str2.getChar16Data(), (int32_t)str2.size());

if(strLocale == NULL)

{

UniStr1.toLower();

UniStr2.toLower();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr1.toLower(loc);

UniStr2.toLower(loc);

}

return (UniStr1 == UniStr2);

#else
// Strings of different length can never be equal.
if (str1.size() != str2.size()) | if (str1.size() != str2.size()) |
return false; | return false; |
| |


} | } |
| |
return true; | return true; |

#endif
} | } |
| |
|
// UTF8 specific code: |
|
/**
    Replaces the contents of this String with a NUL-terminated C string,
    running the bytes through UTF8toUTF16() to obtain 16-bit characters.

    A temporary Char16 buffer with one slot per input byte (terminator
    included) receives the converted text. The characters up to the first
    zero in that buffer are appended to the internal array, followed by a
    terminating '\0'.

    @param str  NUL-terminated source string (passed straight to strlen()).
    @return     A reference to this String.
*/
String& String::assign(const char* str)
{
    _rep->c16a.clear();

    // Byte count including the terminating NUL.
    const Uint32 byteCount = strlen(str) + 1;

    Char16* utf16Buf = new Char16[byteCount];

    // Source range covers the bytes before the NUL; the target range is the
    // whole temporary buffer.
    const Uint8* srcPos = (Uint8 *)str;
    Uint8* srcEnd = (Uint8 *)&str[byteCount - 1];
    Uint16* dstPos = (Uint16 *)utf16Buf;
    Uint16* dstEnd = (Uint16 *)&utf16Buf[byteCount];

    UTF8toUTF16(&srcPos, srcEnd, &dstPos, dstEnd);

    // Length of the converted text: position of the first zero character,
    // capped at byteCount - 1.
    Uint32 length = 0;
    while ((utf16Buf[length] != Char16(0x00)) && (length < (byteCount - 1)))
    {
        ++length;
    }

    _rep->c16a.append(utf16Buf, length);
    _rep->c16a.append('\0');

    delete [] utf16Buf;

    return *this;
}
|
|
|
/**
    Builds an 8-bit copy of this String by running its 16-bit characters
    (terminator included) through UTF16toUTF8().

    The conversion writes into a scratch buffer of 3*size()+1 bytes; the
    result is then copied into a buffer of exactly strlen()+1 bytes, which
    is handed to the returned CString.

    @return  A CString constructed from the exact-size buffer.
*/
CString String::getCString() const
{
    // Scratch space: three bytes per 16-bit character plus one.
    const Uint32 capacity = 3*size() + 1;
    char* scratch = new char[capacity];

    const Char16* units = getChar16Data();

    // The source range runs one past size() so the terminating zero is
    // converted as well.
    const Uint16* srcPos = (Uint16 *)units;
    Uint16* srcEnd = (Uint16 *)&units[size()+1];
    Uint8* dstPos = (Uint8 *)scratch;
    Uint8* dstEnd = (Uint8 *)&scratch[capacity];

    UTF16toUTF8(&srcPos, srcEnd, &dstPos, dstEnd);

    // Shrink to fit before giving the buffer to CString.
    char* result = new char[strlen(scratch)+1];
    strcpy(result, scratch);
    delete [] scratch;

    return CString(result);
}
| |
#if 0 | #if 0 |
// ATTN-RK-P3-20020603: This code is not completely correct | // ATTN-RK-P3-20020603: This code is not completely correct |
|
|
special characters in the pattern: *?\[] (see the manual | special characters in the pattern: *?\[] (see the manual |
entry for details on what these mean). | entry for details on what these mean). |
| |
|
|
Side effects: None. | Side effects: None. |
*/ | */ |
| |
|
|
| |
// Returns tolower(char(ch)) for values up to PEGASUS_MAX_PRINTABLE_CHAR and
// returns ch unchanged for anything larger.
inline Uint16 _ToLower(Uint16 ch) | inline Uint16 _ToLower(Uint16 ch) |
{ | { |

// ICU_TODO: If ICU is available we should do this the correct way.
return ch <= PEGASUS_MAX_PRINTABLE_CHAR ? tolower(char(ch)) : ch; | return ch <= PEGASUS_MAX_PRINTABLE_CHAR ? tolower(char(ch)) : ch; |
} | } |
| |
inline Boolean _Equal(MatchChar ch1, MatchChar ch2, int nocase) | inline Boolean _Equal(MatchChar ch1, MatchChar ch2, int nocase) |
{ | { |
|
// ICU_TODO: If ICU is available we should do this the correct way. |
if (nocase) | if (nocase) |
return _ToLower(ch1) == _ToLower(ch2); | return _ToLower(ch1) == _ToLower(ch2); |
else | else |
|
|
| |
// Stream insertion operator for String; returns the stream it was given.
//
// NOTE(review): this span interleaves lines from two revisions of the
// function and some interior lines are not visible, so the preprocessor and
// brace structure shown here does not form one coherent body. The visible
// pieces are: an OS/400 path that writes str.getCString() to the stream, an
// ICU path that extracts the text through a UnicodeString when the stream is
// cout or cerr and otherwise writes str.getCString(), and a fallback loop
// that writes each character individually. Reconcile against a single
// revision before changing any code here.
PEGASUS_STD(ostream)& operator<<(PEGASUS_STD(ostream)& os, const String& str) | PEGASUS_STD(ostream)& operator<<(PEGASUS_STD(ostream)& os, const String& str) |
{ | { |
#ifdef PEGASUS_OS_OS400

int inc = 0;
#if defined(PEGASUS_OS_OS400)
int newbuf = 0;
CString cstr = str.getCString();
char *buffer = NULL;
const char* utf8str = cstr;
char buffer1[201];

char temp[2];
os << utf8str;
if (str.size() > 200)

{
#elif defined(PEGASUS_HAS_ICU)
buffer = new char[str.size()+1];
if(os == cout || os == cerr){
newbuf = 1;
char *buf = NULL;

const int size = str.size() * 6;

UnicodeString UniStr((const UChar *)str.getChar16Data(), (int32_t)str.size());

// First extract() call is made with a null target; its return value is used
// as the size of the buffer allocated for the second call.
Uint32 bufsize = UniStr.extract(0,size,buf);



buf = new char[bufsize+1];

UniStr.extract(0,bufsize,buf);

os << buf;

os.flush();

delete [] buf;

}else{

CString cstr = str.getCString();

const char* utf8str = cstr;

os << utf8str;
} | } |
else

buffer = buffer1;

#endif

| |

#else
for (Uint32 i = 0, n = str.size(); i < n; i++) | for (Uint32 i = 0, n = str.size(); i < n; i++) |
{ | { |
Uint16 code = str[i]; | Uint16 code = str[i]; |
| |
if (code > 0 && code <= PEGASUS_MAX_PRINTABLE_CHAR) | if (code > 0 && code <= PEGASUS_MAX_PRINTABLE_CHAR) |
{ | { |
#ifdef PEGASUS_OS_OS400

// process so messages don't get displayed as one char per line on OS/400.

// Uint16 is a 2 byte character where byte 1 is '00' and byte 2 is

// the character. Also, the entire string needs to be sent to os instead

// of one "byte/Uint16" at a time. Sending one "byte/Uint16" at a time also

// causes one character per line. On OS/400 use of os << char(code) is a

// restriction and no available c/cpp alternative was available. The

// following was created to compensate for this restriction.

memcpy(temp, &code, 2);

memcpy(buffer+inc, &temp[1], 1); // do not include the '00'

if ((i+1) == n) // last character

{

memset(buffer+n, 0x00, 1); // add null terminator

os << buffer; // return 1-byte per character string

if (buffer && newbuf != 0)

delete [] buffer; // okay; this is the end of the loop

}

inc++;

#else

os << char(code); | os << char(code); |
#endif

} | } |
else | else |
{ | { |


os << buffer; | os << buffer; |
} | } |
} | } |

#endif // End of PEGASUS_HAS_ICU #else leg.
| |
return os; | return os; |
} | } |
|
|
return String::compare(str1, str2) >= 0; | return String::compare(str1, str2) >= 0; |
} | } |
| |
#ifndef PEGASUS_REMOVE_DEPRECATED |
|
int CompareNoCase(const char* s1, const char* s2) |
|
{ |
|
return System::strcasecmp(s1, s2); |
|
} |
|
#endif |
|
|
|
PEGASUS_NAMESPACE_END | PEGASUS_NAMESPACE_END |