pegasus/src/Pegasus/Common/String.cpp - diff

Return to String.cpp CVS log

Up to [Pegasus] / pegasus / src / Pegasus / Common

Diff for /pegasus/src/Pegasus/Common/String.cpp between version 1.68 and 1.78

version 1.68, 2003/04/30 13:50:44

version 1.78, 2003/09/16 12:38:21

Line 39

#include "System.h" // for strcasecmp

#endif

#include "CommonUTF.h"

#ifdef PEGASUS_HAS_ICU

#include <unicode/unistr.h>

#endif

PEGASUS_USING_STD;

PEGASUS_NAMESPACE_BEGIN

Line 201

Line 207

assign(str);

}

// Constructs a String from the NUL-terminated C string `str`.
//
// str     - source characters.
// utfFlag - NUL-terminated encoding selector. When it equals
//           STRING_FLAG_UTF8 the source is handed to assignUTF8();
//           any other value falls back to the plain assign() path.
String::String(const char* str, const char* utfFlag)
{
    _rep = new StringRep;

    // Compare as C strings: strcmp() stops at the first terminator, so a
    // utfFlag shorter than STRING_FLAG_UTF8 is never read past its end
    // (a fixed-length memcmp() over sizeof(STRING_FLAG_UTF8) could be).
    if (strcmp(utfFlag, STRING_FLAG_UTF8) == 0)
    {
        assignUTF8(str);
    }
    else
    {
        assign(str);
    }
}

String::String(const char* str, Uint32 n)

{

_rep = new StringRep;

Line 443

Line 463

}

// ATTN-RK-P3-20020509: Define case-sensitivity for non-English characters

// ATTN-CEC-20030913: ICU code added, but uses the server's locale. Look at adding

// a toLower( ) with Locale parameter - like ICU's toLower( )

void String::toLower()

{

#ifdef PEGASUS_HAS_ICU

Char16* utf16str;

UnicodeString UniStr((const UChar *)_rep->c16a.getData());

UniStr.toLower();

UniStr.append((UChar)'\0'); // ATTN - must be after toLower, but before getTerminatedBuffer

// We should not need to do this!

utf16str = (Char16 *)UniStr.getTerminatedBuffer();

assign(utf16str);

// DEVELOPER NOTE: do not delete utf16str, this is handled by ICU

#else

for (Char16* p = &_rep->c16a[0]; *p; p++)

{

if (*p <= PEGASUS_MAX_PRINTABLE_CHAR)

*p = tolower(*p);

}

#endif

}

int String::compare(const String& s1, const String& s2, Uint32 n)

Line 491

Line 524

int String::compareNoCase(const String& s1, const String& s2)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr1((const UChar *)s1.getChar16Data(), (int32_t)s1.size());

UnicodeString UniStr2((const UChar *)s2.getChar16Data(), (int32_t)s2.size());

UniStr1.toLower();

UniStr2.toLower();

return (UniStr2.compare(UniStr1));

#else

const Char16* _s1 = s1.getChar16Data();

const Char16* _s2 = s2.getChar16Data();

Line 518

Line 558

return 1;

return 0;

#endif

}

Boolean String::equal(const String& str1, const String& str2)

Line 527

Line 568

Boolean String::equalNoCase(const String& str1, const String& str2)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr1((const UChar *)str1.getChar16Data(), (int32_t)str1.size());

UnicodeString UniStr2((const UChar *)str2.getChar16Data(), (int32_t)str2.size());

UniStr1.toLower();

UniStr2.toLower();

return (UniStr1 == UniStr2);

#else

if (str1.size() != str2.size())

return false;

Line 548

Line 596

}

return true;

#endif

}

// UTF8 specific code:

// Replaces the contents of this string with the UTF-16 form of the
// NUL-terminated UTF-8 string `str` and returns *this.
//
// The temporary UTF-16 buffer holds strlen(str) + 1 elements; UTF-8 input of
// that many bytes can never produce more UTF-16 code units than bytes.
String& String::assignUTF8(const char* str)
{
    _rep->c16a.clear();

    Uint32 n = strlen(str) + 1;

    // Source range excludes the terminating NUL (endsrc points at it).
    const Uint8 *strsrc = (Uint8 *)str;
    Uint8 *endsrc = (Uint8 *)&str[n-1];

    Char16 *msg16 = new Char16[n];
    Uint16 *strtgt = (Uint16 *)msg16;
    Uint16 *endtgt = (Uint16 *)&msg16[n];

    UTF8toUTF16(&strsrc,
                endsrc,
                &strtgt,
                endtgt);

    // Count the converted characters up to the first zero element.
    // NOTE(review): relies on `new Char16[n]` zero-initialising the buffer,
    // since the terminator is not part of the converted range - confirm
    // against Char16's default constructor.
    // The bound is tested first and is strictly `< n`, so msg16[n] (one past
    // the allocation) is never read.
    Uint32 count = 0;
    while ((count < n) && ((msg16[count]) != Char16(0x00)))
    {
        ++count;
    }

    _rep->c16a.append(msg16, count);
    _rep->c16a.append('\0');

    delete [] msg16;

    return *this;
}

// Returns the contents of this string as a UTF-8 encoded CString.
//
// The conversion goes through a worst-case sized scratch buffer and is then
// copied into an exactly sized allocation that is handed to the CString.
CString String::getCStringUTF8() const
{
    // A UTF-16 code unit expands to at most three UTF-8 bytes; the extra
    // byte holds the NUL terminator, which is part of the converted range
    // below. Without it an empty string would get a zero-length buffer and
    // a string of three-byte characters would have no room for the NUL.
    Uint32 n = 3*size() + 1;
    char* str = new char[n];

    // Zero-fill so the buffer is NUL-terminated for strlen() even if the
    // conversion stops before writing the terminator.
    memset(str, 0, n);

    const Char16* msg16 = getChar16Data();

    // Source range is size() characters plus one more element, presumably
    // the terminating zero of the character data.
    const Uint16 *strsrc = (Uint16 *)msg16;
    Uint16 *endsrc = (Uint16 *)&msg16[size()+1];

    Uint8 *strtgt = (Uint8 *)str;
    Uint8 *endtgt = (Uint8 *)&str[n];

    UTF16toUTF8 (&strsrc,
                 endsrc,
                 &strtgt,
                 endtgt);

    // Shrink to the actual encoded length before handing the buffer over.
    char* str1 = new char[strlen(str)+1];
    strcpy(str1,str);
    delete [] str;

    return CString(str1);
}

// Checks the single UTF-8 encoded character that starts at `legal`.
//
// The expected length of the sequence is derived from its lead byte via
// UTF_8_COUNT_TRAIL_BYTES. Returns false if the string ends (a zero byte is
// found) before all expected bytes are present; otherwise returns the result
// of isValid_U8() for that byte sequence.
Boolean String::isUTF8(const char *legal)
{
    char numBytes = UTF_8_COUNT_TRAIL_BYTES(*legal)+1;

    // Validate that the string is long enough to hold all the expected bytes.
    // Note that if legal[0] == 0, numBytes will be 1.
    for (char i=1; i<numBytes; i++)
    {
        if (legal[i] == 0)
        {
            return false;
        }
    }

    // Only reached once every expected trail byte is known to be present.
    return (isValid_U8((const Uint8 *)legal, numBytes));
}

#if 0

// ATTN-RK-P3-20020603: This code is not completely correct

Line 565

Line 686

special characters in the pattern: *?\[] (see the manual

entry for details on what these mean).

Side effects: None.

Line 576

Line 698

// Lower-cases a single character for pattern matching. Characters above
// PEGASUS_MAX_PRINTABLE_CHAR are returned unchanged; all others are narrowed
// to char and passed through tolower().
inline Uint16 _ToLower(Uint16 ch)
{
    // ICU_TODO: If ICU is available we should do this the correct way.
    if (ch > PEGASUS_MAX_PRINTABLE_CHAR)
    {
        return ch;
    }

    return tolower(char(ch));
}

inline Boolean _Equal(MatchChar ch1, MatchChar ch2, int nocase)

{

// ICU_TODO: If ICU is available we should do this the correct way.

if (nocase)

return _ToLower(ch1) == _ToLower(ch2);

else

Line 747

Line 871

PEGASUS_STD(ostream)& operator<<(PEGASUS_STD(ostream)& os, const String& str)

{

#ifdef PEGASUS_OS_OS400

int inc = 0;

#if defined(PEGASUS_OS_OS400)

int newbuf = 0;

CString cstr = str.getCStringUTF8();

char *buffer = NULL;

const char* utf8str = cstr;

char buffer1[201];

char temp[2];

os << utf8str;

if (str.size() > 200)

{

#elif defined(PEGASUS_HAS_ICU)

buffer = new char[str.size()+1];

newbuf = 1;

char *buf = NULL;

}

const int size = str.size() * 6;

else

UnicodeString UniStr((const UChar *)str.getChar16Data(), (int32_t)str.size());

buffer = buffer1;

Uint32 bufsize = UniStr.extract(0,size,buf);

#endif

buf = new char[bufsize+1];

UniStr.extract(0,bufsize,buf);

os << buf;

os.flush();

delete [] buf;

#else

for (Uint32 i = 0, n = str.size(); i < n; i++)

{

Line 768

Line 899

if (code > 0 && code <= PEGASUS_MAX_PRINTABLE_CHAR)

{

#ifdef PEGASUS_OS_OS400

// process so messages don't get displayed as one char per line on OS/400.

// Uint16 is a 2 byte character where byte 1 is '00' and byte 2 is

// the character. Also, the entire string needs to be sent to os instead

// of one "byte/Unit16" at a time. Sending one "byte/Uint16" at a time also

// causes one character per line. On OS/400 use of os << char(code) is a

// restriction and no available c/cpp alternative was available. The

// following was created to compensate for this restriction.

memcpy(temp, &code, 2);

memcpy(buffer+inc, &temp[1], 1); // do not include the '00'

if ((i+1) == n) // last character

{

memset(buffer+n, 0x00, 1); // add null terminator

os << buffer; // return 1-byte per character string

if (buffer && newbuf != 0)

delete [] buffer; // okay; this is the end of the loop

}

inc++;

#else

os << char(code);

#endif

}

else

{

Line 798

Line 909

os << buffer;

}

#endif // End of PEGASUS_HAS_ICU #else leg.

return os;

}

Legend:

Removed from v.1.68
changed lines
	Added in v.1.78

No CVS admin address has been configured