pegasus/src/Pegasus/Common/String.cpp - diff

Return to String.cpp CVS log

Up to [Pegasus] / pegasus / src / Pegasus / Common

Diff for /pegasus/src/Pegasus/Common/String.cpp between version 1.21 and 1.109

version 1.21, 2001/06/08 00:40:42

version 1.109, 2005/05/18 20:34:36

Line 1

//%/////////////////////////////////////////////////////////////////////////////

//%2005////////////////////////////////////////////////////////////////////////

// Company, L.P.; IBM Corp.; The Open Group; Tivoli Systems.

// IBM Corp.; EMC Corporation, The Open Group.

// IBM Corp.; EMC Corporation; VERITAS Software Corporation; The Open Group.

// EMC Corporation; VERITAS Software Corporation; The Open Group.

// Permission is hereby granted, free of charge, to any person obtaining a copy

// of this software and associated documentation files (the "Software"), to

// deal in the Software without restriction, including without limitation the

// rights to use, copy, modify, merge, publish, distribute, sublicense, and/or

// sell copies of the Software, and to permit persons to whom the Software is

// furnished to do so, subject to the following conditions:

// Permission is hereby granted, free of charge, to any person obtaining a

// THE ABOVE COPYRIGHT NOTICE AND THIS PERMISSION NOTICE SHALL BE INCLUDED IN

// copy of this software and associated documentation files (the "Software"),

// ALL COPIES OR SUBSTANTIAL PORTIONS OF THE SOFTWARE. THE SOFTWARE IS PROVIDED

// to deal in the Software without restriction, including without limitation

// "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT

// the rights to use, copy, modify, merge, publish, distribute, sublicense,

// LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR

// and/or sell copies of the Software, and to permit persons to whom the

// PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT

// Software is furnished to do so, subject to the following conditions:

// HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN

// ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION

// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

// WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.

// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL

// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING

// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER

// DEALINGS IN THE SOFTWARE.

//==============================================================================

// Author: Mike Brasher (mbrasher@bmc.com)

// Modified By:

// Modified By: Roger Kumpf, Hewlett-Packard Company (roger_kumpf@hp.com)

// Josephine Eskaline Joyce, IBM (jojustin@in.ibm.com) for Bug#3297

//%/////////////////////////////////////////////////////////////////////////////

#include <cctype>

#include <cstring>

#include "String.h"

#include "Exception.h"

#include "Array.h"

#include "String.h"

#include "AutoPtr.h"

#include "InternalException.h"

#include <iostream>

#include <fstream>

#include <Pegasus/Common/CommonUTF.h>

#include "CommonUTF.h"

#ifdef PEGASUS_HAS_ICU

#include <unicode/ustring.h>

#include <unicode/uchar.h>

#endif

PEGASUS_USING_STD;

PEGASUS_NAMESPACE_BEGIN

#define PEGASUS_ARRAY_T String

///////////////////////////////////////////////////////////////////////////////

#include <Pegasus/Common/ArrayImpl.h>

#undef PEGASUS_ARRAY_T

// CString

///////////////////////////////////////////////////////////////////////////////

CString::CString()

: _rep(0)

{

}

const String String::EMPTY;

CString::CString(const CString& cstr)

{

_rep = 0;

static inline void _SkipWhitespace(const Char16*& p)

if (cstr._rep)

{

while (*p && isspace(*p))

_rep = (void*)new char[strlen((char*)cstr._rep)+1];

p++;

strcpy((char*)_rep, (char*)cstr._rep);

}

inline Uint32 StrLen(const char* str)

CString::CString(char* cstr)

: _rep(cstr)

{

if (!str)

}

throw NullPointer();

CString::~CString()

{

if (_rep)

{

delete [] (char*)_rep;

}

CString& CString::operator=(const CString& cstr)

{

if (&cstr != this)

{

if (_rep)

{

delete [] (char*)_rep;

_rep = 0;

}

if (cstr._rep)

{

_rep = (char*)new char[strlen((char*)cstr._rep)+1];

strcpy((char*)_rep, (char*)cstr._rep);

}

return *this;

}

return strlen(str);

CString::operator const char*() const

{

return (char*)_rep;

}

inline Uint32 StrLen(const Char16* str)

///////////////////////////////////////////////////////////////////////////////

// String

///////////////////////////////////////////////////////////////////////////////

const String String::EMPTY = String();

inline Uint32 _StrLen(const Char16* str)

{

if (!str)

throw NullPointer();

Line 67

Line 135

return n;

}

String::String()

// Converts a utf-8 char buffer to utf-16 and appends the utf-16 to the Array.

// n is the length of the input char *, if stopAtTerm is 0

// A terminator character is appended to the end.

// Note that each input char is converted individually, which gives

// the fastest performance.

void _convertAndAppend(const char* str, Array<Char16>& c16a, Uint32 n, Uint8 stopAtTerm)

{

Uint32 i = 0;

while ((stopAtTerm && *str) || (!stopAtTerm && i < n))

{

if (*(Uint8*)str <= 0x7f)

{

_rep.append('\0');

// Current byte sequence is in the us-ascii range.

c16a.append(Uint8(*str++));

}

else

String::String(const String& x) : _rep(x._rep)

{

// Current byte sequence is not in the us-ascii range.

// Check if the byte sequence is valid utf-8, and if so,

// call the converter to utf-16

Uint16 tgt[3];

tgt[1] = 0;

Uint8 c = UTF_8_COUNT_TRAIL_BYTES(*str);

if ( (!stopAtTerm && i + c >= n) ||

(!isValid_U8((const Uint8 *)str, c+1)) )

{

// Note about error conditions.

// It is possible that the last utf-8 char before the

// end of input string extends past the end of the input string.

// This is caught in both cases -

// If counting up to n, then the test above catches it.

// If converting until terminator found, then a terminator

// in the middle of a multi-byte utf-8 char is invalid.

MessageLoaderParms parms("Common.String.BAD_UTF8",

"The byte sequence starting at index $0 is not valid UTF-8 encoding.",

i);

throw Exception(parms);

}

else

String::String(const String& x, Uint32 n)

{

_rep.append('\0');

// str is incremented by this call to the start of the next char

append(x.getData(), n);

Uint16 * tgtBuf = tgt;

}

UTF8toUTF16((const Uint8 **)&str, (Uint8 *)&str[c+1], &tgtBuf, &tgtBuf[2]);

c16a.append(tgt[0]);

String::String(const Char16* x) : _rep(x, StrLen(x) + 1)

if (tgt[1])

{

// Its a utf-16 surrogate pair (uses 2 Char16's)

c16a.append(tgt[1]);

}

String::String(const Char16* x, Uint32 n)

// bump by the trailing byte count

{

i += c;

assign(x, n);

}

String::String(const char* str)

i++;

{

} // end while

Uint32 n = ::strlen(str) + 1;

reserve(n);

while (n--)

c16a.append('\0');

_rep.append(*str++);

}

String::String(const char* str, Uint32 n_)

class StringRep

{

Uint32 n = _min(strlen(str), n_);

public:

reserve(n + 1);

StringRep()

{}

StringRep(const StringRep& r)

: c16a(r.c16a)

{}

StringRep(const Char16* str)

: c16a(str, _StrLen(str) + 1)

{}

while (n--)

Array<Char16> c16a;

_rep.append(*str++);

};

_rep.append('\0');

String::String()

}

String& String::assign(const Char16* x)

{

_rep.clear();

_rep = new StringRep;

_rep.append(x, StrLen(x) + 1);

_rep->c16a.append('\0');

return *this;

}

String& String::assign(const Char16* str, Uint32 n)

String::String(const String& str)

{

_rep.clear();

if (str._rep != NULL)

Uint32 m = _min(StrLen(str), n);

{

_rep.append(str, m);

_rep = new StringRep(*str._rep);

_rep.append('\0');

return *this;

}

else

String& String::assign(const char* x)

{

_rep.clear();

_rep = new StringRep();

Uint32 n = strlen(x);

}

_rep.reserve(n + 1);

}

while (n--)

_rep.append(*x++);

_rep.append('\0');

return *this;

String::String(const String& str, Uint32 n)

{

_rep = new StringRep;

assign(str.getChar16Data(), n);

}

String& String::assign(const char* x, Uint32 n_)

String::String(const Char16* str)

{

_rep.clear();

if ( str == 0 )

{

Uint32 n = _min(strlen(x), n_);

throw NullPointer();

_rep.reserve(n + 1);

}

while (n--)

_rep.append(*x++);

_rep.append('\0');

return *this;

_rep = new StringRep(str);

}

char* String::allocateCString(Uint32 extraBytes, Boolean noThrow) const

String::String(const Char16* str, Uint32 n)

{

Uint32 n = size() + 1;

if ( str == 0 )

char* str = new char[n + extraBytes];

char* p = str;

const Char16* q = getData();

for (Uint32 i = 0; i < n; i++)

{

Uint16 c = *q++;

throw NullPointer();

*p++ = char(c);

if ((c & 0xff00) && !noThrow)

throw TruncatedCharacter();

}

return str;

_rep = new StringRep;

assign(str, n);

}

void String::appendToCString(

String::String(const char* str)

char* str,

{

Uint32 length,

if ( str == 0 )

Boolean noThrow) const

{

if (!str)

throw NullPointer();

}

Uint32 n = _min(size(), length);

_rep = new StringRep;

AutoPtr<StringRep> tempRep(_rep);

char* p = str + strlen(str);

// An exception can be thrown, so use a temp AutoPtr.

const Char16* q = getData();

_convertAndAppend(str, _rep->c16a, 0, 1);

tempRep.release();

}

for (Uint32 i = 0; i < n; i++)

String::String(const char* str, Uint32 n)

{

Uint16 c = *q++;

if ( str == 0 )

*p++ = char(c);

{

throw NullPointer();

if ((c & 0xff00) && !noThrow)

throw TruncatedCharacter();

}

*p = '\0';

_rep = new StringRep;

AutoPtr<StringRep> tempRep(_rep);

// An exception can be thrown, so use a temp AutoPtr.

_convertAndAppend(str, _rep->c16a, n, 0);

tempRep.release();

}

Char16& String::operator[](Uint32 i)

String::~String()

{

if (i > size())

delete _rep;

ThrowOutOfBounds();

return _rep[i];

}

const Char16 String::operator[](Uint32 i) const

String& String::operator=(const String& str)

{

if (i > size())

if (&str != this)

ThrowOutOfBounds();

{

assign(str);

return _rep[i];

}

return *this;

}

String& String::append(const Char16* str, Uint32 n)

String& String::assign(const String& str)

{

Uint32 m = _min(StrLen(str), n);

_rep->c16a = str._rep->c16a;

_rep.reserve(_rep.size() + m);

_rep.remove(_rep.size() - 1);

_rep.append(str, m);

_rep.append('\0');

return *this;

}

void String::remove(Uint32 pos, Uint32 size)

String& String::assign(const Char16* str)

{

if (size == PEG_NOT_FOUND)

if ( str == 0 )

size = this->size() - pos;

{

throw NullPointer();

if (pos + size > this->size())

}

ThrowOutOfBounds();

if (size)

_rep->c16a.clear();

_rep.remove(pos, size);

_rep->c16a.append(str, _StrLen(str) + 1);

return *this;

}

int String::compare(const Char16* s1, const Char16* s2, Uint32 n)

String& String::assign(const Char16* str, Uint32 n)

{

while (n--)

if ( str == 0 )

{

int r = *s1++ - *s2++;

throw NullPointer();

if (r)

return r;

}

return 0;

_rep->c16a.clear();

_rep->c16a.append(str, n);

_rep->c16a.append('\0');

return *this;

}

int String::compareNoCase(const char* s1, const char* s2, Uint32 n)

String& String::assign(const char* str)

{

while (n--)

if ( str == 0 )

{

int r = tolower(*s1++) - tolower(*s2++);

throw NullPointer();

if (r)

return r;

}

return 0;

_rep->c16a.clear();

_convertAndAppend(str, _rep->c16a, 0, 1);

return *this;

}

Boolean String::equal(const String& x, const String& y)

String& String::assign(const char* str, Uint32 n)

{

if (x.size() != y.size())

if ( str == 0 )

return false;

{

throw NullPointer();

}

return String::compare(x.getData(), y.getData(), x.size()) == 0;

_rep->c16a.clear();

_convertAndAppend(str, _rep->c16a, n, 0);

return *this;

}

Boolean String::equal(const String& x, const Char16* y)

void String::clear()

{

if (x.size() != StrLen(y))

_rep->c16a.clear();

return false;

_rep->c16a.append('\0');

}

return String::compare(x.getData(), y, x.size()) == 0;

void String::reserveCapacity(Uint32 capacity)

{

_rep->c16a.reserveCapacity(capacity + 1);

}

Boolean String::equal(const Char16* x, const String& y)

Uint32 String::size() const

{

return equal(y, x);

//#if defined (PEGASUS_OS_VMS)

// This prevents returning a minus number.

// Seems as though the first time through

// the XML parser something doesn't get

// initialized and there is no check for

// a negative number in the parser!

// Uint32 foo;

// foo = _rep->c16a.size();

// if (foo == 0)

// {

// return 0;

// }

// else

// {

// return (foo -1);

// }

//#else

return _rep->c16a.size() - 1;

//#endif

}

Boolean String::equal(const String& x, const char* y)

const Char16* String::getChar16Data() const

{

return equal(x, String(y));

return _rep->c16a.getData();

}

Boolean String::equal(const char* x, const String& y)

Char16& String::operator[](Uint32 index)

{

return equal(String(x), y);

if (index > size())

throw IndexOutOfBoundsException();

return _rep->c16a[index];

}

Boolean String::equalNoCase(const String& x, const String& y)

const Char16 String::operator[](Uint32 index) const

{

if (x.size() != y.size())

if (index > size())

return false;

throw IndexOutOfBoundsException();

const Char16* p = x.getData();

return _rep->c16a[index];

const Char16* q = y.getData();

}

Uint32 n = x.size();

String& String::append(const Char16& c)

{

_rep->c16a.insert(_rep->c16a.size() - 1, c);

return *this;

}

while (n--)

String& String::append(const Char16* str, Uint32 n)

{

if (*p <= 127 && *q <= 127)

if (str == 0)

{

if (tolower(*p++) != tolower(*q++))

throw NullPointer();

return false;

}

else if (*p++ != *q++)

return false;

_rep->c16a.reserveCapacity(_rep->c16a.size() + n);

_rep->c16a.remove(_rep->c16a.size() - 1);

_rep->c16a.append(str, n);

_rep->c16a.append('\0');

return *this;

}

return true;

String& String::append(const String& str)

{

return append(str.getChar16Data(), str.size());

}

void String::remove(Uint32 index, Uint32 size)

{

if (size == PEG_NOT_FOUND)

size = this->size() - index;

if (index + size > this->size())

throw IndexOutOfBoundsException();

if (size)

_rep->c16a.remove(index, size);

}

String String::subString(Uint32 pos, Uint32 length) const

String String::subString(Uint32 index, Uint32 length) const

{

if (pos < size())

if (index < size())

{

if (length == PEG_NOT_FOUND)

if ((length == PEG_NOT_FOUND) || (length > size() - index))

length = size() - pos;

length = size() - index;

return String(getData() + pos, length);

return String(getChar16Data() + index, length);

}

else

return String();

}

Uint32 String::find(Char16 c) const

{

const Char16* first = getData();

const Char16* first = getChar16Data();

for (const Char16* p = first; *p; p++)

{

Line 347

Line 480

return PEG_NOT_FOUND;

}

Uint32 String::find(Uint32 index, Char16 c) const

{

const Char16* data = getChar16Data();

for (Uint32 i = index, n = size(); i < n; i++)

{

if (data[i] == c)

return i;

}

return PEG_NOT_FOUND;

}

Uint32 String::find(const String& s) const

{

const Char16* pSubStr = s.getData();

const Char16* pSubStr = s.getChar16Data();

const Char16* pStr = getData();

const Char16* pStr = getChar16Data();

Uint32 subStrLen = s.size();

Uint32 strLen = size();

if (subStrLen > strLen)

{

return PEG_NOT_FOUND;

}

// loop to find first char match

Uint32 loc = 0;

for( ; loc <= (strLen-subStrLen); loc++)

Line 367

Line 518

Uint32 i = 1;

for (; i < subStrLen; i++)

if (*pStr++ != *p++ )

{pStr--; break;} // break from loop

{pStr-=i; break;} // break from loop

if (i == subStrLen)

return loc;

}

Line 375

Line 526

return PEG_NOT_FOUND;

}

// ATTN:KS 5 apr 2000 Need to add the Char16* version.

Uint32 String::find(const char* s) const

{

return find(String(s));

}

Uint32 String::reverseFind(Char16 c) const

{

const Char16* first = getData();

const Char16* first = getChar16Data();

const Char16* last = getData() + size();

const Char16* last = getChar16Data() + size();

while (last != first)

{

Line 397

Line 542

void String::toLower()

{

for (Char16* p = &_rep[0]; *p; p++)

#ifdef PEGASUS_HAS_ICU

if (InitializeICU::initICUSuccessful())

{

if (*p <= 127)

// This will do a locale-insensitive, but context-sensitive convert.

*p = tolower(*p);

// Context-sensitive prevents any optimizations that try to

// convert just the ascii before calling ICU.

// The string may shrink or expand after the convert.

int32_t sz = size();

UChar* destbuf = new UChar[sz + 1];

const UChar* srcbuf = (const UChar *)getChar16Data();

UErrorCode err = U_ZERO_ERROR;

int32_t needed = u_strToLower(destbuf, sz + 1 , srcbuf, sz, NULL, &err);

if (err == U_BUFFER_OVERFLOW_ERROR)

{

delete [] destbuf;

destbuf = new UChar[needed + 1];

err = U_ZERO_ERROR;

u_strToLower(destbuf, needed + 1 , srcbuf, sz, NULL, &err);

}

if (U_FAILURE(err))

{

delete [] destbuf;

throw Exception(u_errorName(err));

}

void String::translate(Char16 fromChar, Char16 toChar)

if (needed == sz)

{

for (Char16* p = &_rep[0]; *p; p++)

Char16* from = (Char16*)destbuf;

for (Char16* to = &_rep->c16a[0]; *to; to++, from++)

{

if (*p == fromChar)

*to = *from;

*p = toChar;

}

else

{

assign((Char16 *)destbuf, needed);

}

int String::compare(const Char16* s1, const Char16* s2)

delete [] destbuf;

}

else

#endif

{

while (*s1 && *s2)

for (Char16* p = &_rep->c16a[0]; *p; p++)

{

int r = *s1++ - *s2++;

if (*p <= PEGASUS_MAX_PRINTABLE_CHAR)

*p = tolower(*p);

if (r)

}

return r;

}

if (*s2)

void String::toUpper()

return -1;

{

else if (*s1)

#ifdef PEGASUS_HAS_ICU

return 1;

if (InitializeICU::initICUSuccessful())

{

// This will do a locale-insensitive, but context-sensitive convert.

// Context-sensitive prevents any optimizations that try to

// convert just the ascii before calling ICU.

// The string may shrink or expand after the convert.

return 0;

int32_t sz = size();

}

UChar* destbuf = new UChar[sz + 1];

const UChar* srcbuf = (const UChar *)getChar16Data();

UErrorCode err = U_ZERO_ERROR;

PEGASUS_STD(ostream)& operator<<(PEGASUS_STD(ostream)& os, const String& x)

int32_t needed = u_strToUpper(destbuf, sz + 1 , srcbuf, sz, NULL, &err);

if (err == U_BUFFER_OVERFLOW_ERROR)

{

delete [] destbuf;

destbuf = new UChar[needed + 1];

err = U_ZERO_ERROR;

u_strToUpper(destbuf, needed + 1 , srcbuf, sz, NULL, &err);

}

if (U_FAILURE(err))

{

for (Uint32 i = 0, n = x.size(); i < n; i++)

delete [] destbuf;

os << x[i];

throw Exception(u_errorName(err));

}

return os;

if (needed == sz)

{

Char16* from = (Char16*)destbuf;

for (Char16* to = &_rep->c16a[0]; *to; to++, from++)

{

*to = *from;

}

else

{

assign((Char16 *)destbuf, needed);

}

void String::toLower(char* str)

delete [] destbuf;

}

else

#endif

{

for (Char16* p = &_rep->c16a[0]; *p; p++)

{

while (*str)

if (*p <= PEGASUS_MAX_PRINTABLE_CHAR)

tolower(*str++);

*p = toupper(*p);

}

String ToLower(const String& str)

int String::compare(const String& s1, const String& s2, Uint32 n)

{

String tmp(str);

const Char16* s1c16 = s1.getChar16Data();

const Char16* s2c16 = s2.getChar16Data();

for (Uint32 i = 0, n = tmp.size(); i < n; i++)

while (n--)

{

Char16 c = tmp[i];

int r = *s1c16++ - *s2c16++;

if (c <= 127)

if (r)

tmp[i] = tolower(c);

return r;

}

return tmp;

return 0;

}

int CompareNoCase(const char* s1, const char* s2)

int String::compare(const String& s1, const String& s2)

{

while (*s1 && *s2)

const Char16* s1c16 = s1.getChar16Data();

const Char16* s2c16 = s2.getChar16Data();

while (*s1c16 && *s2c16)

{

int r = tolower(*s1++) - tolower(*s2++);

int r = *s1c16++ - *s2c16++;

if (r)

return r;

}

if (*s2)

if (*s2c16)

return -1;

else if (*s1)

else if (*s1c16)

return 1;

return 0;

}

Boolean GetLine(PEGASUS_STD(istream)& is, String& line)

int String::compareNoCase(const String& s1, const String& s2)

{

line.clear();

#ifdef PEGASUS_HAS_ICU

if (InitializeICU::initICUSuccessful())

Boolean gotChar = false;

char c;

while (is.get(c))

{

gotChar = true;

return u_strcasecmp((const UChar*)s1.getChar16Data(),

(const UChar*)s2.getChar16Data(),

U_FOLD_CASE_DEFAULT);

}

#endif

const Char16* _s1 = s1.getChar16Data();

const Char16* _s2 = s2.getChar16Data();

if (c == '\n')

while (*_s1 && *_s2)

break;

{

int r;

line.append(c);

if (*_s1 <= PEGASUS_MAX_PRINTABLE_CHAR &&

*_s2 <= PEGASUS_MAX_PRINTABLE_CHAR)

{

r = tolower(*_s1++) - tolower(*_s2++);

}

else

return gotChar;

{

r = *_s1++ - *_s2++;

}

String::~String()

if (r)

{

return r;

}

String& String::assign(const String& x)

if (*_s2)

{

return -1;

_rep = x._rep;

else if (*_s1)

return *this;

return 1;

return 0;

}

String& String::append(const Char16& c)

Boolean String::equal(const String& str1, const String& str2)

{

_rep.insert(_rep.size() - 1, c);

return String::compare(str1, str2) == 0;

return *this;

}

void String::clear()

Boolean String::equalNoCase(const String& str1, const String& str2)

{

_rep.clear();

#ifdef PEGASUS_HAS_ICU

_rep.append('\0');

return compareNoCase(str1, str2) == 0;

}

#else

if (str1.size() != str2.size())

return false;

void String::reserve(Uint32 capacity)

const Char16* p = str1.getChar16Data();

const Char16* q = str2.getChar16Data();

Uint32 n = str1.size();

while (n--)

{

if (*p <= PEGASUS_MAX_PRINTABLE_CHAR &&

*q <= PEGASUS_MAX_PRINTABLE_CHAR)

{

_rep.reserve(capacity + 1);

if (tolower(*p++) != tolower(*q++))

return false;

}

else if (*p++ != *q++)

return false;

}

const Array<String>& EmptyStringArray()

return true;

{

#endif

static Array<String> tmp;

return tmp;

}

void String::split(const String& line, Array<String>& fields)

CString String::getCString() const

{

fields.clear();

Uint32 n = 3*size() + 1;

char* str = new char[n];

for (const Char16* p = line.getData(); *p; p++)

const Char16* msg16 = getChar16Data();

const Uint16 *strsrc = (Uint16 *)msg16;

Uint16 *endsrc = (Uint16 *)&msg16[size()+1];

Uint8 *strtgt = (Uint8 *)str;

Uint8 *endtgt = (Uint8 *)&str[n];

UTF16toUTF8 (&strsrc,

endsrc,

&strtgt,

endtgt);

char* str1 = new char[strlen(str)+1];

strcpy(str1,str);

delete [] str;

return CString(str1);

}

#if 0

// ATTN-RK-P3-20020603: This code is not completely correct

// Wildcard String matching function that may be useful in the future

// The following code was provided by Bob Blair.

/* _StringMatch Match input MatchString against a GLOB style pattern

Note that MatchChar is the char type so that this source

in portable to different string types. This is an internal function

Results: The return value is 1 if string matches pattern, and

0 otherwise. The matching operation permits the following

special characters in the pattern: *?\[] (see the manual

entry for details on what these mean).

Side effects: None.

/* MatchChar defined as a separate entity because this function source used

elsewhere was an unsigned char *. Here we use Uint16 to maintain 16 bit

size.

typedef Uint16 MatchChar;

inline Uint16 _ToLower(Uint16 ch)

{

// ICU_TODO: If ICU is available we should do this the correct way.

return ch <= PEGASUS_MAX_PRINTABLE_CHAR ? tolower(char(ch)) : ch;

}

inline Boolean _Equal(MatchChar ch1, MatchChar ch2, int nocase)

{

// ICU_TODO: If ICU is available we should do this the correct way.

if (nocase)

return _ToLower(ch1) == _ToLower(ch2);

return ch1 == ch2;

}

static const MatchChar *

_matchrange(const MatchChar *range, MatchChar c, int nocase)

{

const MatchChar *p = range;

const MatchChar *rstart = range + 1;

const MatchChar *rend = 0;

MatchChar compchar;

for (rend = rstart; *rend && *rend != ']'; rend++);

if (*rend == ']') { // if there is an end to this pattern

for (compchar = *rstart; rstart != rend; rstart++) {

if (_Equal(*rstart, c, nocase))

return ++rend;

if (*rstart == '-') {

rstart++;

if (c >= compchar && c <= *rstart)

return ++rend;

}

return (const MatchChar *)0;

}

static int

_StringMatch(

const MatchChar *testString,

const MatchChar *pattern,

int nocase ) /* Ignore case if this is true */

{

const MatchChar *pat = pattern;

const MatchChar *str = testString;

unsigned int done = 0;

unsigned int res = 0; // the result: 1 == match

while (!done) { // main loop walks through pattern and test string

//cerr << "Comparing <" << *pat << "> and <" << *str << ">" << endl;

if (!*pat) { //end of pattern

done = 1; // we're done

if (!*str) //end of test, too?

res = 1; // then we matched

} else { //Not end of pattern

if (!*str) { // but end of test

done = 1; // We're done

if (*pat == '*') // If pattern openends

res = 1; // then we matched

} else { //Not end of test

if (*pat == '*') { //Ambiguuity found

if (!*++pat) { //and it ends pattern

done = 1; // then we're done

res = 1; // and match

} else { //if it doesn't end

while (!done) { // until we're done

if (_StringMatch(str, pat, nocase)) { // we recurse

done = 1; //if it recurses true

res = 1; // we done and match

} else { //it recurses false

if (!*str) // see if test is done

done = 1; // yes: we done

else // not done:

str++; // keep testing

} // end test on recursive call

} // end looping on recursive calls

} // end logic when pattern is ambiguous

} else { //pattern not ambiguus

if (*pat == '?') { //pattern is 'any'

pat++, str++; // so move along

} else if (*pat == '[') { //see if it's a range

pat = _matchrange(pat, *str, nocase); // and is a match

if (!pat) { //It is not a match

done = 1; // we're done

res = 0; // no match

} else { //Range matches

str++, pat++; // keep going

}

} else { // only case left is individual characters

if (!_Equal(*pat++, *str++, nocase)) // if they don't match

done = 1; // bail.

}

} // end ("pattern is not ambiguous (*)" logic

} // end logic when pattern and string still have data

} // end logic when pattern still has data

} // end main loop

return res;

}

/** match matches a string against a GLOB style pattern.

Return trues if the String parameter matches the pattern. C-Shell style

glob matching is used.

@param str String to be matched against the pattern

@param pattern Pattern to use in the match

@return Boolean true if str matches pattern

The pattern definition is as follows:

<pre>

* Matches any number of any characters

? Match exactly one character

[chars] Match any character in chars

[chara-charb] Match any character in the range between chara and charb

</pre>

The literal characters *, ?, [, ] can be included in a string by

escaping them with backslash "\". Ranges of characters can be concatenated.

<pre>

examples:

Boolean result = String::match("This is a test", "*is*");

Boolean works = String::match("abcdef123", "*[0-9]");

</pre>

Boolean String::match(const String& str, const String& pattern)

{

return _StringMatch(

(Uint16*)str.getChar16Data(), (Uint16*)pattern.getChar16Data(), 0) != 0;

}

/** matchNoCase Matches a String against a GLOB style pattern independent

of case.

Returns true if the str parameter matches the pattern. C-Shell style

glob matching is used. Ignore case in all comparisons. Case is

ignored in the match.

@parm str String containing the string to be matched\

@parm pattern GLOB style patterh to use in the match.

@return Boolean true if str matches patterh

@see match

Boolean String::matchNoCase(const String& str, const String& pattern)

{

_SkipWhitespace(p);

return _StringMatch(

(Uint16*)str.getChar16Data(), (Uint16*)pattern.getChar16Data(), 1) != 0;

}

#endif

if (!*p)

break;

String field;

///////////////////////////////////////////////////////////////////////////////

// String-related functions

///////////////////////////////////////////////////////////////////////////////

if (*p == '"')

Boolean operator==(const String& str1, const String& str2)

{

p++;

return String::equal(str1, str2);

}

for (; *p && *p != '"'; p++)

Boolean operator==(const String& str1, const char* str2)

{

if (*p == '\\')

return String::equal(str1, str2);

}

Boolean operator==(const char* str1, const String& str2)

{

p++;

return String::equal(str1, str2);

}

switch (*p)

Boolean operator!=(const String& str1, const String& str2)

{

case '\0':

return !String::equal(str1, str2);

break;

}

case 'n':

PEGASUS_STD(ostream)& operator<<(PEGASUS_STD(ostream)& os, const String& str)

field.append('\n');

{

break;

case 't':

#if defined(PEGASUS_OS_OS400)

field.append('\t');

CString cstr = str.getCString();

break;

const char* utf8str = cstr;

case 'r':

os << utf8str;

field.append('\r');

break;

case 'f':

#elif defined(PEGASUS_HAS_ICU)

field.append('\f');

if (InitializeICU::initICUSuccessful())

break;

{

char *buf = NULL;

const int size = str.size() * 6;

UnicodeString UniStr((const UChar *)str.getChar16Data(), (int32_t)str.size());

Uint32 bufsize = UniStr.extract(0,size,buf);

default:

buf = new char[bufsize+1];

field.append(*p);

UniStr.extract(0,bufsize,buf);

}

os << buf;

os.flush();

delete [] buf;

}

else

field.append(*p);

#endif // End of PEGASUS_HAS_ICU #else leg.

}

{

for (Uint32 i = 0, n = str.size(); i < n; i++)

{

Uint16 code = str[i];

fields.append(field);

if (code > 0 && code <= PEGASUS_MAX_PRINTABLE_CHAR)

{

os << char(code);

}

else

{

for (; *p && !isspace(*p); p++)

// Print in hex format:

field.append(*p);

char buffer[8];

sprintf(buffer, "\\x%04X", code);

fields.append(field);

os << buffer;

}

if (!*p)

break;

}

void String::join(Array<String>& fields, String& line)

return os;

{

for (Uint32 i = 0, n = fields.size(); i < n; i++)

{

String tmp;

Boolean hasSpaces = escape(fields[i], tmp);

if (hasSpaces)

line += '"';

line += tmp;

if (hasSpaces)

line += '"';

if (i + 1 != n)

line += ' ';

}

Boolean String::escape(const String& in, String& out)

String operator+(const String& str1, const String& str2)

{

Boolean hasSpaces = false;

return String(str1).append(str2);

}

out.reserve(out.size() + (2 * in.size()));

for (Uint32 i = 0, n = in.size(); i < n; i++)

Boolean operator<(const String& str1, const String& str2)

{

Char16 c = in[i];

return String::compare(str1, str2) < 0;

}

switch (c)

Boolean operator<=(const String& str1, const String& str2)

{

case '\n':

return String::compare(str1, str2) <= 0;

out += "\\n";

break;

case '\t':

out += "\\t";

break;

case '\r':

out += "\\r";

break;

case '\f':

out += "\\f";

break;

case '\"':

out += "\\\"";

break;

default:

out += c;

if (!hasSpaces)

hasSpaces = c == ' ';

break;

}

Boolean operator>(const String& str1, const String& str2)

{

return String::compare(str1, str2) > 0;

}

return hasSpaces;

Boolean operator>=(const String& str1, const String& str2)

{

return String::compare(str1, str2) >= 0;

}

PEGASUS_NAMESPACE_END

Legend:

Removed from v.1.21
changed lines
	Added in v.1.109

No CVS admin address has been configured