pegasus/src/Pegasus/Common/String.cpp - diff

Return to String.cpp CVS log

Up to [Pegasus] / pegasus / src / Pegasus / Common

Diff for /pegasus/src/Pegasus/Common/String.cpp between version 1.56 and 1.95

version 1.56, 2002/08/30 00:51:59

version 1.95, 2004/06/15 18:38:24

Line 1

//%/////////////////////////////////////////////////////////////////////////////

//%2003////////////////////////////////////////////////////////////////////////

// The Open Group, Tivoli Systems

// Company, L. P., IBM Corp., The Open Group, Tivoli Systems.

// IBM Corp.; EMC Corporation, The Open Group.

// Permission is hereby granted, free of charge, to any person obtaining a copy

// of this software and associated documentation files (the "Software"), to

Line 29

Line 31

#include <cctype>

#include <cstring>

#include "String.h"

#include "Array.h"

#include "InternalException.h"

#include <iostream>

#include <fstream>

#include "CommonUTF.h"

#ifdef PEGASUS_HAS_ICU

#include <unicode/unistr.h>

#endif

PEGASUS_USING_STD;

Line 51

Line 61

CString::CString(const CString& cstr)

{

_rep = new char[strlen(cstr._rep)+1];

_rep = 0;

_rep = strcpy(_rep, cstr._rep);

if (cstr._rep)

{

_rep = (void*)new char[strlen((char*)cstr._rep)+1];

strcpy((char*)_rep, (char*)cstr._rep);

}

CString::CString(char* cstr)

Line 63

Line 78

CString::~CString()

{

if (_rep)

delete [] _rep;

{

delete [] (char*)_rep;

}

CString& CString::operator=(const CString& cstr)

{

_rep = new char[strlen(cstr._rep)+1];

if (&cstr != this)

_rep = strcpy(_rep, cstr._rep);

{

if (_rep)

{

delete [] (char*)_rep;

_rep = 0;

}

if (cstr._rep)

{

_rep = (char*)new char[strlen((char*)cstr._rep)+1];

strcpy((char*)_rep, (char*)cstr._rep);

}

return *this;

}

// Conversion operator: hands back the buffer held in _rep as a const char*.
// NOTE(review): this page is a two-revision diff rendered without +/- markers,
// so both revisions' return statements appear below. Presumably the uncast
// form is the older line and the (char*) cast form the newer one -- confirm
// against the CVS log before reading this as a single function body.
CString::operator const char*() const

{

return _rep;

return (char*)_rep;

}

///////////////////////////////////////////////////////////////////////////////

Line 162

Line 190

String::String(const String& str)

{

if (str._rep != NULL)

{

_rep = new StringRep(*str._rep);

}

else

{

_rep = new StringRep();

}

String::String(const String& str, Uint32 n)

{

Line 201

Line 237

// Copy assignment: forwards to assign(str) and yields *this.
// NOTE(review): this page is a two-revision diff rendered without +/- markers.
// The bare "return assign(str);" and the self-assignment-guarded form
// (&str != this) presumably belong to different revisions -- confirm against
// the CVS log before reading this as a single function body.
String& String::operator=(const String& str)

{

return assign(str);

// Guarded form: assign() is skipped when str is this very object.
if (&str != this)

{

assign(str);

}

return *this;

}

String& String::assign(const String& str)

Line 226

Line 266

return *this;

}

// Replaces the stored characters with those of the C string 'str', appending
// each char (terminating NUL included) to the internal c16a array.
// Returns *this.
String& String::assign(const char* str)
{
    _rep->c16a.clear();

    // The count covers the terminating NUL, which is stored as well.
    const Uint32 total = strlen(str) + 1;
    _rep->c16a.reserveCapacity(total);

    for (Uint32 i = 0; i < total; i++)
    {
        _rep->c16a.append(str[i]);
    }

    return *this;
}

// Assigns at most n characters of the C string 'str' to this String and
// returns *this.
// NOTE(review): this page is a two-revision diff rendered without +/- markers,
// so statements from both revisions are interleaved below. Presumably the
// tmpStr/strncpy/assign(tmpStr) lines form one revision and the
// _strnlen/reserveCapacity/append loop forms the other -- confirm against the
// CVS log before reading this as a single function body.
String& String::assign(const char* str, Uint32 n)

{

_rep->c16a.clear();

// Zero-filled scratch buffer of n+1 bytes; strncpy below writes at most n of
// them, so the final byte stays NUL.
char *tmpStr = new char[n+1];

memset(tmpStr,0x00,n+1);

Uint32 _n = _strnlen(str, n);

strncpy(tmpStr,str,n);

_rep->c16a.reserveCapacity(_n + 1);

assign(tmpStr);

// NOTE(review): tmpStr was allocated with new char[n+1]; releasing it with
// scalar delete is a new[]/delete mismatch -- this should be delete [] tmpStr.
delete tmpStr;

// Appends _n characters read from str, followed by an explicit terminator.
while (_n--)

_rep->c16a.append(*str++);

_rep->c16a.append('\0');

return *this;

}

Line 275

Line 299

return _rep->c16a.getData();

}

// Builds a char buffer of size()+1 elements by narrowing every stored 16-bit
// code (terminator included) with char(...), and returns it wrapped in a
// CString. Codes above 0xff are narrowed without any notification.
CString String::getCString() const
{
    const Uint32 count = size() + 1;
    char* narrow = new char[count];
    const Char16* wide = getChar16Data();

    for (Uint32 i = 0; i < count; i++)
    {
        const Uint16 code = wide[i];
        narrow[i] = char(code);
    }

    return CString(narrow);
}

Char16& String::operator[](Uint32 index)

{

if (index > size())

Line 347

Line 352

{

if (index < size())

{

if (length == PEG_NOT_FOUND)

if ((length == PEG_NOT_FOUND) || (length > size() - index))

length = size() - index;

return String(getChar16Data() + index, length);

Line 407

Line 412

Uint32 i = 1;

for (; i < subStrLen; i++)

if (*pStr++ != *p++ )

{pStr--; break;} // break from loop

{pStr-=i; break;} // break from loop

if (i == subStrLen)

return loc;

}

Line 431

Line 436

// Lower-cases this String by delegating to the locale-taking overload with a
// null locale name.
void String::toLower()
{
    const char* const defaultLocale = NULL;
    String::toLower(defaultLocale);
}

void String::toLower(const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr((const UChar *)_rep->c16a.getData());

if(strLocale == NULL)

{

UniStr.toLower();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr.toLower(loc);

}

UniStr.append((UChar)'\0');

assign((Char16*)UniStr.getBuffer());

#else

for (Char16* p = &_rep->c16a[0]; *p; p++)

{

if (*p <= PEGASUS_MAX_PRINTABLE_CHAR)

*p = tolower(*p);

}

#endif

}

void String::toUpper(const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr((const UChar *)_rep->c16a.getData());

if(strLocale == NULL)

{

UniStr.toUpper();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr.toUpper(loc);

}

UniStr.append((UChar)'\0');

assign((Char16*)UniStr.getBuffer());

#else

for (Char16* p = &_rep->c16a[0]; *p; p++)

{

if (*p <= PEGASUS_MAX_PRINTABLE_CHAR)

*p = toupper(*p);

}

#endif

}

int String::compare(const String& s1, const String& s2, Uint32 n)

Line 477

Line 536

// Case-insensitive comparison of s1 and s2: delegates to the locale-taking
// overload with a null locale name and returns its result unchanged.
int String::compareNoCase(const String& s1, const String& s2)
{
    const char* const defaultLocale = NULL;
    return String::compareNoCase(s1, s2, defaultLocale);
}

int String::compareNoCase(const String& s1, const String& s2,const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr1((const UChar *)s1.getChar16Data(), (int32_t)s1.size());

UnicodeString UniStr2((const UChar *)s2.getChar16Data(), (int32_t)s2.size());

if(strLocale == NULL)

{

UniStr1.toLower();

UniStr2.toLower();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr1.toLower(loc);

UniStr2.toLower(loc);

}

// Note: the ICU 2.6.1 documentation for UnicodeString::compare( ) is

// backwards! The API actually returns +1 if this is greater than text.

// This is why the line below appears wrong based on the 2.6.1 docs.

// (ref. bugzilla 1207)

return (UniStr1.compare(UniStr2));

#else

const Char16* _s1 = s1.getChar16Data();

const Char16* _s2 = s2.getChar16Data();

Line 504

Line 593

return 1;

return 0;

#endif

}

Boolean String::equal(const String& str1, const String& str2)

Line 513

Line 603

// Case-insensitive equality test of str1 and str2: delegates to the
// locale-taking overload with a null locale name and returns its result
// unchanged.
Boolean String::equalNoCase(const String& str1, const String& str2)
{
    const char* const defaultLocale = NULL;
    return String::equalNoCase(str1, str2, defaultLocale);
}

Boolean String::equalNoCase(const String& str1, const String& str2,const char * strLocale)

{

#ifdef PEGASUS_HAS_ICU

UnicodeString UniStr1((const UChar *)str1.getChar16Data(), (int32_t)str1.size());

UnicodeString UniStr2((const UChar *)str2.getChar16Data(), (int32_t)str2.size());

if(strLocale == NULL)

{

UniStr1.toLower();

UniStr2.toLower();

}

else

{

Locale loc(strLocale);

if(loc.isBogus())

{

throw InvalidNameException(String(strLocale));

}

UniStr1.toLower(loc);

UniStr2.toLower(loc);

}

return (UniStr1 == UniStr2);

#else

if (str1.size() != str2.size())

return false;

Line 534

Line 650

}

return true;

#endif

}

// UTF8 specific code:

// Replaces the stored characters with the result of running the bytes of the
// C string 'str' (terminating NUL excluded) through UTF8toUTF16(), then
// appends a terminator. Returns *this.
String& String::assign(const char* str)
{
    _rep->c16a.clear();

    // One Char16 slot per input byte, plus one.
    Uint32 capacity = strlen(str) + 1;

    // Source range: the bytes of str up to, but not including, its NUL.
    const Uint8 *srcCursor = (Uint8 *)str;
    Uint8 *srcEnd = (Uint8 *)&str[capacity-1];

    // Target range: the whole scratch array.
    Char16 *utf16 = new Char16[capacity];
    Uint16 *dstCursor = (Uint16 *)utf16;
    Uint16 *dstEnd = (Uint16 *)&utf16[capacity];

    UTF8toUTF16(&srcCursor, srcEnd, &dstCursor, dstEnd);

    // Length of the converted text: stop at the first zero element, and never
    // count more than capacity-1 elements.
    Uint32 length = 0;
    while (((utf16[length]) != Char16(0x00)) && (length < (capacity - 1)))
    {
        ++length;
    }

    _rep->c16a.append(utf16, length);
    _rep->c16a.append('\0');

    delete [] utf16;

    return *this;
}

// Runs the stored 16-bit characters (terminator included) through
// UTF16toUTF8() into a scratch buffer, copies the result into a buffer of
// exactly strlen()+1 bytes, and returns that buffer wrapped in a CString.
CString String::getCString() const
{
    // Scratch space: three bytes per stored character, plus one.
    Uint32 scratchSize = 3*size() + 1;
    char* scratch = new char[scratchSize];

    // Source range spans size()+1 elements, i.e. it includes the terminator.
    const Char16* utf16 = getChar16Data();
    const Uint16 *srcCursor = (Uint16 *)utf16;
    Uint16 *srcEnd = (Uint16 *)&utf16[size()+1];

    Uint8 *dstCursor = (Uint8 *)scratch;
    Uint8 *dstEnd = (Uint8 *)&scratch[scratchSize];

    UTF16toUTF8(&srcCursor, srcEnd, &dstCursor, dstEnd);

    // Shrink to fit, then release the oversized scratch buffer.
    char* exact = new char[strlen(scratch)+1];
    strcpy(exact, scratch);
    delete [] scratch;

    return CString(exact);
}

#if 0

// ATTN-RK-P3-20020603: This code is not completely correct

// Wildcard String matching function that may be useful in the future

// The following code was provided by Bob Blair.

Line 550

Line 723

special characters in the pattern: *?\[] (see the manual

entry for details on what these mean).

Side effects: None.

Line 561

Line 735

// Lower-cases ch via tolower() when it is not above
// PEGASUS_MAX_PRINTABLE_CHAR; any other value is returned unchanged.
inline Uint16 _ToLower(Uint16 ch)
{
    // ICU_TODO: If ICU is available we should do this the correct way.
    if (ch <= PEGASUS_MAX_PRINTABLE_CHAR)
    {
        return tolower(char(ch));
    }
    return ch;
}

inline Boolean _Equal(MatchChar ch1, MatchChar ch2, int nocase)

{

// ICU_TODO: If ICU is available we should do this the correct way.

if (nocase)

return _ToLower(ch1) == _ToLower(ch2);

else

Line 659

Line 835

}

/** match matches a string against a GLOB style pattern.

Returns true if the String parameter matches the pattern. C-Shell style

glob matching is used.

@param str String to be matched against the pattern

@param pattern Pattern to use in the match

@return Boolean true if str matches pattern

The pattern definition is as follows:

<pre>

* Matches any number of any characters

? Match exactly one character

[chars] Match any character in chars

[chara-charb] Match any character in the range between chara and charb

</pre>

The literal characters *, ?, [, ] can be included in a string by

escaping them with backslash "\". Ranges of characters can be concatenated.

<pre>

examples:

Boolean result = String::match("This is a test", "*is*");

Boolean works = String::match("abcdef123", "*[0-9]");

</pre>

// Case-sensitive glob match: passes the character data of str and pattern to
// _StringMatch() with the no-case flag set to 0 and reports whether the
// result is non-zero.
Boolean String::match(const String& str, const String& pattern)
{
    Uint16* subject = (Uint16*)str.getChar16Data();
    Uint16* glob = (Uint16*)pattern.getChar16Data();

    return _StringMatch(subject, glob, 0) != 0;
}

/** matchNoCase Matches a String against a GLOB style pattern independent

of case.

Returns true if the str parameter matches the pattern. C-Shell style

glob matching is used. Ignore case in all comparisons. Case is

ignored in the match.

@param str String containing the string to be matched

@param pattern GLOB style pattern to use in the match.

@return Boolean true if str matches pattern

@SeeAlso match

// Case-insensitive glob match: passes the character data of str and pattern
// to _StringMatch() with the no-case flag set to 1 and reports whether the
// result is non-zero.
Boolean String::matchNoCase(const String& str, const String& pattern)
{
    Uint16* subject = (Uint16*)str.getChar16Data();
    Uint16* glob = (Uint16*)pattern.getChar16Data();

    return _StringMatch(subject, glob, 1) != 0;
}

#endif

///////////////////////////////////////////////////////////////////////////////

Line 700

Line 908

PEGASUS_STD(ostream)& operator<<(PEGASUS_STD(ostream)& os, const String& str)

{

#if defined(PEGASUS_OS_OS400)

CString cstr = str.getCString();

const char* utf8str = cstr;

os << utf8str;

#elif defined(PEGASUS_HAS_ICU)

if(os == cout || os == cerr){

char *buf = NULL;

const int size = str.size() * 6;

UnicodeString UniStr((const UChar *)str.getChar16Data(), (int32_t)str.size());

Uint32 bufsize = UniStr.extract(0,size,buf);

buf = new char[bufsize+1];

UniStr.extract(0,bufsize,buf);

os << buf;

os.flush();

delete [] buf;

}else{

CString cstr = str.getCString();

const char* utf8str = cstr;

os << utf8str;

}

#else

for (Uint32 i = 0, n = str.size(); i < n; i++)

{

Uint16 code = str[i];

Line 716

Line 950

os << buffer;

}

#endif // End of PEGASUS_HAS_ICU #else leg.

return os;

}

Line 745

Line 980

return String::compare(str1, str2) >= 0;

}

// Compares two NUL-terminated C strings, ignoring case as defined by
// tolower().
//
// @param s1 first string (must not be null)
// @param s2 second string (must not be null)
// @return the difference of the first pair of lower-cased characters that
//     differ; otherwise -1 if s1 is a proper prefix of s2, 1 if s2 is a
//     proper prefix of s1, and 0 if both strings are equal ignoring case.
int CompareNoCase(const char* s1, const char* s2)
{
    while (*s1 && *s2)
    {
        // tolower() is only defined for EOF and values representable as
        // unsigned char. Where plain char is signed, a byte >= 0x80 would be
        // passed as a negative int, so convert through unsigned char first.
        const int c1 = tolower(static_cast<unsigned char>(*s1++));
        const int c2 = tolower(static_cast<unsigned char>(*s2++));

        const int r = c1 - c2;

        if (r)
            return r;
    }

    // One string (or both) is exhausted: the shorter one orders first.
    if (*s2)
        return -1;
    else if (*s1)
        return 1;

    return 0;
}

// Returns non-zero (1) when CompareNoCase() reports s1 and s2 as equal,
// and 0 otherwise.
int EqualNoCase(const char* s1, const char* s2)
{
    const int order = CompareNoCase(s1, s2);
    return order == 0;
}

PEGASUS_NAMESPACE_END

Legend:

Removed from v.1.56
changed lines
	Added in v.1.95

No CVS admin address has been configured