pegasus/src/Pegasus/Common/String.cpp - diff

Return to String.cpp CVS log

Up to [Pegasus] / pegasus / src / Pegasus / Common

Diff for /pegasus/src/Pegasus/Common/String.cpp between version 1.111.6.7 and 1.111.6.15

version 1.111.6.7, 2005/10/11 01:44:27

version 1.111.6.15, 2005/10/14 14:09:29

Line 27

//==============================================================================

// Author: Mike Brasher (mbrasher@bmc.com)

// Author: Mike Brasher (mbrasher@austin.rr.com)

// Modified By:

// Roger Kumpf, Hewlett-Packard Company (roger_kumpf@hp.com)

Line 66

//==============================================================================

// Note: this table is much faster than the system toupper(). Please do not

// change.

const Uint8 _toUpperTable[256] =

{

0x00,0x01,0x02,0x03,0x04,0x05,0x06,0x07,

Line 102

Line 105

0xF8,0xF9,0xFA,0xFB,0xFC,0xFD,0xFE,0xFF,

};

// Note: this table is much faster than the system tolower(). Please do not

// change.

const Uint8 _toLowerTable[256] =

{

0x00,0x01,0x02,0x03,0x04,0x05,0x06,0x07,

Line 138

Line 144

0xF8,0xF9,0xFA,0xFB,0xFC,0xFD,0xFE,0xFF,

};

// Converts 16-bit characters to upper case.

// Converts 16-bit characters to upper case. This routine is faster than the

// system toupper(). Please do not change.

// Returns x unchanged when any of its upper eight bits are set (x & 0xFF00);
// otherwise x is in the range 0..255 and is used directly as an index into
// _toUpperTable, whose entry is returned.
inline Uint16 _toUpper(Uint16 x)

{

return (x & 0xFF00) ? x : _toUpperTable[x];

}

// Converts 16-bit characters to lower case.

// Converts 16-bit characters to lower case. This routine is faster than the

// system tolower(). Please do not change.

inline Uint16 _toLower(Uint16 x)

{

return (x & 0xFF00) ? x : _toLowerTable[x];

Line 177

Line 185

template<class P, class Q>

static void _copy(P* p, const Q* q, size_t n)

{

// Use loop unrolling.

// The following employs loop unrolling for efficiency. Please do not

// eliminate.

while (n >= 8)

{

Line 211

Line 220

static Uint16* _find(const Uint16* s, size_t n, Uint16 c)

{

// The following employs loop unrolling for efficiency. Please do not

// eliminate.

while (n >= 4)

{

if (s[0] == c)

Line 292

Line 304

while (n-- && (*s1++ - *s2++) == 0)

;

return s1[-1] - s2[-1];

}

Line 302

Line 312

memcpy(s1, s2, n * sizeof(Uint16));

}

void StrinThrowOutOfBounds()

// Unconditionally throws IndexOutOfBoundsException; never returns normally.
void StringThrowOutOfBounds()

{

throw IndexOutOfBoundsException();

}

#ifdef PEGASUS_STRING_NO_THROW

inline void _checkNullPointer(const void* ptr)

# define _checkNullPointer(ARG) /* empty */

#else

template<class T>

inline void _checkNullPointer(const T* ptr)

{

#ifdef PEGASUS_STRING_NO_THROW

if (!ptr)

throw NullPointer();

}

#endif

}

// Unconditionally throws an Exception constructed from MessageLoaderParms
// holding the key "Common.String.BAD_UTF8", the default message text below,
// and `index` as the single message argument (presumably substituted for $0
// by the message loader -- confirm). Never returns normally.
//
// index: position of the offending byte sequence, as reported by the caller.
static void _StringThrowBadUTF8(Uint32 index)

{

MessageLoaderParms parms(

"Common.String.BAD_UTF8",

"The byte sequence starting at index $0 "

"is not valid UTF-8 encoding.",

index);

throw Exception(parms);

}

static size_t _copyFromUTF8(Uint16* dest, const char* src, size_t n)

static size_t _copyFromUTF8(

Uint16* dest,

const char* src,

size_t n,

size_t& utf8_error_index)

{

Uint16* p = dest;

const Uint8* q = (const Uint8*)src;

Line 400

Line 423

if (c > n || !isValid_U8(q, c) ||

UTF8toUTF16(&q, q + c, &p, p + n) != 0)

{

MessageLoaderParms parms("Common.String.BAD_UTF8",

utf8_error_index = q - (const Uint8*)src;

"The byte sequence starting at index $0 "

return size_t(-1);

"is not valid UTF-8 encoding.",

q - (const Uint8*)src);

throw Exception(parms);

}

n -= c;

Line 418

Line 438

// terminator).

static inline size_t _copyToUTF8(char* dest, const Uint16* src, size_t n)

{

// The following employs loop unrolling for efficiency. Please do not

// eliminate.

const Uint16* q = src;

Uint8* p = (Uint8*)dest;

Line 469

Line 492

return p - (Uint8*)dest;

}

static inline size_t _convert(Uint16* p, const char* q, size_t n)

static inline size_t _convert(

Uint16* p, const char* q, size_t n, size_t& utf8_error_index)

{

#ifdef PEGASUS_STRING_NO_UTF8

_copy(p, q, n);

return n;

#else

return _copyFromUTF8(p, q, n);

return _copyFromUTF8(p, q, n, utf8_error_index);

#endif

}

Line 537

Line 561

StringRep* rep = (StringRep*)::operator new(

sizeof(StringRep) + cap * sizeof(Uint16));

rep->cap = cap;

Atomic_create(&rep->refs, 1);

new(&rep->refs) AtomicInt(1);

return rep;

}

static inline void _reserve(StringRep*& rep, Uint32 cap)

{

if (cap > rep->cap || Atomic_get(&rep->refs) != 1)

if (cap > rep->cap || rep->refs.value() != 1)

{

size_t n = _roundUpToPow2(cap);

StringRep* newRep = StringRep::alloc(n);

Line 579

Line 603

StringRep* StringRep::create(const char* data, size_t size)

{

StringRep* rep = StringRep::alloc(size);

rep->size = _convert((Uint16*)rep->data, data, size);

size_t utf8_error_index;

rep->data[rep->size] = '\0';

rep->size = _convert((Uint16*)rep->data, data, size, utf8_error_index);

return rep;

#ifndef PEGASUS_STRING_NO_THROW

if (rep->size == size_t(-1))

{

StringRep::free(rep);

_StringThrowBadUTF8(utf8_error_index);

}

#endif

rep->data[rep->size] = '\0';

// Creates a StringRep from `size` chars of `data` without any UTF-8 decoding:
// obtains a rep from StringRep::alloc(size), copies the chars element-wise
// into rep->data with _copy(), sets rep->size to `size`, and stores a '\0'
// terminator at rep->data[rep->size]. Returns the new rep.
// NOTE(review): presumably callers guarantee `data` is 7-bit ASCII, since no
// validation is done here -- confirm against call sites.
StringRep* StringRep::createASCII7(const char* data, size_t size)

{

StringRep* rep = StringRep::alloc(size);

_copy((Uint16*)rep->data, data, size);

// Assigns rep->size and uses the assigned value as the terminator index.
rep->data[rep->size = size] = '\0';

return rep;

}

Line 634

Line 660

String::String(const char* str)

{

_checkNullPointer(str);

_rep = StringRep::create(str, strlen(str));

}

String::String(const char* str, String::ASCII7Tag tag)

// Set this just in case create() throws an exception.

{

_rep = &StringRep::_emptyRep;

_checkNullPointer(str);

_rep = StringRep::create(str, strlen(str));

_rep = StringRep::createASCII7(str, strlen(str));

}

String::String(const char* str, Uint32 n)

{

_checkNullPointer(str);

_rep = StringRep::create(str, n);

}

String::String(const char* str, size_t n, String::ASCII7Tag tag)

// Set this just in case create() throws an exception.

{

_rep = &StringRep::_emptyRep;

_checkNullPointer(str);

_rep = StringRep::create(str, n);

_rep = StringRep::createASCII7(str, n);

}

String::String(const String& s1, const String& s2)

Line 674

Line 694

size_t n2 = strlen(s2);

_rep = StringRep::alloc(n1 + n2);

_copy(_rep->data, s1._rep->data, n1);

_rep->size = n1 + _convert((Uint16*)_rep->data + n1, s2, n2);

size_t utf8_error_index;

size_t tmp = _convert((Uint16*)_rep->data + n1, s2, n2, utf8_error_index);

#ifndef PEGASUS_STRING_NO_THROW

if (tmp == size_t(-1))

{

StringRep::free(_rep);

_rep = &StringRep::_emptyRep;

_StringThrowBadUTF8(utf8_error_index);

}

#endif

_rep->size = n1 + tmp;

_rep->data[_rep->size] = '\0';

}

Line 684

Line 716

size_t n1 = strlen(s1);

size_t n2 = s2._rep->size;

_rep = StringRep::alloc(n1 + n2);

_rep->size = n2 + _convert((Uint16*)_rep->data, s1, n1);

size_t utf8_error_index;

size_t tmp = _convert((Uint16*)_rep->data, s1, n1, utf8_error_index);

#ifndef PEGASUS_STRING_NO_THROW

if (tmp == size_t(-1))

{

StringRep::free(_rep);

_rep = &StringRep::_emptyRep;

_StringThrowBadUTF8(utf8_error_index);

}

#endif

_rep->size = n2 + tmp;

_copy(_rep->data + n1, s2._rep->data, n2);

_rep->data[_rep->size] = '\0';

}

Line 704

Line 748

{

_checkNullPointer(str);

if (n > _rep->cap || Atomic_get(&_rep->refs) != 1)

if (n > _rep->cap || _rep->refs.value() != 1)

{

StringRep::unref(_rep);

_rep = StringRep::alloc(n);

Line 721

Line 765

{

_checkNullPointer(str);

if (n > _rep->cap || Atomic_get(&_rep->refs) != 1)

if (n > _rep->cap || _rep->refs.value() != 1)

{

StringRep::unref(_rep);

_rep = StringRep::alloc(n);

}

_rep->size = _convert(_rep->data, str, n);

size_t utf8_error_index;

_rep->data[_rep->size] = 0;

_rep->size = _convert(_rep->data, str, n, utf8_error_index);

return *this;

}

String& String::assignASCII7(const char* str, Uint32 n)

#ifndef PEGASUS_STRING_NO_THROW

{

if (_rep->size == size_t(-1))

_checkNullPointer(str);

if (n > _rep->cap || Atomic_get(&_rep->refs) != 1)

{

StringRep::unref(_rep);

StringRep::free(_rep);

_rep = StringRep::alloc(n);

_rep = &StringRep::_emptyRep;

_StringThrowBadUTF8(utf8_error_index);

}

#endif

_copy(_rep->data, str, n);

_rep->data[_rep->size] = 0;

_rep->data[_rep->size = n] = 0;

return *this;

}

Line 753

Line 792

{

if (_rep->size)

{

if (Atomic_get(&_rep->refs) == 1)

if (_rep->refs.value() == 1)

{

_rep->size = 0;

_rep->data[0] = '\0';

Line 773

Line 812

CString String::getCString() const

{

// A UTF8 string can have three times as many characters as its UTF16

// counterpart, so we allocate extra memory for the worst case. In the

// best case, we may need only one third of the memory allocated. But

// downsizing the string afterwards is expensive and unnecessary since

// CString objects are usually short-lived (disappearing after only a few

// instructions). CString objects are typically created on the stack as

// means to obtain a char* pointer.

#ifdef PEGASUS_STRING_NO_UTF8

char* str = (char*)operator new(_rep->size + 1);

_copy(str, _rep->data, _rep->size);

Line 814

Line 861

size_t cap = oldSize + size;

_reserve(_rep, cap);

_rep->size += _convert((Uint16*)_rep->data + oldSize, str, size);

size_t utf8_error_index;

size_t tmp = _convert(

(Uint16*)_rep->data + oldSize, str, size, utf8_error_index);

#ifndef PEGASUS_STRING_NO_THROW

if (tmp == size_t(-1))

{

StringRep::free(_rep);

_rep = &StringRep::_emptyRep;

_StringThrowBadUTF8(utf8_error_index);

}

#endif

_rep->size += tmp;

_rep->data[_rep->size] = '\0';

return *this;

Line 827

Line 887

_checkBounds(index + n, _rep->size);

if (Atomic_get(&_rep->refs) != 1)

if (_rep->refs.value() != 1)

_rep = StringRep::copyOnWrite(_rep);

assert(index + n <= _rep->size);

Line 939

Line 999

if (InitializeICU::initICUSuccessful())

{

if (Atomic_get(&_rep->refs) != 1)

if (_rep->refs.value() != 1)

_rep = StringRep::copyOnWrite(_rep);

// This will do a locale-insensitive, but context-sensitive convert.

Line 974

Line 1034

#endif /* PEGASUS_HAS_ICU */

if (Atomic_get(&_rep->refs) != 1)

if (_rep->refs.value() != 1)

_rep = StringRep::copyOnWrite(_rep);

Uint16* p = _rep->data;

Line 993

Line 1053

if (InitializeICU::initICUSuccessful())

{

if (Atomic_get(&_rep->refs) != 1)

if (_rep->refs.value() != 1)

_rep = StringRep::copyOnWrite(_rep);

// This will do a locale-insensitive, but context-sensitive convert.

Line 1029

Line 1089

#endif /* PEGASUS_HAS_ICU */

if (Atomic_get(&_rep->refs) != 1)

if (_rep->refs.value() != 1)

_rep = StringRep::copyOnWrite(_rep);

Uint16* p = _rep->data;

Line 1104

Line 1164

#else /* PEGASUS_HAS_ICU */

// The following employs loop unrolling for efficiency. Please do not

// eliminate.

Uint16* p = (Uint16*)s1.getChar16Data();

Uint16* q = (Uint16*)s2.getChar16Data();

Uint32 n = s2.size();

Line 1446

Line 1509

(+) [DONE] Check for overflow condition in StringRep::alloc().

-----------

(+) [DONE] Remove tabs (used vim ":set expandtab" and ":retab").

(+) Fix throw-related memory leak.

(+) [DONE] Fix throw-related memory leak.

(+) DOC++ String.h

(+) [DONE] Look at PEP223 for coding security guidelines.

(+) Look at PEP223 for coding security guidelines.

(+) [DONE] Use old AtomicInt for now (split new AtomicInt into another

bug).

(+) Replace AtomicInt with new Atomic implementation.

(+) [DONE] Removed appendASCII() and the ASCII form of the constructor.

(+) Implement Atomic operations for HP.

-----------

(+) Remove tabs.

(+) DOC++ String.h

================================================================================

Legend:

Removed from v.1.111.6.7
changed lines
	Added in v.1.111.6.15

No CVS admin address has been configured