2 * Copyright (C) 1999 Lars Knoll (knoll@kde.org)
3 * (C) 1999 Antti Koivisto (koivisto@kde.org)
4 * (C) 2001 Dirk Mueller ( mueller@kde.org )
5 * Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008, 2009 Apple Inc. All rights reserved.
6 * Copyright (C) 2006 Andrew Wellington (proton@wiretapped.net)
8 * This library is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Library General Public
10 * License as published by the Free Software Foundation; either
11 * version 2 of the License, or (at your option) any later version.
13 * This library is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Library General Public License for more details.
18 * You should have received a copy of the GNU Library General Public License
19 * along with this library; see the file COPYING.LIB. If not, write to
20 * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
21 * Boston, MA 02110-1301, USA.
26 #include "StringImpl.h"
28 #include "AtomicString.h"
29 #include "StringBuffer.h"
30 #include "StringHash.h"
31 #include <wtf/StdLibExtras.h>
32 #include <wtf/WTFThreadData.h>
35 using namespace Unicode
;
40 static const unsigned minLengthToShare
= 20;
42 StringImpl::~StringImpl()
47 AtomicString::remove(this);
50 wtfThreadData().currentIdentifierTable()->remove(this);
53 BufferOwnership ownership
= bufferOwnership();
54 if (ownership
!= BufferInternal
) {
55 if (ownership
== BufferOwned
) {
56 ASSERT(!m_sharedBuffer
);
58 fastFree(const_cast<UChar
*>(m_data
));
59 } else if (ownership
== BufferSubstring
) {
60 ASSERT(m_substringBuffer
);
61 m_substringBuffer
->deref();
63 ASSERT(ownership
== BufferShared
);
64 ASSERT(m_sharedBuffer
);
65 m_sharedBuffer
->deref();
70 PassRefPtr
<StringImpl
> StringImpl::createUninitialized(unsigned length
, UChar
*& data
)
77 // Allocate a single buffer large enough to contain the StringImpl
78 // struct as well as the data which it contains. This removes one
79 // heap allocation from this call.
80 if (length
> ((std::numeric_limits
<size_t>::max() - sizeof(StringImpl
)) / sizeof(UChar
)))
82 size_t size
= sizeof(StringImpl
) + length
* sizeof(UChar
);
83 StringImpl
* string
= static_cast<StringImpl
*>(fastMalloc(size
));
85 data
= reinterpret_cast<UChar
*>(string
+ 1);
86 return adoptRef(new (string
) StringImpl(length
));
89 PassRefPtr
<StringImpl
> StringImpl::create(const UChar
* characters
, unsigned length
)
91 if (!characters
|| !length
)
95 PassRefPtr
<StringImpl
> string
= createUninitialized(length
, data
);
96 memcpy(data
, characters
, length
* sizeof(UChar
));
100 PassRefPtr
<StringImpl
> StringImpl::create(const char* characters
, unsigned length
)
102 if (!characters
|| !length
)
106 PassRefPtr
<StringImpl
> string
= createUninitialized(length
, data
);
107 for (unsigned i
= 0; i
!= length
; ++i
) {
108 unsigned char c
= characters
[i
];
114 PassRefPtr
<StringImpl
> StringImpl::create(const char* string
)
118 return create(string
, strlen(string
));
121 PassRefPtr
<StringImpl
> StringImpl::create(const UChar
* characters
, unsigned length
, PassRefPtr
<SharedUChar
> sharedBuffer
)
124 ASSERT(minLengthToShare
&& length
>= minLengthToShare
);
125 return adoptRef(new StringImpl(characters
, length
, sharedBuffer
));
128 SharedUChar
* StringImpl::sharedBuffer()
130 if (m_length
< minLengthToShare
)
132 // All static strings are smaller that the minimim length to share.
135 BufferOwnership ownership
= bufferOwnership();
137 if (ownership
== BufferInternal
)
139 if (ownership
== BufferSubstring
)
140 return m_substringBuffer
->sharedBuffer();
141 if (ownership
== BufferOwned
) {
142 ASSERT(!m_sharedBuffer
);
143 m_sharedBuffer
= SharedUChar::create(new SharableUChar(m_data
)).releaseRef();
144 m_refCountAndFlags
= (m_refCountAndFlags
& ~s_refCountMaskBufferOwnership
) | BufferShared
;
147 ASSERT(bufferOwnership() == BufferShared
);
148 ASSERT(m_sharedBuffer
);
149 return m_sharedBuffer
;
152 bool StringImpl::containsOnlyWhitespace()
154 // FIXME: The definition of whitespace here includes a number of characters
155 // that are not whitespace from the point of view of RenderText; I wonder if
156 // that's a problem in practice.
157 for (unsigned i
= 0; i
< m_length
; i
++)
158 if (!isASCIISpace(m_data
[i
]))
163 PassRefPtr
<StringImpl
> StringImpl::substring(unsigned start
, unsigned length
)
165 if (start
>= m_length
)
167 unsigned maxLength
= m_length
- start
;
168 if (length
>= maxLength
) {
173 return create(m_data
+ start
, length
);
176 UChar32
StringImpl::characterStartingAt(unsigned i
)
178 if (U16_IS_SINGLE(m_data
[i
]))
180 if (i
+ 1 < m_length
&& U16_IS_LEAD(m_data
[i
]) && U16_IS_TRAIL(m_data
[i
+ 1]))
181 return U16_GET_SUPPLEMENTARY(m_data
[i
], m_data
[i
+ 1]);
185 PassRefPtr
<StringImpl
> StringImpl::lower()
187 // Note: This is a hot function in the Dromaeo benchmark, specifically the
188 // no-op code path up through the first 'return' statement.
190 // First scan the string for uppercase and non-ASCII characters:
193 const UChar
*end
= m_data
+ m_length
;
194 for (const UChar
* chp
= m_data
; chp
!= end
; chp
++) {
195 if (UNLIKELY(isASCIIUpper(*chp
)))
200 // Nothing to do if the string is all ASCII with no uppercase.
201 if (noUpper
&& !(ored
& ~0x7F))
204 int32_t length
= m_length
;
206 RefPtr
<StringImpl
> newImpl
= createUninitialized(m_length
, data
);
208 if (!(ored
& ~0x7F)) {
209 // Do a faster loop for the case where all the characters are ASCII.
210 for (int i
= 0; i
< length
; i
++) {
212 data
[i
] = toASCIILower(c
);
217 // Do a slower implementation for cases that include non-ASCII characters.
219 int32_t realLength
= Unicode::toLower(data
, length
, m_data
, m_length
, &error
);
220 if (!error
&& realLength
== length
)
222 newImpl
= createUninitialized(realLength
, data
);
223 Unicode::toLower(data
, realLength
, m_data
, m_length
, &error
);
229 PassRefPtr
<StringImpl
> StringImpl::upper()
231 // This function could be optimized for no-op cases the way lower() is,
232 // but in empirical testing, few actual calls to upper() are no-ops, so
233 // it wouldn't be worth the extra time for pre-scanning.
235 PassRefPtr
<StringImpl
> newImpl
= createUninitialized(m_length
, data
);
236 int32_t length
= m_length
;
238 // Do a faster loop for the case where all the characters are ASCII.
240 for (int i
= 0; i
< length
; i
++) {
243 data
[i
] = toASCIIUpper(c
);
248 // Do a slower implementation for cases that include non-ASCII characters.
250 int32_t realLength
= Unicode::toUpper(data
, length
, m_data
, m_length
, &error
);
251 if (!error
&& realLength
== length
)
253 newImpl
= createUninitialized(realLength
, data
);
254 Unicode::toUpper(data
, realLength
, m_data
, m_length
, &error
);
260 PassRefPtr
<StringImpl
> StringImpl::secure(UChar aChar
, bool last
)
262 int length
= m_length
;
263 Vector
<UChar
> data(length
);
265 for (int i
= 0; i
< length
- 1; ++i
)
267 data
[length
- 1] = (last
? aChar
: m_data
[length
- 1]);
272 PassRefPtr
<StringImpl
> StringImpl::foldCase()
275 PassRefPtr
<StringImpl
> newImpl
= createUninitialized(m_length
, data
);
276 int32_t length
= m_length
;
278 // Do a faster loop for the case where all the characters are ASCII.
280 for (int i
= 0; i
< length
; i
++) {
283 data
[i
] = toASCIILower(c
);
288 // Do a slower implementation for cases that include non-ASCII characters.
290 int32_t realLength
= Unicode::foldCase(data
, length
, m_data
, m_length
, &error
);
291 if (!error
&& realLength
== length
)
293 newImpl
= createUninitialized(realLength
, data
);
294 Unicode::foldCase(data
, realLength
, m_data
, m_length
, &error
);
300 PassRefPtr
<StringImpl
> StringImpl::stripWhiteSpace()
306 unsigned end
= m_length
- 1;
308 // skip white space from start
309 while (start
<= end
&& isSpaceOrNewline(m_data
[start
]))
316 // skip white space from end
317 while (end
&& isSpaceOrNewline(m_data
[end
]))
320 if (!start
&& end
== m_length
- 1)
322 return create(m_data
+ start
, end
+ 1 - start
);
325 PassRefPtr
<StringImpl
> StringImpl::removeCharacters(CharacterMatchFunctionPtr findMatch
)
327 const UChar
* from
= m_data
;
328 const UChar
* fromend
= from
+ m_length
;
330 // Assume the common case will not remove any characters
331 while (from
!= fromend
&& !findMatch(*from
))
336 StringBuffer
data(m_length
);
337 UChar
* to
= data
.characters();
338 unsigned outc
= from
- m_data
;
341 memcpy(to
, m_data
, outc
* sizeof(UChar
));
344 while (from
!= fromend
&& findMatch(*from
))
346 while (from
!= fromend
&& !findMatch(*from
))
347 to
[outc
++] = *from
++;
357 PassRefPtr
<StringImpl
> StringImpl::simplifyWhiteSpace()
359 StringBuffer
data(m_length
);
361 const UChar
* from
= m_data
;
362 const UChar
* fromend
= from
+ m_length
;
364 bool changedToSpace
= false;
366 UChar
* to
= data
.characters();
369 while (from
!= fromend
&& isSpaceOrNewline(*from
)) {
371 changedToSpace
= true;
374 while (from
!= fromend
&& !isSpaceOrNewline(*from
))
375 to
[outc
++] = *from
++;
382 if (outc
> 0 && to
[outc
- 1] == ' ')
385 if (static_cast<unsigned>(outc
) == m_length
&& !changedToSpace
)
393 int StringImpl::toIntStrict(bool* ok
, int base
)
395 return charactersToIntStrict(m_data
, m_length
, ok
, base
);
398 unsigned StringImpl::toUIntStrict(bool* ok
, int base
)
400 return charactersToUIntStrict(m_data
, m_length
, ok
, base
);
403 int64_t StringImpl::toInt64Strict(bool* ok
, int base
)
405 return charactersToInt64Strict(m_data
, m_length
, ok
, base
);
408 uint64_t StringImpl::toUInt64Strict(bool* ok
, int base
)
410 return charactersToUInt64Strict(m_data
, m_length
, ok
, base
);
413 intptr_t StringImpl::toIntPtrStrict(bool* ok
, int base
)
415 return charactersToIntPtrStrict(m_data
, m_length
, ok
, base
);
418 int StringImpl::toInt(bool* ok
)
420 return charactersToInt(m_data
, m_length
, ok
);
423 unsigned StringImpl::toUInt(bool* ok
)
425 return charactersToUInt(m_data
, m_length
, ok
);
428 int64_t StringImpl::toInt64(bool* ok
)
430 return charactersToInt64(m_data
, m_length
, ok
);
433 uint64_t StringImpl::toUInt64(bool* ok
)
435 return charactersToUInt64(m_data
, m_length
, ok
);
438 intptr_t StringImpl::toIntPtr(bool* ok
)
440 return charactersToIntPtr(m_data
, m_length
, ok
);
443 double StringImpl::toDouble(bool* ok
)
445 return charactersToDouble(m_data
, m_length
, ok
);
448 float StringImpl::toFloat(bool* ok
)
450 return charactersToFloat(m_data
, m_length
, ok
);
453 static bool equal(const UChar
* a
, const char* b
, int length
)
457 unsigned char bc
= *b
++;
464 bool equalIgnoringCase(const UChar
* a
, const char* b
, unsigned length
)
467 unsigned char bc
= *b
++;
468 if (foldCase(*a
++) != foldCase(bc
))
474 static inline bool equalIgnoringCase(const UChar
* a
, const UChar
* b
, int length
)
477 return umemcasecmp(a
, b
, length
) == 0;
480 int StringImpl::find(const char* chs
, int index
, bool caseSensitive
)
482 if (!chs
|| index
< 0)
485 int chsLength
= strlen(chs
);
486 int n
= m_length
- index
;
493 const char* chsPlusOne
= chs
+ 1;
494 int chsLengthMinusOne
= chsLength
- 1;
496 const UChar
* ptr
= m_data
+ index
- 1;
500 if (*++ptr
== c
&& equal(ptr
+ 1, chsPlusOne
, chsLengthMinusOne
))
501 return m_length
- chsLength
- n
+ 1;
504 UChar lc
= Unicode::foldCase(*chs
);
506 if (Unicode::foldCase(*++ptr
) == lc
&& equalIgnoringCase(ptr
+ 1, chsPlusOne
, chsLengthMinusOne
))
507 return m_length
- chsLength
- n
+ 1;
514 int StringImpl::find(UChar c
, int start
)
516 return WebCore::find(m_data
, m_length
, c
, start
);
519 int StringImpl::find(CharacterMatchFunctionPtr matchFunction
, int start
)
521 return WebCore::find(m_data
, m_length
, matchFunction
, start
);
524 int StringImpl::find(StringImpl
* str
, int index
, bool caseSensitive
)
527 We use a simple trick for efficiency's sake. Instead of
528 comparing strings, we compare the sum of str with that of
529 a part of this string. Only if that matches, we call memcmp
535 int lstr
= str
->m_length
;
536 int lthis
= m_length
- index
;
537 if ((unsigned)lthis
> m_length
)
539 int delta
= lthis
- lstr
;
543 const UChar
* uthis
= m_data
+ index
;
544 const UChar
* ustr
= str
->m_data
;
548 for (int i
= 0; i
< lstr
; i
++) {
554 if (hthis
== hstr
&& memcmp(uthis
+ i
, ustr
, lstr
* sizeof(UChar
)) == 0)
558 hthis
+= uthis
[i
+ lstr
];
563 for (int i
= 0; i
< lstr
; i
++ ) {
564 hthis
+= toASCIILower(uthis
[i
]);
565 hstr
+= toASCIILower(ustr
[i
]);
569 if (hthis
== hstr
&& equalIgnoringCase(uthis
+ i
, ustr
, lstr
))
573 hthis
+= toASCIILower(uthis
[i
+ lstr
]);
574 hthis
-= toASCIILower(uthis
[i
]);
580 int StringImpl::reverseFind(UChar c
, int index
)
582 return WebCore::reverseFind(m_data
, m_length
, c
, index
);
585 int StringImpl::reverseFind(StringImpl
* str
, int index
, bool caseSensitive
)
588 See StringImpl::find() for explanations.
591 int lthis
= m_length
;
595 int lstr
= str
->m_length
;
596 int delta
= lthis
- lstr
;
597 if ( index
< 0 || index
> lthis
|| delta
< 0 )
602 const UChar
*uthis
= m_data
;
603 const UChar
*ustr
= str
->m_data
;
608 for ( i
= 0; i
< lstr
; i
++ ) {
609 hthis
+= uthis
[index
+ i
];
614 if (hthis
== hstr
&& memcmp(uthis
+ i
, ustr
, lstr
* sizeof(UChar
)) == 0)
619 hthis
-= uthis
[i
+ lstr
];
623 for (i
= 0; i
< lstr
; i
++) {
624 hthis
+= toASCIILower(uthis
[index
+ i
]);
625 hstr
+= toASCIILower(ustr
[i
]);
629 if (hthis
== hstr
&& equalIgnoringCase(uthis
+ i
, ustr
, lstr
) )
634 hthis
-= toASCIILower(uthis
[i
+ lstr
]);
635 hthis
+= toASCIILower(uthis
[i
]);
639 // Should never get here.
643 bool StringImpl::endsWith(StringImpl
* m_data
, bool caseSensitive
)
646 int start
= m_length
- m_data
->m_length
;
648 return (find(m_data
, start
, caseSensitive
) == start
);
652 PassRefPtr
<StringImpl
> StringImpl::replace(UChar oldC
, UChar newC
)
657 for (i
= 0; i
!= m_length
; ++i
)
658 if (m_data
[i
] == oldC
)
664 PassRefPtr
<StringImpl
> newImpl
= createUninitialized(m_length
, data
);
666 for (i
= 0; i
!= m_length
; ++i
) {
667 UChar ch
= m_data
[i
];
675 PassRefPtr
<StringImpl
> StringImpl::replace(unsigned position
, unsigned lengthToReplace
, StringImpl
* str
)
677 position
= min(position
, length());
678 lengthToReplace
= min(lengthToReplace
, length() - position
);
679 unsigned lengthToInsert
= str
? str
->length() : 0;
680 if (!lengthToReplace
&& !lengthToInsert
)
684 if ((length() - lengthToReplace
) >= (numeric_limits
<unsigned>::max() - lengthToInsert
))
687 PassRefPtr
<StringImpl
> newImpl
=
688 createUninitialized(length() - lengthToReplace
+ lengthToInsert
, data
);
689 memcpy(data
, characters(), position
* sizeof(UChar
));
691 memcpy(data
+ position
, str
->characters(), lengthToInsert
* sizeof(UChar
));
692 memcpy(data
+ position
+ lengthToInsert
, characters() + position
+ lengthToReplace
,
693 (length() - position
- lengthToReplace
) * sizeof(UChar
));
697 PassRefPtr
<StringImpl
> StringImpl::replace(UChar pattern
, StringImpl
* replacement
)
702 int repStrLength
= replacement
->length();
703 int srcSegmentStart
= 0;
704 unsigned matchCount
= 0;
707 while ((srcSegmentStart
= find(pattern
, srcSegmentStart
)) >= 0) {
712 // If we have 0 matches, we don't have to do any more work
716 if (repStrLength
&& matchCount
> numeric_limits
<unsigned>::max() / repStrLength
)
719 unsigned replaceSize
= matchCount
* repStrLength
;
720 unsigned newSize
= m_length
- matchCount
;
721 if (newSize
>= (numeric_limits
<unsigned>::max() - replaceSize
))
724 newSize
+= replaceSize
;
727 PassRefPtr
<StringImpl
> newImpl
= createUninitialized(newSize
, data
);
729 // Construct the new data
731 int srcSegmentLength
;
735 while ((srcSegmentEnd
= find(pattern
, srcSegmentStart
)) >= 0) {
736 srcSegmentLength
= srcSegmentEnd
- srcSegmentStart
;
737 memcpy(data
+ dstOffset
, m_data
+ srcSegmentStart
, srcSegmentLength
* sizeof(UChar
));
738 dstOffset
+= srcSegmentLength
;
739 memcpy(data
+ dstOffset
, replacement
->m_data
, repStrLength
* sizeof(UChar
));
740 dstOffset
+= repStrLength
;
741 srcSegmentStart
= srcSegmentEnd
+ 1;
744 srcSegmentLength
= m_length
- srcSegmentStart
;
745 memcpy(data
+ dstOffset
, m_data
+ srcSegmentStart
, srcSegmentLength
* sizeof(UChar
));
747 ASSERT(dstOffset
+ srcSegmentLength
== static_cast<int>(newImpl
->length()));
752 PassRefPtr
<StringImpl
> StringImpl::replace(StringImpl
* pattern
, StringImpl
* replacement
)
754 if (!pattern
|| !replacement
)
757 int patternLength
= pattern
->length();
761 int repStrLength
= replacement
->length();
762 int srcSegmentStart
= 0;
763 unsigned matchCount
= 0;
766 while ((srcSegmentStart
= find(pattern
, srcSegmentStart
)) >= 0) {
768 srcSegmentStart
+= patternLength
;
771 // If we have 0 matches, we don't have to do any more work
775 unsigned newSize
= m_length
- matchCount
* patternLength
;
776 if (repStrLength
&& matchCount
> numeric_limits
<unsigned>::max() / repStrLength
)
779 if (newSize
> (numeric_limits
<unsigned>::max() - matchCount
* repStrLength
))
782 newSize
+= matchCount
* repStrLength
;
785 PassRefPtr
<StringImpl
> newImpl
= createUninitialized(newSize
, data
);
787 // Construct the new data
789 int srcSegmentLength
;
793 while ((srcSegmentEnd
= find(pattern
, srcSegmentStart
)) >= 0) {
794 srcSegmentLength
= srcSegmentEnd
- srcSegmentStart
;
795 memcpy(data
+ dstOffset
, m_data
+ srcSegmentStart
, srcSegmentLength
* sizeof(UChar
));
796 dstOffset
+= srcSegmentLength
;
797 memcpy(data
+ dstOffset
, replacement
->m_data
, repStrLength
* sizeof(UChar
));
798 dstOffset
+= repStrLength
;
799 srcSegmentStart
= srcSegmentEnd
+ patternLength
;
802 srcSegmentLength
= m_length
- srcSegmentStart
;
803 memcpy(data
+ dstOffset
, m_data
+ srcSegmentStart
, srcSegmentLength
* sizeof(UChar
));
805 ASSERT(dstOffset
+ srcSegmentLength
== static_cast<int>(newImpl
->length()));
810 bool equal(const StringImpl
* a
, const StringImpl
* b
)
812 return StringHash::equal(a
, b
);
815 bool equal(const StringImpl
* a
, const char* b
)
822 unsigned length
= a
->length();
823 const UChar
* as
= a
->characters();
824 for (unsigned i
= 0; i
!= length
; ++i
) {
825 unsigned char bc
= b
[i
];
835 bool equalIgnoringCase(StringImpl
* a
, StringImpl
* b
)
837 return CaseFoldingHash::equal(a
, b
);
840 bool equalIgnoringCase(StringImpl
* a
, const char* b
)
847 unsigned length
= a
->length();
848 const UChar
* as
= a
->characters();
850 // Do a faster loop for the case where all the characters are ASCII.
853 for (unsigned i
= 0; i
!= length
; ++i
) {
859 equal
= equal
&& (toASCIILower(ac
) == toASCIILower(bc
));
862 // Do a slower implementation for cases that include non-ASCII characters.
865 for (unsigned i
= 0; i
!= length
; ++i
) {
866 unsigned char bc
= b
[i
];
867 equal
= equal
&& (foldCase(as
[i
]) == foldCase(bc
));
871 return equal
&& !b
[length
];
874 bool equalIgnoringNullity(StringImpl
* a
, StringImpl
* b
)
876 if (StringHash::equal(a
, b
))
878 if (!a
&& b
&& !b
->length())
880 if (!b
&& a
&& !a
->length())
886 Vector
<char> StringImpl::ascii()
888 Vector
<char> buffer(m_length
+ 1);
889 for (unsigned i
= 0; i
!= m_length
; ++i
) {
891 if ((c
>= 0x20 && c
< 0x7F) || c
== 0x00)
892 buffer
[i
] = static_cast<char>(c
);
896 buffer
[m_length
] = '\0';
900 WTF::Unicode::Direction
StringImpl::defaultWritingDirection()
902 for (unsigned i
= 0; i
< m_length
; ++i
) {
903 WTF::Unicode::Direction charDirection
= WTF::Unicode::direction(m_data
[i
]);
904 if (charDirection
== WTF::Unicode::LeftToRight
)
905 return WTF::Unicode::LeftToRight
;
906 if (charDirection
== WTF::Unicode::RightToLeft
|| charDirection
== WTF::Unicode::RightToLeftArabic
)
907 return WTF::Unicode::RightToLeft
;
909 return WTF::Unicode::LeftToRight
;
912 // This is a hot function because it's used when parsing HTML.
913 PassRefPtr
<StringImpl
> StringImpl::createStrippingNullCharactersSlowCase(const UChar
* characters
, unsigned length
)
915 StringBuffer
strippedCopy(length
);
916 unsigned strippedLength
= 0;
917 for (unsigned i
= 0; i
< length
; i
++) {
918 if (int c
= characters
[i
])
919 strippedCopy
[strippedLength
++] = c
;
921 ASSERT(strippedLength
< length
); // Only take the slow case when stripping.
922 strippedCopy
.shrink(strippedLength
);
923 return adopt(strippedCopy
);
926 PassRefPtr
<StringImpl
> StringImpl::adopt(StringBuffer
& buffer
)
928 unsigned length
= buffer
.length();
931 return adoptRef(new StringImpl(buffer
.release(), length
));
934 int StringImpl::wordCount(int maxWordsToCount
)
936 unsigned wordCount
= 0;
939 for (i
= 0; i
< m_length
; i
++) {
940 if (u_isspace(m_data
[i
])) {
942 } else if (!atWord
) {
944 if (wordCount
>= (unsigned)maxWordsToCount
)
952 PassRefPtr
<StringImpl
> StringImpl::createWithTerminatingNullCharacter(const StringImpl
& string
)
954 // Use createUninitialized instead of 'new StringImpl' so that the string and its buffer
955 // get allocated in a single malloc block.
957 int length
= string
.m_length
;
958 RefPtr
<StringImpl
> terminatedString
= createUninitialized(length
+ 1, data
);
959 memcpy(data
, string
.m_data
, length
* sizeof(UChar
));
961 terminatedString
->m_length
--;
962 terminatedString
->m_hash
= string
.m_hash
;
963 terminatedString
->m_refCountAndFlags
|= s_refCountFlagHasTerminatingNullCharacter
;
964 return terminatedString
.release();
967 PassRefPtr
<StringImpl
> StringImpl::threadsafeCopy() const
969 return create(m_data
, m_length
);
972 PassRefPtr
<StringImpl
> StringImpl::crossThreadString()
974 if (SharedUChar
* sharedBuffer
= this->sharedBuffer())
975 return adoptRef(new StringImpl(m_data
, m_length
, sharedBuffer
->crossThreadCopy()));
977 // If no shared buffer is available, create a copy.
978 return threadsafeCopy();
981 } // namespace WebCore