2 * Copyright (C) 2004, 2005, 2006, 2007, 2008 Apple Inc. All rights reserved.
3 * Copyright (C) 2010 Patrick Gansterer <paroga@paroga.com>
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Library General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Library General Public License for more details.
15 * You should have received a copy of the GNU Library General Public License
16 * along with this library; see the file COPYING.LIB. If not, write to
17 * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
18 * Boston, MA 02110-1301, USA.
24 #include "AtomicString.h"
26 #include "StringHash.h"
27 #include <wtf/HashSet.h>
28 #include <wtf/Threading.h>
29 #include <wtf/WTFThreadData.h>
30 #include <wtf/unicode/UTF8.h>
32 #include <libkern/OSAtomic.h>
36 using namespace Unicode
;
38 COMPILE_ASSERT(sizeof(AtomicString
) == sizeof(String
), atomic_string_and_string_must_be_same_size
);
40 class AtomicStringTableLocker
{
41 static OSSpinLock s_stringTableLock
;
43 AtomicStringTableLocker() { OSSpinLockLock(&s_stringTableLock
); }
44 ~AtomicStringTableLocker() { OSSpinLockUnlock(&s_stringTableLock
); }
46 OSSpinLock
AtomicStringTableLocker::s_stringTableLock
= OS_SPINLOCK_INIT
;
48 class AtomicStringTable
{
50 static AtomicStringTable
* create()
52 static AtomicStringTable
* sharedStringTable
= new AtomicStringTable
;
54 WTFThreadData
& data
= wtfThreadData();
55 if (pthread_main_np() || WTF::isWebThread())
56 data
.m_atomicStringTable
= sharedStringTable
;
58 data
.m_atomicStringTable
= new AtomicStringTable
;
60 // The AtomicStringTable is shared between the main UI thread and the
61 // WebThread. We do the following so that its destruction happens only
62 // once - on the main UI thread.
63 if (!WTF::isWebThread())
64 data
.m_atomicStringTableDestructor
= AtomicStringTable::destroy
;
65 return data
.m_atomicStringTable
;
68 HashSet
<StringImpl
*>& table()
74 static void destroy(AtomicStringTable
* table
)
76 HashSet
<StringImpl
*>::iterator end
= table
->m_table
.end();
77 for (HashSet
<StringImpl
*>::iterator iter
= table
->m_table
.begin(); iter
!= end
; ++iter
)
78 (*iter
)->setIsAtomic(false);
82 HashSet
<StringImpl
*> m_table
;
85 static inline HashSet
<StringImpl
*>& stringTable()
87 // Once possible we should make this non-lazy (constructed in WTFThreadData's constructor).
88 AtomicStringTable
* table
= wtfThreadData().atomicStringTable();
90 table
= AtomicStringTable::create();
91 return table
->table();
94 template<typename T
, typename HashTranslator
>
95 static inline PassRefPtr
<StringImpl
> addToStringTable(const T
& value
)
97 pair
<HashSet
<StringImpl
*>::iterator
, bool> addResult
= stringTable().add
<T
, HashTranslator
>(value
);
99 // If the string is newly-translated, then we need to adopt it.
100 // The boolean in the pair tells us if that is so.
101 return addResult
.second
? adoptRef(*addResult
.first
) : *addResult
.first
;
104 struct CStringTranslator
{
105 static unsigned hash(const char* c
)
107 return StringHasher::computeHash(c
);
110 static bool equal(StringImpl
* r
, const char* s
)
112 int length
= r
->length();
113 const UChar
* d
= r
->characters();
114 for (int i
= 0; i
!= length
; ++i
) {
115 unsigned char c
= s
[i
];
122 static void translate(StringImpl
*& location
, const char* const& c
, unsigned hash
)
124 location
= StringImpl::create(c
).leakRef();
125 location
->setHash(hash
);
126 location
->setIsAtomic(true);
130 bool operator==(const AtomicString
& a
, const char* b
)
132 StringImpl
* impl
= a
.impl();
133 if ((!impl
|| !impl
->characters()) && !b
)
135 if ((!impl
|| !impl
->characters()) || !b
)
137 return CStringTranslator::equal(impl
, b
);
140 PassRefPtr
<StringImpl
> AtomicString::add(const char* c
)
145 return StringImpl::empty();
147 AtomicStringTableLocker locker
;
148 return addToStringTable
<const char*, CStringTranslator
>(c
);
156 static inline bool equal(StringImpl
* string
, const UChar
* characters
, unsigned length
)
158 if (string
->length() != length
)
161 // FIXME: perhaps we should have a more abstract macro that indicates when
162 // going 4 bytes at a time is unsafe
163 #if CPU(ARM) || CPU(SH4) || CPU(MIPS) || CPU(SPARC)
164 const UChar
* stringCharacters
= string
->characters();
165 for (unsigned i
= 0; i
!= length
; ++i
) {
166 if (*stringCharacters
++ != *characters
++)
171 /* Do it 4-bytes-at-a-time on architectures where it's safe */
173 const uint32_t* stringCharacters
= reinterpret_cast<const uint32_t*>(string
->characters());
174 const uint32_t* bufferCharacters
= reinterpret_cast<const uint32_t*>(characters
);
176 unsigned halfLength
= length
>> 1;
177 for (unsigned i
= 0; i
!= halfLength
; ++i
) {
178 if (*stringCharacters
++ != *bufferCharacters
++)
182 if (length
& 1 && *reinterpret_cast<const uint16_t*>(stringCharacters
) != *reinterpret_cast<const uint16_t*>(bufferCharacters
))
189 bool operator==(const AtomicString
& string
, const Vector
<UChar
>& vector
)
191 return string
.impl() && equal(string
.impl(), vector
.data(), vector
.size());
194 struct UCharBufferTranslator
{
195 static unsigned hash(const UCharBuffer
& buf
)
197 return StringHasher::computeHash(buf
.s
, buf
.length
);
200 static bool equal(StringImpl
* const& str
, const UCharBuffer
& buf
)
202 return WTF::equal(str
, buf
.s
, buf
.length
);
205 static void translate(StringImpl
*& location
, const UCharBuffer
& buf
, unsigned hash
)
207 location
= StringImpl::create(buf
.s
, buf
.length
).leakRef();
208 location
->setHash(hash
);
209 location
->setIsAtomic(true);
213 struct HashAndCharacters
{
215 const UChar
* characters
;
219 struct HashAndCharactersTranslator
{
220 static unsigned hash(const HashAndCharacters
& buffer
)
222 ASSERT(buffer
.hash
== StringHasher::computeHash(buffer
.characters
, buffer
.length
));
226 static bool equal(StringImpl
* const& string
, const HashAndCharacters
& buffer
)
228 return WTF::equal(string
, buffer
.characters
, buffer
.length
);
231 static void translate(StringImpl
*& location
, const HashAndCharacters
& buffer
, unsigned hash
)
233 location
= StringImpl::create(buffer
.characters
, buffer
.length
).leakRef();
234 location
->setHash(hash
);
235 location
->setIsAtomic(true);
239 struct HashAndUTF8Characters
{
241 const char* characters
;
243 unsigned utf16Length
;
246 struct HashAndUTF8CharactersTranslator
{
247 static unsigned hash(const HashAndUTF8Characters
& buffer
)
252 static bool equal(StringImpl
* const& string
, const HashAndUTF8Characters
& buffer
)
254 if (buffer
.utf16Length
!= string
->length())
257 const UChar
* stringCharacters
= string
->characters();
259 // If buffer contains only ASCII characters UTF-8 and UTF16 length are the same.
260 if (buffer
.utf16Length
!= buffer
.length
)
261 return equalUTF16WithUTF8(stringCharacters
, stringCharacters
+ string
->length(), buffer
.characters
, buffer
.characters
+ buffer
.length
);
263 for (unsigned i
= 0; i
< buffer
.length
; ++i
) {
264 ASSERT(isASCII(buffer
.characters
[i
]));
265 if (stringCharacters
[i
] != buffer
.characters
[i
])
272 static void translate(StringImpl
*& location
, const HashAndUTF8Characters
& buffer
, unsigned hash
)
275 location
= StringImpl::createUninitialized(buffer
.utf16Length
, target
).releaseRef();
277 const char* source
= buffer
.characters
;
278 if (convertUTF8ToUTF16(&source
, source
+ buffer
.length
, &target
, target
+ buffer
.utf16Length
) != conversionOK
)
279 ASSERT_NOT_REACHED();
281 location
->setHash(hash
);
282 location
->setIsAtomic(true);
286 PassRefPtr
<StringImpl
> AtomicString::add(const UChar
* s
, unsigned length
)
292 return StringImpl::empty();
294 UCharBuffer buffer
= { s
, length
};
295 AtomicStringTableLocker locker
;
296 return addToStringTable
<UCharBuffer
, UCharBufferTranslator
>(buffer
);
299 PassRefPtr
<StringImpl
> AtomicString::add(const UChar
* s
, unsigned length
, unsigned existingHash
)
302 ASSERT(existingHash
);
305 return StringImpl::empty();
307 HashAndCharacters buffer
= { existingHash
, s
, length
};
308 AtomicStringTableLocker locker
;
309 return addToStringTable
<HashAndCharacters
, HashAndCharactersTranslator
>(buffer
);
312 PassRefPtr
<StringImpl
> AtomicString::add(const UChar
* s
)
318 while (s
[length
] != UChar(0))
322 return StringImpl::empty();
324 UCharBuffer buffer
= { s
, length
};
325 AtomicStringTableLocker locker
;
326 return addToStringTable
<UCharBuffer
, UCharBufferTranslator
>(buffer
);
329 PassRefPtr
<StringImpl
> AtomicString::addSlowCase(StringImpl
* r
)
331 if (!r
|| r
->isAtomic())
335 return StringImpl::empty();
337 AtomicStringTableLocker locker
;
338 StringImpl
* result
= *stringTable().add(r
).first
;
340 r
->setIsAtomic(true);
344 AtomicStringImpl
* AtomicString::find(const UChar
* s
, unsigned length
, unsigned existingHash
)
347 ASSERT(existingHash
);
350 return static_cast<AtomicStringImpl
*>(StringImpl::empty());
352 HashAndCharacters buffer
= { existingHash
, s
, length
};
353 AtomicStringTableLocker locker
;
354 HashSet
<StringImpl
*>::iterator iterator
= stringTable().find
<HashAndCharacters
, HashAndCharactersTranslator
>(buffer
);
355 if (iterator
== stringTable().end())
357 return static_cast<AtomicStringImpl
*>(*iterator
);
360 void AtomicString::remove(StringImpl
* r
)
362 AtomicStringTableLocker locker
;
363 stringTable().remove(r
);
366 AtomicString
AtomicString::lower() const
368 // Note: This is a hot function in the Dromaeo benchmark.
369 StringImpl
* impl
= this->impl();
372 RefPtr
<StringImpl
> newImpl
= impl
->lower();
373 if (LIKELY(newImpl
== impl
))
375 return AtomicString(newImpl
);
378 AtomicString
AtomicString::fromUTF8Internal(const char* charactersStart
, const char* charactersEnd
)
380 HashAndUTF8Characters buffer
;
381 buffer
.characters
= charactersStart
;
382 buffer
.hash
= calculateStringHashAndLengthFromUTF8(charactersStart
, charactersEnd
, buffer
.length
, buffer
.utf16Length
);
387 AtomicString atomicString
;
388 AtomicStringTableLocker locker
;
389 atomicString
.m_string
= addToStringTable
<HashAndUTF8Characters
, HashAndUTF8CharactersTranslator
>(buffer
);