blob: 963c527e461932205c7cb330a5121e04847aae1c [file] [log] [blame]
/*
* Copyright (C) 1999-2000 Harri Porten (porten@kde.org)
* Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009 Apple Inc. All rights reserved.
* Copyright (C) 2009 Google Inc. All rights reserved.
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Library General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Library General Public License for more details.
*
* You should have received a copy of the GNU Library General Public License
* along with this library; see the file COPYING.LIB. If not, write to
* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
* Boston, MA 02110-1301, USA.
*
*/
#ifndef UString_h
#define UString_h
#include "Collector.h"
#include "UStringImpl.h"
#include <stdint.h>
#include <string.h>
#include <wtf/Assertions.h>
#include <wtf/CrossThreadRefCounted.h>
#include <wtf/OwnFastMallocPtr.h>
#include <wtf/PassRefPtr.h>
#include <wtf/PtrAndFlags.h>
#include <wtf/RefPtr.h>
#include <wtf/Vector.h>
#include <wtf/unicode/Unicode.h>
#if PLATFORM(QT)
#include <QtCore/qstring.h>
#endif
namespace JSC {
using WTF::PlacementNewAdoptType;
using WTF::PlacementNewAdopt;
class CString {
public:
CString()
: m_length(0)
, m_data(0)
{
}
CString(const char*);
CString(const char*, size_t);
CString(const CString&);
~CString();
static CString adopt(char*, size_t); // buffer should be allocated with new[].
CString& append(const CString&);
CString& operator=(const char* c);
CString& operator=(const CString&);
CString& operator+=(const CString& c) { return append(c); }
size_t size() const { return m_length; }
const char* c_str() const { return m_data; }
private:
size_t m_length;
char* m_data;
};
bool operator==(const CString&, const CString&);
typedef Vector<char, 32> CStringBuffer;
class UString {
friend class JIT;
public:
#if PLATFORM(QT)
operator QT_PREPEND_NAMESPACE(QString)() const
{
return QT_PREPEND_NAMESPACE(QString)(reinterpret_cast<const QT_PREPEND_NAMESPACE(QChar)*>(this->data()), this->size());
}
UString(const QT_PREPEND_NAMESPACE(QString)& str)
{
*this = JSC::UString(reinterpret_cast<const UChar*>(str.constData()), str.length());
}
#endif
typedef UStringImpl Rep;
public:
// UString constructors passed char*s assume ISO Latin-1 encoding; for UTF8 use 'createFromUTF8', below.
UString();
UString(const char*); // Constructor for null-terminated string.
UString(const char*, int length);
UString(const UChar*, int length);
UString(const Vector<UChar>& buffer);
UString(const UString& s)
: m_rep(s.m_rep)
{
}
// Special constructor for cases where we overwrite an object in place.
UString(PlacementNewAdoptType)
: m_rep(PlacementNewAdopt)
{
}
~UString()
{
}
template<size_t inlineCapacity>
static PassRefPtr<UStringImpl> adopt(Vector<UChar, inlineCapacity>& vector)
{
return Rep::adopt(vector);
}
static UString createFromUTF8(const char*);
static UString from(int);
static UString from(long long);
static UString from(unsigned int);
static UString from(long);
static UString from(double);
struct Range {
public:
Range(int pos, int len)
: position(pos)
, length(len)
{
}
Range()
{
}
int position;
int length;
};
UString spliceSubstringsWithSeparators(const Range* substringRanges, int rangeCount, const UString* separators, int separatorCount) const;
UString replaceRange(int rangeStart, int RangeEnd, const UString& replacement) const;
bool getCString(CStringBuffer&) const;
// NOTE: This method should only be used for *debugging* purposes as it
// is neither Unicode safe nor free from side effects nor thread-safe.
char* ascii() const;
/**
* Convert the string to UTF-8, assuming it is UTF-16 encoded.
* In non-strict mode, this function is tolerant of badly formed UTF-16, it
* can create UTF-8 strings that are invalid because they have characters in
* the range U+D800-U+DDFF, U+FFFE, or U+FFFF, but the UTF-8 string is
* guaranteed to be otherwise valid.
* In strict mode, error is returned as null CString.
*/
CString UTF8String(bool strict = false) const;
UString& operator=(const char*c);
const UChar* data() const { return m_rep->data(); }
bool isNull() const { return m_rep == &Rep::null(); }
bool isEmpty() const { return !m_rep->size(); }
bool is8Bit() const;
int size() const { return m_rep->size(); }
UChar operator[](int pos) const;
double toDouble(bool tolerateTrailingJunk, bool tolerateEmptyString) const;
double toDouble(bool tolerateTrailingJunk) const;
double toDouble() const;
uint32_t toUInt32(bool* ok = 0) const;
uint32_t toUInt32(bool* ok, bool tolerateEmptyString) const;
uint32_t toStrictUInt32(bool* ok = 0) const;
unsigned toArrayIndex(bool* ok = 0) const;
int find(const UString& f, int pos = 0) const;
int find(UChar, int pos = 0) const;
int rfind(const UString& f, int pos) const;
int rfind(UChar, int pos) const;
UString substr(int pos = 0, int len = -1) const;
static const UString& null() { return *nullUString; }
Rep* rep() const { return m_rep.get(); }
static Rep* nullRep();
UString(PassRefPtr<Rep> r)
: m_rep(r)
{
ASSERT(m_rep);
}
size_t cost() const { return m_rep->cost(); }
private:
void makeNull();
RefPtr<Rep> m_rep;
static UString* nullUString;
friend void initializeUString();
friend bool operator==(const UString&, const UString&);
};
ALWAYS_INLINE bool operator==(const UString& s1, const UString& s2)
{
int size = s1.size();
switch (size) {
case 0:
return !s2.size();
case 1:
return s2.size() == 1 && s1.data()[0] == s2.data()[0];
case 2: {
if (s2.size() != 2)
return false;
const UChar* d1 = s1.data();
const UChar* d2 = s2.data();
return (d1[0] == d2[0]) & (d1[1] == d2[1]);
}
default:
return s2.size() == size && memcmp(s1.data(), s2.data(), size * sizeof(UChar)) == 0;
}
}
inline bool operator!=(const UString& s1, const UString& s2)
{
return !JSC::operator==(s1, s2);
}
bool operator<(const UString& s1, const UString& s2);
bool operator>(const UString& s1, const UString& s2);
bool operator==(const UString& s1, const char* s2);
inline bool operator!=(const UString& s1, const char* s2)
{
return !JSC::operator==(s1, s2);
}
inline bool operator==(const char *s1, const UString& s2)
{
return operator==(s2, s1);
}
inline bool operator!=(const char *s1, const UString& s2)
{
return !JSC::operator==(s1, s2);
}
int compare(const UString&, const UString&);
inline UString::UString()
: m_rep(&Rep::null())
{
}
// Rule from ECMA 15.2 about what an array index is.
// Must exactly match string form of an unsigned integer, and be less than 2^32 - 1.
inline unsigned UString::toArrayIndex(bool* ok) const
{
unsigned i = toStrictUInt32(ok);
if (ok && i >= 0xFFFFFFFFU)
*ok = false;
return i;
}
// We'd rather not do shared substring append for small strings, since
// this runs too much risk of a tiny initial string holding down a
// huge buffer.
// FIXME: this should be size_t but that would cause warnings until we
// fix UString sizes to be size_t instead of int
static const int minShareSize = Heap::minExtraCost / sizeof(UChar);
struct IdentifierRepHash : PtrHash<RefPtr<JSC::UString::Rep> > {
static unsigned hash(const RefPtr<JSC::UString::Rep>& key) { return key->existingHash(); }
static unsigned hash(JSC::UString::Rep* key) { return key->existingHash(); }
};
void initializeUString();
template<typename StringType>
class StringTypeAdapter {
};
template<>
class StringTypeAdapter<char*> {
public:
StringTypeAdapter<char*>(char* buffer)
: m_buffer((unsigned char*)buffer)
, m_length(strlen(buffer))
{
}
unsigned length() { return m_length; }
void writeTo(UChar* destination)
{
for (unsigned i = 0; i < m_length; ++i)
destination[i] = m_buffer[i];
}
private:
const unsigned char* m_buffer;
unsigned m_length;
};
template<>
class StringTypeAdapter<const char*> {
public:
StringTypeAdapter<const char*>(const char* buffer)
: m_buffer((unsigned char*)buffer)
, m_length(strlen(buffer))
{
}
unsigned length() { return m_length; }
void writeTo(UChar* destination)
{
for (unsigned i = 0; i < m_length; ++i)
destination[i] = m_buffer[i];
}
private:
const unsigned char* m_buffer;
unsigned m_length;
};
template<>
class StringTypeAdapter<UString> {
public:
StringTypeAdapter<UString>(UString& string)
: m_data(string.data())
, m_length(string.size())
{
}
unsigned length() { return m_length; }
void writeTo(UChar* destination)
{
for (unsigned i = 0; i < m_length; ++i)
destination[i] = m_data[i];
}
private:
const UChar* m_data;
unsigned m_length;
};
template<typename StringType1, typename StringType2>
UString makeString(StringType1 string1, StringType2 string2)
{
StringTypeAdapter<StringType1> adapter1(string1);
StringTypeAdapter<StringType2> adapter2(string2);
UChar* buffer;
unsigned length = adapter1.length() + adapter2.length();
PassRefPtr<UStringImpl> resultImpl = UStringImpl::tryCreateUninitialized(length, buffer);
if (!resultImpl)
return UString();
UChar* result = buffer;
adapter1.writeTo(result);
result += adapter1.length();
adapter2.writeTo(result);
return resultImpl;
}
template<typename StringType1, typename StringType2, typename StringType3>
UString makeString(StringType1 string1, StringType2 string2, StringType3 string3)
{
StringTypeAdapter<StringType1> adapter1(string1);
StringTypeAdapter<StringType2> adapter2(string2);
StringTypeAdapter<StringType3> adapter3(string3);
UChar* buffer;
unsigned length = adapter1.length() + adapter2.length() + adapter3.length();
PassRefPtr<UStringImpl> resultImpl = UStringImpl::tryCreateUninitialized(length, buffer);
if (!resultImpl)
return UString();
UChar* result = buffer;
adapter1.writeTo(result);
result += adapter1.length();
adapter2.writeTo(result);
result += adapter2.length();
adapter3.writeTo(result);
return resultImpl;
}
template<typename StringType1, typename StringType2, typename StringType3, typename StringType4>
UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4)
{
StringTypeAdapter<StringType1> adapter1(string1);
StringTypeAdapter<StringType2> adapter2(string2);
StringTypeAdapter<StringType3> adapter3(string3);
StringTypeAdapter<StringType4> adapter4(string4);
UChar* buffer;
unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length();
PassRefPtr<UStringImpl> resultImpl = UStringImpl::tryCreateUninitialized(length, buffer);
if (!resultImpl)
return UString();
UChar* result = buffer;
adapter1.writeTo(result);
result += adapter1.length();
adapter2.writeTo(result);
result += adapter2.length();
adapter3.writeTo(result);
result += adapter3.length();
adapter4.writeTo(result);
return resultImpl;
}
template<typename StringType1, typename StringType2, typename StringType3, typename StringType4, typename StringType5>
UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5)
{
StringTypeAdapter<StringType1> adapter1(string1);
StringTypeAdapter<StringType2> adapter2(string2);
StringTypeAdapter<StringType3> adapter3(string3);
StringTypeAdapter<StringType4> adapter4(string4);
StringTypeAdapter<StringType5> adapter5(string5);
UChar* buffer;
unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length();
PassRefPtr<UStringImpl> resultImpl = UStringImpl::tryCreateUninitialized(length, buffer);
if (!resultImpl)
return UString();
UChar* result = buffer;
adapter1.writeTo(result);
result += adapter1.length();
adapter2.writeTo(result);
result += adapter2.length();
adapter3.writeTo(result);
result += adapter3.length();
adapter4.writeTo(result);
result += adapter4.length();
adapter5.writeTo(result);
return resultImpl;
}
template<typename StringType1, typename StringType2, typename StringType3, typename StringType4, typename StringType5, typename StringType6>
UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5, StringType6 string6)
{
StringTypeAdapter<StringType1> adapter1(string1);
StringTypeAdapter<StringType2> adapter2(string2);
StringTypeAdapter<StringType3> adapter3(string3);
StringTypeAdapter<StringType4> adapter4(string4);
StringTypeAdapter<StringType5> adapter5(string5);
StringTypeAdapter<StringType6> adapter6(string6);
UChar* buffer;
unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length() + adapter6.length();
PassRefPtr<UStringImpl> resultImpl = UStringImpl::tryCreateUninitialized(length, buffer);
if (!resultImpl)
return UString();
UChar* result = buffer;
adapter1.writeTo(result);
result += adapter1.length();
adapter2.writeTo(result);
result += adapter2.length();
adapter3.writeTo(result);
result += adapter3.length();
adapter4.writeTo(result);
result += adapter4.length();
adapter5.writeTo(result);
result += adapter5.length();
adapter6.writeTo(result);
return resultImpl;
}
template<typename StringType1, typename StringType2, typename StringType3, typename StringType4, typename StringType5, typename StringType6, typename StringType7>
UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5, StringType6 string6, StringType7 string7)
{
StringTypeAdapter<StringType1> adapter1(string1);
StringTypeAdapter<StringType2> adapter2(string2);
StringTypeAdapter<StringType3> adapter3(string3);
StringTypeAdapter<StringType4> adapter4(string4);
StringTypeAdapter<StringType5> adapter5(string5);
StringTypeAdapter<StringType6> adapter6(string6);
StringTypeAdapter<StringType7> adapter7(string7);
UChar* buffer;
unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length() + adapter6.length() + adapter7.length();
PassRefPtr<UStringImpl> resultImpl = UStringImpl::tryCreateUninitialized(length, buffer);
if (!resultImpl)
return UString();
UChar* result = buffer;
adapter1.writeTo(result);
result += adapter1.length();
adapter2.writeTo(result);
result += adapter2.length();
adapter3.writeTo(result);
result += adapter3.length();
adapter4.writeTo(result);
result += adapter4.length();
adapter5.writeTo(result);
result += adapter5.length();
adapter6.writeTo(result);
result += adapter6.length();
adapter7.writeTo(result);
return resultImpl;
}
template<typename StringType1, typename StringType2, typename StringType3, typename StringType4, typename StringType5, typename StringType6, typename StringType7, typename StringType8>
UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5, StringType6 string6, StringType7 string7, StringType8 string8)
{
StringTypeAdapter<StringType1> adapter1(string1);
StringTypeAdapter<StringType2> adapter2(string2);
StringTypeAdapter<StringType3> adapter3(string3);
StringTypeAdapter<StringType4> adapter4(string4);
StringTypeAdapter<StringType5> adapter5(string5);
StringTypeAdapter<StringType6> adapter6(string6);
StringTypeAdapter<StringType7> adapter7(string7);
StringTypeAdapter<StringType8> adapter8(string8);
UChar* buffer;
unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length() + adapter6.length() + adapter7.length() + adapter8.length();
PassRefPtr<UStringImpl> resultImpl = UStringImpl::tryCreateUninitialized(length, buffer);
if (!resultImpl)
return UString();
UChar* result = buffer;
adapter1.writeTo(result);
result += adapter1.length();
adapter2.writeTo(result);
result += adapter2.length();
adapter3.writeTo(result);
result += adapter3.length();
adapter4.writeTo(result);
result += adapter4.length();
adapter5.writeTo(result);
result += adapter5.length();
adapter6.writeTo(result);
result += adapter6.length();
adapter7.writeTo(result);
result += adapter7.length();
adapter8.writeTo(result);
return resultImpl;
}
} // namespace JSC
namespace WTF {
template<typename T> struct DefaultHash;
template<typename T> struct StrHash;
template<> struct StrHash<JSC::UString::Rep*> {
static unsigned hash(const JSC::UString::Rep* key) { return key->hash(); }
static bool equal(const JSC::UString::Rep* a, const JSC::UString::Rep* b) { return JSC::equal(a, b); }
static const bool safeToCompareToEmptyOrDeleted = false;
};
template<> struct StrHash<RefPtr<JSC::UString::Rep> > : public StrHash<JSC::UString::Rep*> {
using StrHash<JSC::UString::Rep*>::hash;
static unsigned hash(const RefPtr<JSC::UString::Rep>& key) { return key->hash(); }
using StrHash<JSC::UString::Rep*>::equal;
static bool equal(const RefPtr<JSC::UString::Rep>& a, const RefPtr<JSC::UString::Rep>& b) { return JSC::equal(a.get(), b.get()); }
static bool equal(const JSC::UString::Rep* a, const RefPtr<JSC::UString::Rep>& b) { return JSC::equal(a, b.get()); }
static bool equal(const RefPtr<JSC::UString::Rep>& a, const JSC::UString::Rep* b) { return JSC::equal(a.get(), b); }
static const bool safeToCompareToEmptyOrDeleted = false;
};
template<> struct DefaultHash<JSC::UString::Rep*> {
typedef StrHash<JSC::UString::Rep*> Hash;
};
template<> struct DefaultHash<RefPtr<JSC::UString::Rep> > {
typedef StrHash<RefPtr<JSC::UString::Rep> > Hash;
};
} // namespace WTF
#endif