/* * Copyright (C) 1999-2000 Harri Porten (porten@kde.org) * Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009 Apple Inc. All rights reserved. * Copyright (C) 2009 Google Inc. All rights reserved. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public License * along with this library; see the file COPYING.LIB. If not, write to * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, * Boston, MA 02110-1301, USA. * */ #ifndef UString_h #define UString_h #include "Collector.h" #include "UStringImpl.h" #include #include #include #include #include #include #include #include #include #include #if PLATFORM(QT) #include #endif namespace JSC { using WTF::PlacementNewAdoptType; using WTF::PlacementNewAdopt; class CString { public: CString() : m_length(0) , m_data(0) { } CString(const char*); CString(const char*, size_t); CString(const CString&); ~CString(); static CString adopt(char*, size_t); // buffer should be allocated with new[]. CString& append(const CString&); CString& operator=(const char* c); CString& operator=(const CString&); CString& operator+=(const CString& c) { return append(c); } size_t size() const { return m_length; } const char* c_str() const { return m_data; } private: size_t m_length; char* m_data; }; bool operator==(const CString&, const CString&); typedef Vector CStringBuffer; class UString { friend class JIT; public: #if PLATFORM(QT) operator QT_PREPEND_NAMESPACE(QString)() const { return QT_PREPEND_NAMESPACE(QString)(reinterpret_cast(this->data()), this->size()); } UString(const QT_PREPEND_NAMESPACE(QString)& str) { *this = JSC::UString(reinterpret_cast(str.constData()), str.length()); } #endif typedef UStringImpl Rep; public: // UString constructors passed char*s assume ISO Latin-1 encoding; for UTF8 use 'createFromUTF8', below. UString(); UString(const char*); // Constructor for null-terminated string. UString(const char*, int length); UString(const UChar*, int length); UString(const Vector& buffer); UString(const UString& s) : m_rep(s.m_rep) { } // Special constructor for cases where we overwrite an object in place. UString(PlacementNewAdoptType) : m_rep(PlacementNewAdopt) { } ~UString() { } template static PassRefPtr adopt(Vector& vector) { return Rep::adopt(vector); } static UString createFromUTF8(const char*); static UString from(int); static UString from(long long); static UString from(unsigned int); static UString from(long); static UString from(double); struct Range { public: Range(int pos, int len) : position(pos) , length(len) { } Range() { } int position; int length; }; UString spliceSubstringsWithSeparators(const Range* substringRanges, int rangeCount, const UString* separators, int separatorCount) const; UString replaceRange(int rangeStart, int RangeEnd, const UString& replacement) const; bool getCString(CStringBuffer&) const; // NOTE: This method should only be used for *debugging* purposes as it // is neither Unicode safe nor free from side effects nor thread-safe. char* ascii() const; /** * Convert the string to UTF-8, assuming it is UTF-16 encoded. * In non-strict mode, this function is tolerant of badly formed UTF-16, it * can create UTF-8 strings that are invalid because they have characters in * the range U+D800-U+DDFF, U+FFFE, or U+FFFF, but the UTF-8 string is * guaranteed to be otherwise valid. * In strict mode, error is returned as null CString. */ CString UTF8String(bool strict = false) const; UString& operator=(const char*c); const UChar* data() const { return m_rep->data(); } bool isNull() const { return m_rep == &Rep::null(); } bool isEmpty() const { return !m_rep->size(); } bool is8Bit() const; int size() const { return m_rep->size(); } UChar operator[](int pos) const; double toDouble(bool tolerateTrailingJunk, bool tolerateEmptyString) const; double toDouble(bool tolerateTrailingJunk) const; double toDouble() const; uint32_t toUInt32(bool* ok = 0) const; uint32_t toUInt32(bool* ok, bool tolerateEmptyString) const; uint32_t toStrictUInt32(bool* ok = 0) const; unsigned toArrayIndex(bool* ok = 0) const; int find(const UString& f, int pos = 0) const; int find(UChar, int pos = 0) const; int rfind(const UString& f, int pos) const; int rfind(UChar, int pos) const; UString substr(int pos = 0, int len = -1) const; static const UString& null() { return *nullUString; } Rep* rep() const { return m_rep.get(); } static Rep* nullRep(); UString(PassRefPtr r) : m_rep(r) { ASSERT(m_rep); } size_t cost() const { return m_rep->cost(); } private: void makeNull(); RefPtr m_rep; static UString* nullUString; friend void initializeUString(); friend bool operator==(const UString&, const UString&); }; ALWAYS_INLINE bool operator==(const UString& s1, const UString& s2) { int size = s1.size(); switch (size) { case 0: return !s2.size(); case 1: return s2.size() == 1 && s1.data()[0] == s2.data()[0]; case 2: { if (s2.size() != 2) return false; const UChar* d1 = s1.data(); const UChar* d2 = s2.data(); return (d1[0] == d2[0]) & (d1[1] == d2[1]); } default: return s2.size() == size && memcmp(s1.data(), s2.data(), size * sizeof(UChar)) == 0; } } inline bool operator!=(const UString& s1, const UString& s2) { return !JSC::operator==(s1, s2); } bool operator<(const UString& s1, const UString& s2); bool operator>(const UString& s1, const UString& s2); bool operator==(const UString& s1, const char* s2); inline bool operator!=(const UString& s1, const char* s2) { return !JSC::operator==(s1, s2); } inline bool operator==(const char *s1, const UString& s2) { return operator==(s2, s1); } inline bool operator!=(const char *s1, const UString& s2) { return !JSC::operator==(s1, s2); } int compare(const UString&, const UString&); inline UString::UString() : m_rep(&Rep::null()) { } // Rule from ECMA 15.2 about what an array index is. // Must exactly match string form of an unsigned integer, and be less than 2^32 - 1. inline unsigned UString::toArrayIndex(bool* ok) const { unsigned i = toStrictUInt32(ok); if (ok && i >= 0xFFFFFFFFU) *ok = false; return i; } // We'd rather not do shared substring append for small strings, since // this runs too much risk of a tiny initial string holding down a // huge buffer. // FIXME: this should be size_t but that would cause warnings until we // fix UString sizes to be size_t instead of int static const int minShareSize = Heap::minExtraCost / sizeof(UChar); struct IdentifierRepHash : PtrHash > { static unsigned hash(const RefPtr& key) { return key->existingHash(); } static unsigned hash(JSC::UString::Rep* key) { return key->existingHash(); } }; void initializeUString(); template class StringTypeAdapter { }; template<> class StringTypeAdapter { public: StringTypeAdapter(char* buffer) : m_buffer((unsigned char*)buffer) , m_length(strlen(buffer)) { } unsigned length() { return m_length; } void writeTo(UChar* destination) { for (unsigned i = 0; i < m_length; ++i) destination[i] = m_buffer[i]; } private: const unsigned char* m_buffer; unsigned m_length; }; template<> class StringTypeAdapter { public: StringTypeAdapter(const char* buffer) : m_buffer((unsigned char*)buffer) , m_length(strlen(buffer)) { } unsigned length() { return m_length; } void writeTo(UChar* destination) { for (unsigned i = 0; i < m_length; ++i) destination[i] = m_buffer[i]; } private: const unsigned char* m_buffer; unsigned m_length; }; template<> class StringTypeAdapter { public: StringTypeAdapter(UString& string) : m_data(string.data()) , m_length(string.size()) { } unsigned length() { return m_length; } void writeTo(UChar* destination) { for (unsigned i = 0; i < m_length; ++i) destination[i] = m_data[i]; } private: const UChar* m_data; unsigned m_length; }; template UString makeString(StringType1 string1, StringType2 string2) { StringTypeAdapter adapter1(string1); StringTypeAdapter adapter2(string2); UChar* buffer; unsigned length = adapter1.length() + adapter2.length(); PassRefPtr resultImpl = UStringImpl::tryCreateUninitialized(length, buffer); if (!resultImpl) return UString(); UChar* result = buffer; adapter1.writeTo(result); result += adapter1.length(); adapter2.writeTo(result); return resultImpl; } template UString makeString(StringType1 string1, StringType2 string2, StringType3 string3) { StringTypeAdapter adapter1(string1); StringTypeAdapter adapter2(string2); StringTypeAdapter adapter3(string3); UChar* buffer; unsigned length = adapter1.length() + adapter2.length() + adapter3.length(); PassRefPtr resultImpl = UStringImpl::tryCreateUninitialized(length, buffer); if (!resultImpl) return UString(); UChar* result = buffer; adapter1.writeTo(result); result += adapter1.length(); adapter2.writeTo(result); result += adapter2.length(); adapter3.writeTo(result); return resultImpl; } template UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4) { StringTypeAdapter adapter1(string1); StringTypeAdapter adapter2(string2); StringTypeAdapter adapter3(string3); StringTypeAdapter adapter4(string4); UChar* buffer; unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length(); PassRefPtr resultImpl = UStringImpl::tryCreateUninitialized(length, buffer); if (!resultImpl) return UString(); UChar* result = buffer; adapter1.writeTo(result); result += adapter1.length(); adapter2.writeTo(result); result += adapter2.length(); adapter3.writeTo(result); result += adapter3.length(); adapter4.writeTo(result); return resultImpl; } template UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5) { StringTypeAdapter adapter1(string1); StringTypeAdapter adapter2(string2); StringTypeAdapter adapter3(string3); StringTypeAdapter adapter4(string4); StringTypeAdapter adapter5(string5); UChar* buffer; unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length(); PassRefPtr resultImpl = UStringImpl::tryCreateUninitialized(length, buffer); if (!resultImpl) return UString(); UChar* result = buffer; adapter1.writeTo(result); result += adapter1.length(); adapter2.writeTo(result); result += adapter2.length(); adapter3.writeTo(result); result += adapter3.length(); adapter4.writeTo(result); result += adapter4.length(); adapter5.writeTo(result); return resultImpl; } template UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5, StringType6 string6) { StringTypeAdapter adapter1(string1); StringTypeAdapter adapter2(string2); StringTypeAdapter adapter3(string3); StringTypeAdapter adapter4(string4); StringTypeAdapter adapter5(string5); StringTypeAdapter adapter6(string6); UChar* buffer; unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length() + adapter6.length(); PassRefPtr resultImpl = UStringImpl::tryCreateUninitialized(length, buffer); if (!resultImpl) return UString(); UChar* result = buffer; adapter1.writeTo(result); result += adapter1.length(); adapter2.writeTo(result); result += adapter2.length(); adapter3.writeTo(result); result += adapter3.length(); adapter4.writeTo(result); result += adapter4.length(); adapter5.writeTo(result); result += adapter5.length(); adapter6.writeTo(result); return resultImpl; } template UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5, StringType6 string6, StringType7 string7) { StringTypeAdapter adapter1(string1); StringTypeAdapter adapter2(string2); StringTypeAdapter adapter3(string3); StringTypeAdapter adapter4(string4); StringTypeAdapter adapter5(string5); StringTypeAdapter adapter6(string6); StringTypeAdapter adapter7(string7); UChar* buffer; unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length() + adapter6.length() + adapter7.length(); PassRefPtr resultImpl = UStringImpl::tryCreateUninitialized(length, buffer); if (!resultImpl) return UString(); UChar* result = buffer; adapter1.writeTo(result); result += adapter1.length(); adapter2.writeTo(result); result += adapter2.length(); adapter3.writeTo(result); result += adapter3.length(); adapter4.writeTo(result); result += adapter4.length(); adapter5.writeTo(result); result += adapter5.length(); adapter6.writeTo(result); result += adapter6.length(); adapter7.writeTo(result); return resultImpl; } template UString makeString(StringType1 string1, StringType2 string2, StringType3 string3, StringType4 string4, StringType5 string5, StringType6 string6, StringType7 string7, StringType8 string8) { StringTypeAdapter adapter1(string1); StringTypeAdapter adapter2(string2); StringTypeAdapter adapter3(string3); StringTypeAdapter adapter4(string4); StringTypeAdapter adapter5(string5); StringTypeAdapter adapter6(string6); StringTypeAdapter adapter7(string7); StringTypeAdapter adapter8(string8); UChar* buffer; unsigned length = adapter1.length() + adapter2.length() + adapter3.length() + adapter4.length() + adapter5.length() + adapter6.length() + adapter7.length() + adapter8.length(); PassRefPtr resultImpl = UStringImpl::tryCreateUninitialized(length, buffer); if (!resultImpl) return UString(); UChar* result = buffer; adapter1.writeTo(result); result += adapter1.length(); adapter2.writeTo(result); result += adapter2.length(); adapter3.writeTo(result); result += adapter3.length(); adapter4.writeTo(result); result += adapter4.length(); adapter5.writeTo(result); result += adapter5.length(); adapter6.writeTo(result); result += adapter6.length(); adapter7.writeTo(result); result += adapter7.length(); adapter8.writeTo(result); return resultImpl; } } // namespace JSC namespace WTF { template struct DefaultHash; template struct StrHash; template<> struct StrHash { static unsigned hash(const JSC::UString::Rep* key) { return key->hash(); } static bool equal(const JSC::UString::Rep* a, const JSC::UString::Rep* b) { return JSC::equal(a, b); } static const bool safeToCompareToEmptyOrDeleted = false; }; template<> struct StrHash > : public StrHash { using StrHash::hash; static unsigned hash(const RefPtr& key) { return key->hash(); } using StrHash::equal; static bool equal(const RefPtr& a, const RefPtr& b) { return JSC::equal(a.get(), b.get()); } static bool equal(const JSC::UString::Rep* a, const RefPtr& b) { return JSC::equal(a, b.get()); } static bool equal(const RefPtr& a, const JSC::UString::Rep* b) { return JSC::equal(a.get(), b); } static const bool safeToCompareToEmptyOrDeleted = false; }; template<> struct DefaultHash { typedef StrHash Hash; }; template<> struct DefaultHash > { typedef StrHash > Hash; }; } // namespace WTF #endif