You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
314 lines
10 KiB
314 lines
10 KiB
// Copyright 2017 PDFium Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
// found in the LICENSE file.
|
|
|
|
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
|
|
|
|
#ifndef CORE_FXCRT_WIDESTRING_H_
|
|
#define CORE_FXCRT_WIDESTRING_H_
|
|
|
|
#include <functional>
|
|
#include <iterator>
|
|
#include <ostream>
|
|
#include <utility>
|
|
|
|
#include "core/fxcrt/fx_system.h"
|
|
#include "core/fxcrt/retain_ptr.h"
|
|
#include "core/fxcrt/string_data_template.h"
|
|
#include "core/fxcrt/string_view_template.h"
|
|
#include "third_party/base/logging.h"
|
|
#include "third_party/base/optional.h"
|
|
#include "third_party/base/span.h"
|
|
|
|
namespace fxcrt {
|
|
|
|
class ByteString;
|
|
|
|
// A mutable string with shared buffers using copy-on-write semantics that
|
|
// avoids the cost of std::string's iterator stability guarantees.
|
|
class WideString {
|
|
public:
|
|
using CharType = wchar_t;
|
|
using const_iterator = const CharType*;
|
|
using const_reverse_iterator = std::reverse_iterator<const_iterator>;
|
|
|
|
static WideString Format(const wchar_t* pFormat, ...) WARN_UNUSED_RESULT;
|
|
static WideString FormatV(const wchar_t* lpszFormat,
|
|
va_list argList) WARN_UNUSED_RESULT;
|
|
|
|
WideString();
|
|
WideString(const WideString& other);
|
|
|
|
// Move-construct a WideString. After construction, |other| is empty.
|
|
WideString(WideString&& other) noexcept;
|
|
|
|
// Deliberately implicit to avoid calling on every string literal.
|
|
// NOLINTNEXTLINE(runtime/explicit)
|
|
WideString(wchar_t ch);
|
|
// NOLINTNEXTLINE(runtime/explicit)
|
|
WideString(const wchar_t* ptr);
|
|
|
|
// No implicit conversions from byte strings.
|
|
// NOLINTNEXTLINE(runtime/explicit)
|
|
WideString(char) = delete;
|
|
|
|
WideString(const wchar_t* pStr, size_t len);
|
|
|
|
explicit WideString(WideStringView str);
|
|
WideString(WideStringView str1, WideStringView str2);
|
|
WideString(const std::initializer_list<WideStringView>& list);
|
|
|
|
~WideString();
|
|
|
|
static WideString FromASCII(ByteStringView str) WARN_UNUSED_RESULT;
|
|
static WideString FromLatin1(ByteStringView str) WARN_UNUSED_RESULT;
|
|
static WideString FromDefANSI(ByteStringView str) WARN_UNUSED_RESULT;
|
|
static WideString FromUTF8(ByteStringView str) WARN_UNUSED_RESULT;
|
|
static WideString FromUTF16LE(const unsigned short* str,
|
|
size_t len) WARN_UNUSED_RESULT;
|
|
static WideString FromUTF16BE(const unsigned short* wstr,
|
|
size_t wlen) WARN_UNUSED_RESULT;
|
|
|
|
static size_t WStringLength(const unsigned short* str) WARN_UNUSED_RESULT;
|
|
|
|
// Explicit conversion to C-style wide string.
|
|
// Note: Any subsequent modification of |this| will invalidate the result.
|
|
const wchar_t* c_str() const { return m_pData ? m_pData->m_String : L""; }
|
|
|
|
// Explicit conversion to WideStringView.
|
|
// Note: Any subsequent modification of |this| will invalidate the result.
|
|
WideStringView AsStringView() const {
|
|
return WideStringView(c_str(), GetLength());
|
|
}
|
|
|
|
// Explicit conversion to span.
|
|
// Note: Any subsequent modification of |this| will invalidate the result.
|
|
pdfium::span<const wchar_t> span() const {
|
|
return pdfium::make_span(m_pData ? m_pData->m_String : nullptr,
|
|
GetLength());
|
|
}
|
|
|
|
// Note: Any subsequent modification of |this| will invalidate iterators.
|
|
const_iterator begin() const { return m_pData ? m_pData->m_String : nullptr; }
|
|
const_iterator end() const {
|
|
return m_pData ? m_pData->m_String + m_pData->m_nDataLength : nullptr;
|
|
}
|
|
|
|
// Note: Any subsequent modification of |this| will invalidate iterators.
|
|
const_reverse_iterator rbegin() const {
|
|
return const_reverse_iterator(end());
|
|
}
|
|
const_reverse_iterator rend() const {
|
|
return const_reverse_iterator(begin());
|
|
}
|
|
|
|
void clear() { m_pData.Reset(); }
|
|
|
|
size_t GetLength() const { return m_pData ? m_pData->m_nDataLength : 0; }
|
|
size_t GetStringLength() const {
|
|
return m_pData ? wcslen(m_pData->m_String) : 0;
|
|
}
|
|
bool IsEmpty() const { return !GetLength(); }
|
|
bool IsValidIndex(size_t index) const { return index < GetLength(); }
|
|
bool IsValidLength(size_t length) const { return length <= GetLength(); }
|
|
|
|
WideString& operator=(const wchar_t* str);
|
|
WideString& operator=(WideStringView str);
|
|
WideString& operator=(const WideString& that);
|
|
|
|
// Move-assign a WideString. After assignment, |that| is empty.
|
|
WideString& operator=(WideString&& that);
|
|
|
|
WideString& operator+=(const wchar_t* str);
|
|
WideString& operator+=(wchar_t ch);
|
|
WideString& operator+=(const WideString& str);
|
|
WideString& operator+=(WideStringView str);
|
|
|
|
bool operator==(const wchar_t* ptr) const;
|
|
bool operator==(WideStringView str) const;
|
|
bool operator==(const WideString& other) const;
|
|
|
|
bool operator!=(const wchar_t* ptr) const { return !(*this == ptr); }
|
|
bool operator!=(WideStringView str) const { return !(*this == str); }
|
|
bool operator!=(const WideString& other) const { return !(*this == other); }
|
|
|
|
bool operator<(const wchar_t* ptr) const;
|
|
bool operator<(WideStringView str) const;
|
|
bool operator<(const WideString& other) const;
|
|
|
|
CharType operator[](const size_t index) const {
|
|
CHECK(IsValidIndex(index));
|
|
return m_pData->m_String[index];
|
|
}
|
|
|
|
CharType Front() const { return GetLength() ? (*this)[0] : 0; }
|
|
CharType Back() const { return GetLength() ? (*this)[GetLength() - 1] : 0; }
|
|
|
|
void SetAt(size_t index, wchar_t c);
|
|
|
|
int Compare(const wchar_t* str) const;
|
|
int Compare(const WideString& str) const;
|
|
int CompareNoCase(const wchar_t* str) const;
|
|
|
|
WideString Substr(size_t first, size_t count) const;
|
|
WideString First(size_t count) const;
|
|
WideString Last(size_t count) const;
|
|
|
|
size_t Insert(size_t index, wchar_t ch);
|
|
size_t InsertAtFront(wchar_t ch) { return Insert(0, ch); }
|
|
size_t InsertAtBack(wchar_t ch) { return Insert(GetLength(), ch); }
|
|
size_t Delete(size_t index, size_t count = 1);
|
|
|
|
void MakeLower();
|
|
void MakeUpper();
|
|
|
|
void Trim();
|
|
void Trim(wchar_t target);
|
|
void Trim(WideStringView targets);
|
|
|
|
void TrimLeft();
|
|
void TrimLeft(wchar_t target);
|
|
void TrimLeft(WideStringView targets);
|
|
|
|
void TrimRight();
|
|
void TrimRight(wchar_t target);
|
|
void TrimRight(WideStringView targets);
|
|
|
|
void Reserve(size_t len);
|
|
|
|
// Note: any modification of the string (including ReleaseBuffer()) may
|
|
// invalidate the span, which must not outlive its buffer.
|
|
pdfium::span<wchar_t> GetBuffer(size_t nMinBufLength);
|
|
void ReleaseBuffer(size_t nNewLength);
|
|
|
|
int GetInteger() const;
|
|
|
|
Optional<size_t> Find(WideStringView subStr, size_t start = 0) const;
|
|
Optional<size_t> Find(wchar_t ch, size_t start = 0) const;
|
|
Optional<size_t> ReverseFind(wchar_t ch) const;
|
|
|
|
bool Contains(WideStringView lpszSub, size_t start = 0) const {
|
|
return Find(lpszSub, start).has_value();
|
|
}
|
|
|
|
bool Contains(char ch, size_t start = 0) const {
|
|
return Find(ch, start).has_value();
|
|
}
|
|
|
|
size_t Replace(WideStringView pOld, WideStringView pNew);
|
|
size_t Remove(wchar_t ch);
|
|
|
|
bool IsASCII() const { return AsStringView().IsASCII(); }
|
|
bool EqualsASCII(ByteStringView that) const {
|
|
return AsStringView().EqualsASCII(that);
|
|
}
|
|
bool EqualsASCIINoCase(ByteStringView that) const {
|
|
return AsStringView().EqualsASCIINoCase(that);
|
|
}
|
|
|
|
ByteString ToASCII() const;
|
|
ByteString ToLatin1() const;
|
|
ByteString ToDefANSI() const;
|
|
ByteString ToUTF8() const;
|
|
|
|
// This method will add \0\0 to the end of the string to represent the
|
|
// wide string terminator. These values are in the string, not just the data,
|
|
// so GetLength() will include them.
|
|
ByteString ToUTF16LE() const;
|
|
|
|
protected:
|
|
using StringData = StringDataTemplate<wchar_t>;
|
|
|
|
void ReallocBeforeWrite(size_t nNewLength);
|
|
void AllocBeforeWrite(size_t nNewLength);
|
|
void AllocCopy(WideString& dest, size_t nCopyLen, size_t nCopyIndex) const;
|
|
void AssignCopy(const wchar_t* pSrcData, size_t nSrcLen);
|
|
void Concat(const wchar_t* pSrcData, size_t nSrcLen);
|
|
intptr_t ReferenceCountForTesting() const;
|
|
|
|
RetainPtr<StringData> m_pData;
|
|
|
|
friend class WideString_Assign_Test;
|
|
friend class WideString_ConcatInPlace_Test;
|
|
friend class WideString_Construct_Test;
|
|
friend class StringPool_WideString_Test;
|
|
};
|
|
|
|
inline WideString operator+(WideStringView str1, WideStringView str2) {
|
|
return WideString(str1, str2);
|
|
}
|
|
inline WideString operator+(WideStringView str1, const wchar_t* str2) {
|
|
return WideString(str1, str2);
|
|
}
|
|
inline WideString operator+(const wchar_t* str1, WideStringView str2) {
|
|
return WideString(str1, str2);
|
|
}
|
|
inline WideString operator+(WideStringView str1, wchar_t ch) {
|
|
return WideString(str1, WideStringView(ch));
|
|
}
|
|
inline WideString operator+(wchar_t ch, WideStringView str2) {
|
|
return WideString(ch, str2);
|
|
}
|
|
inline WideString operator+(const WideString& str1, const WideString& str2) {
|
|
return WideString(str1.AsStringView(), str2.AsStringView());
|
|
}
|
|
inline WideString operator+(const WideString& str1, wchar_t ch) {
|
|
return WideString(str1.AsStringView(), WideStringView(ch));
|
|
}
|
|
inline WideString operator+(wchar_t ch, const WideString& str2) {
|
|
return WideString(ch, str2.AsStringView());
|
|
}
|
|
inline WideString operator+(const WideString& str1, const wchar_t* str2) {
|
|
return WideString(str1.AsStringView(), str2);
|
|
}
|
|
inline WideString operator+(const wchar_t* str1, const WideString& str2) {
|
|
return WideString(str1, str2.AsStringView());
|
|
}
|
|
inline WideString operator+(const WideString& str1, WideStringView str2) {
|
|
return WideString(str1.AsStringView(), str2);
|
|
}
|
|
inline WideString operator+(WideStringView str1, const WideString& str2) {
|
|
return WideString(str1, str2.AsStringView());
|
|
}
|
|
inline bool operator==(const wchar_t* lhs, const WideString& rhs) {
|
|
return rhs == lhs;
|
|
}
|
|
inline bool operator==(WideStringView lhs, const WideString& rhs) {
|
|
return rhs == lhs;
|
|
}
|
|
inline bool operator!=(const wchar_t* lhs, const WideString& rhs) {
|
|
return rhs != lhs;
|
|
}
|
|
inline bool operator!=(WideStringView lhs, const WideString& rhs) {
|
|
return rhs != lhs;
|
|
}
|
|
inline bool operator<(const wchar_t* lhs, const WideString& rhs) {
|
|
return rhs.Compare(lhs) > 0;
|
|
}
|
|
|
|
std::wostream& operator<<(std::wostream& os, const WideString& str);
|
|
std::ostream& operator<<(std::ostream& os, const WideString& str);
|
|
std::wostream& operator<<(std::wostream& os, WideStringView str);
|
|
std::ostream& operator<<(std::ostream& os, WideStringView str);
|
|
|
|
} // namespace fxcrt
|
|
|
|
using WideString = fxcrt::WideString;
|
|
|
|
uint32_t FX_HashCode_GetW(WideStringView str, bool bIgnoreCase);
|
|
|
|
namespace std {
|
|
|
|
template <>
|
|
struct hash<WideString> {
|
|
std::size_t operator()(const WideString& str) const {
|
|
return FX_HashCode_GetW(str.AsStringView(), false);
|
|
}
|
|
};
|
|
|
|
} // namespace std
|
|
|
|
extern template struct std::hash<WideString>;
|
|
|
|
#endif // CORE_FXCRT_WIDESTRING_H_
|