blob: f87447da329ca5135a8954602670aa0774851faf [file] [log] [blame] [edit]
// Copyright 2014 The PDFium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#include "core/fxcrt/widestring.h"
#include <stddef.h>
#include <string.h>
#include <algorithm>
#include <sstream>
#include "core/fxcrt/fx_codepage.h"
#include "core/fxcrt/fx_extension.h"
#include "core/fxcrt/fx_safe_types.h"
#include "core/fxcrt/fx_system.h"
#include "core/fxcrt/string_pool_template.h"
#include "third_party/base/check.h"
#include "third_party/base/check_op.h"
#include "third_party/base/cxx17_backports.h"
#include "third_party/base/numerics/safe_math.h"
template class fxcrt::StringDataTemplate<wchar_t>;
template class fxcrt::StringViewTemplate<wchar_t>;
template class fxcrt::StringPoolTemplate<WideString>;
template struct std::hash<WideString>;
#define FORCE_ANSI 0x10000
#define FORCE_UNICODE 0x20000
#define FORCE_INT64 0x40000
namespace {
constexpr wchar_t kWideTrimChars[] = L"\x09\x0a\x0b\x0c\x0d\x20";
const wchar_t* FX_wcsstr(const wchar_t* haystack,
size_t haystack_len,
const wchar_t* needle,
size_t needle_len) {
if (needle_len > haystack_len || needle_len == 0)
return nullptr;
const wchar_t* end_ptr = haystack + haystack_len - needle_len;
while (haystack <= end_ptr) {
size_t i = 0;
while (true) {
if (haystack[i] != needle[i])
break;
i++;
if (i == needle_len)
return haystack;
}
haystack++;
}
return nullptr;
}
absl::optional<size_t> GuessSizeForVSWPrintf(const wchar_t* pFormat,
va_list argList) {
size_t nMaxLen = 0;
for (const wchar_t* pStr = pFormat; *pStr != 0; pStr++) {
if (*pStr != '%' || *(pStr = pStr + 1) == '%') {
++nMaxLen;
continue;
}
int iWidth = 0;
for (; *pStr != 0; pStr++) {
if (*pStr == '#') {
nMaxLen += 2;
} else if (*pStr == '*') {
iWidth = va_arg(argList, int);
} else if (*pStr != '-' && *pStr != '+' && *pStr != '0' && *pStr != ' ') {
break;
}
}
if (iWidth == 0) {
iWidth = FXSYS_wtoi(pStr);
while (FXSYS_IsDecimalDigit(*pStr))
++pStr;
}
if (iWidth < 0 || iWidth > 128 * 1024)
return absl::nullopt;
uint32_t nWidth = static_cast<uint32_t>(iWidth);
int iPrecision = 0;
if (*pStr == '.') {
pStr++;
if (*pStr == '*') {
iPrecision = va_arg(argList, int);
pStr++;
} else {
iPrecision = FXSYS_wtoi(pStr);
while (FXSYS_IsDecimalDigit(*pStr))
++pStr;
}
}
if (iPrecision < 0 || iPrecision > 128 * 1024)
return absl::nullopt;
uint32_t nPrecision = static_cast<uint32_t>(iPrecision);
int nModifier = 0;
if (*pStr == L'I' && *(pStr + 1) == L'6' && *(pStr + 2) == L'4') {
pStr += 3;
nModifier = FORCE_INT64;
} else {
switch (*pStr) {
case 'h':
nModifier = FORCE_ANSI;
pStr++;
break;
case 'l':
nModifier = FORCE_UNICODE;
pStr++;
break;
case 'F':
case 'N':
case 'L':
pStr++;
break;
}
}
size_t nItemLen = 0;
switch (*pStr | nModifier) {
case 'c':
case 'C':
nItemLen = 2;
va_arg(argList, int);
break;
case 'c' | FORCE_ANSI:
case 'C' | FORCE_ANSI:
nItemLen = 2;
va_arg(argList, int);
break;
case 'c' | FORCE_UNICODE:
case 'C' | FORCE_UNICODE:
nItemLen = 2;
va_arg(argList, int);
break;
case 's': {
const wchar_t* pstrNextArg = va_arg(argList, const wchar_t*);
if (pstrNextArg) {
nItemLen = wcslen(pstrNextArg);
if (nItemLen < 1) {
nItemLen = 1;
}
} else {
nItemLen = 6;
}
} break;
case 'S': {
const char* pstrNextArg = va_arg(argList, const char*);
if (pstrNextArg) {
nItemLen = strlen(pstrNextArg);
if (nItemLen < 1) {
nItemLen = 1;
}
} else {
nItemLen = 6;
}
} break;
case 's' | FORCE_ANSI:
case 'S' | FORCE_ANSI: {
const char* pstrNextArg = va_arg(argList, const char*);
if (pstrNextArg) {
nItemLen = strlen(pstrNextArg);
if (nItemLen < 1) {
nItemLen = 1;
}
} else {
nItemLen = 6;
}
} break;
case 's' | FORCE_UNICODE:
case 'S' | FORCE_UNICODE: {
const wchar_t* pstrNextArg = va_arg(argList, wchar_t*);
if (pstrNextArg) {
nItemLen = wcslen(pstrNextArg);
if (nItemLen < 1) {
nItemLen = 1;
}
} else {
nItemLen = 6;
}
} break;
}
if (nItemLen != 0) {
if (nPrecision != 0 && nItemLen > nPrecision) {
nItemLen = nPrecision;
}
if (nItemLen < nWidth) {
nItemLen = nWidth;
}
} else {
switch (*pStr) {
case 'd':
case 'i':
case 'u':
case 'x':
case 'X':
case 'o':
if (nModifier & FORCE_INT64) {
va_arg(argList, int64_t);
} else {
va_arg(argList, int);
}
nItemLen = 32;
if (nItemLen < nWidth + nPrecision) {
nItemLen = nWidth + nPrecision;
}
break;
case 'a':
case 'A':
case 'e':
case 'E':
case 'g':
case 'G':
va_arg(argList, double);
nItemLen = 128;
if (nItemLen < nWidth + nPrecision) {
nItemLen = nWidth + nPrecision;
}
break;
case 'f':
if (nWidth + nPrecision > 100) {
nItemLen = nPrecision + nWidth + 128;
} else {
double f;
char pszTemp[256];
f = va_arg(argList, double);
FXSYS_snprintf(pszTemp, sizeof(pszTemp), "%*.*f", nWidth,
nPrecision + 6, f);
nItemLen = strlen(pszTemp);
}
break;
case 'p':
va_arg(argList, void*);
nItemLen = 32;
if (nItemLen < nWidth + nPrecision) {
nItemLen = nWidth + nPrecision;
}
break;
case 'n':
va_arg(argList, int*);
break;
}
}
nMaxLen += nItemLen;
}
nMaxLen += 32; // Fudge factor.
return nMaxLen;
}
// Returns string unless we ran out of space.
absl::optional<WideString> TryVSWPrintf(size_t size,
const wchar_t* pFormat,
va_list argList) {
if (!size)
return absl::nullopt;
WideString str;
{
// Span's lifetime must end before ReleaseBuffer() below.
pdfium::span<wchar_t> buffer = str.GetBuffer(size);
// In the following two calls, there's always space in the WideString
// for a terminating NUL that's not included in the span.
// For vswprintf(), MSAN won't untaint the buffer on a truncated write's
// -1 return code even though the buffer is written. Probably just as well
// not to trust the vendor's implementation to write anything anyways.
// See https://crbug.com/705912.
memset(buffer.data(), 0, (size + 1) * sizeof(wchar_t));
int ret = vswprintf(buffer.data(), size + 1, pFormat, argList);
bool bSufficientBuffer = ret >= 0 || buffer[size - 1] == 0;
if (!bSufficientBuffer)
return absl::nullopt;
}
str.ReleaseBuffer(str.GetStringLength());
return str;
}
} // namespace
namespace fxcrt {
static_assert(sizeof(WideString) <= sizeof(wchar_t*),
"Strings must not require more space than pointers");
// static
WideString WideString::FormatInteger(int i) {
wchar_t wbuf[32];
swprintf(wbuf, std::size(wbuf), L"%d", i);
return WideString(wbuf);
}
// static
WideString WideString::FormatV(const wchar_t* format, va_list argList) {
va_list argListCopy;
va_copy(argListCopy, argList);
auto guess = GuessSizeForVSWPrintf(format, argListCopy);
va_end(argListCopy);
if (!guess.has_value()) {
return WideString();
}
int maxLen = pdfium::base::checked_cast<int>(guess.value());
while (maxLen < 32 * 1024) {
va_copy(argListCopy, argList);
absl::optional<WideString> ret =
TryVSWPrintf(static_cast<size_t>(maxLen), format, argListCopy);
va_end(argListCopy);
if (ret.has_value())
return ret.value();
maxLen *= 2;
}
return WideString();
}
// static
WideString WideString::Format(const wchar_t* pFormat, ...) {
va_list argList;
va_start(argList, pFormat);
WideString ret = FormatV(pFormat, argList);
va_end(argList);
return ret;
}
WideString::WideString() = default;
WideString::WideString(const WideString& other) : m_pData(other.m_pData) {}
WideString::WideString(WideString&& other) noexcept {
m_pData.Swap(other.m_pData);
}
WideString::WideString(const wchar_t* pStr, size_t nLen) {
if (nLen)
m_pData.Reset(StringData::Create(pStr, nLen));
}
WideString::WideString(wchar_t ch) {
m_pData.Reset(StringData::Create(1));
m_pData->m_String[0] = ch;
}
WideString::WideString(const wchar_t* ptr)
: WideString(ptr, ptr ? wcslen(ptr) : 0) {}
WideString::WideString(WideStringView stringSrc) {
if (!stringSrc.IsEmpty()) {
m_pData.Reset(StringData::Create(stringSrc.unterminated_c_str(),
stringSrc.GetLength()));
}
}
WideString::WideString(WideStringView str1, WideStringView str2) {
FX_SAFE_SIZE_T nSafeLen = str1.GetLength();
nSafeLen += str2.GetLength();
size_t nNewLen = nSafeLen.ValueOrDie();
if (nNewLen == 0)
return;
m_pData.Reset(StringData::Create(nNewLen));
m_pData->CopyContents(str1.unterminated_c_str(), str1.GetLength());
m_pData->CopyContentsAt(str1.GetLength(), str2.unterminated_c_str(),
str2.GetLength());
}
WideString::WideString(const std::initializer_list<WideStringView>& list) {
FX_SAFE_SIZE_T nSafeLen = 0;
for (const auto& item : list)
nSafeLen += item.GetLength();
size_t nNewLen = nSafeLen.ValueOrDie();
if (nNewLen == 0)
return;
m_pData.Reset(StringData::Create(nNewLen));
size_t nOffset = 0;
for (const auto& item : list) {
m_pData->CopyContentsAt(nOffset, item.unterminated_c_str(),
item.GetLength());
nOffset += item.GetLength();
}
}
WideString::~WideString() = default;
void WideString::clear() {
if (m_pData && m_pData->CanOperateInPlace(0)) {
m_pData->m_nDataLength = 0;
return;
}
m_pData.Reset();
}
WideString& WideString::operator=(const wchar_t* str) {
if (!str || !str[0])
clear();
else
AssignCopy(str, wcslen(str));
return *this;
}
WideString& WideString::operator=(WideStringView str) {
if (str.IsEmpty())
clear();
else
AssignCopy(str.unterminated_c_str(), str.GetLength());
return *this;
}
WideString& WideString::operator=(const WideString& that) {
if (m_pData != that.m_pData)
m_pData = that.m_pData;
return *this;
}
WideString& WideString::operator=(WideString&& that) noexcept {
if (m_pData != that.m_pData)
m_pData = std::move(that.m_pData);
return *this;
}
WideString& WideString::operator+=(const wchar_t* str) {
if (str)
Concat(str, wcslen(str));
return *this;
}
WideString& WideString::operator+=(wchar_t ch) {
Concat(&ch, 1);
return *this;
}
WideString& WideString::operator+=(const WideString& str) {
if (str.m_pData)
Concat(str.m_pData->m_String, str.m_pData->m_nDataLength);
return *this;
}
WideString& WideString::operator+=(WideStringView str) {
if (!str.IsEmpty())
Concat(str.unterminated_c_str(), str.GetLength());
return *this;
}
bool WideString::operator==(const wchar_t* ptr) const {
if (!m_pData)
return !ptr || !ptr[0];
if (!ptr)
return m_pData->m_nDataLength == 0;
return wcslen(ptr) == m_pData->m_nDataLength &&
wmemcmp(ptr, m_pData->m_String, m_pData->m_nDataLength) == 0;
}
bool WideString::operator==(WideStringView str) const {
if (!m_pData)
return str.IsEmpty();
return m_pData->m_nDataLength == str.GetLength() &&
wmemcmp(m_pData->m_String, str.unterminated_c_str(),
str.GetLength()) == 0;
}
bool WideString::operator==(const WideString& other) const {
if (m_pData == other.m_pData)
return true;
if (IsEmpty())
return other.IsEmpty();
if (other.IsEmpty())
return false;
return other.m_pData->m_nDataLength == m_pData->m_nDataLength &&
wmemcmp(other.m_pData->m_String, m_pData->m_String,
m_pData->m_nDataLength) == 0;
}
bool WideString::operator<(const wchar_t* ptr) const {
return Compare(ptr) < 0;
}
bool WideString::operator<(WideStringView str) const {
if (!m_pData && !str.unterminated_c_str())
return false;
if (c_str() == str.unterminated_c_str())
return false;
size_t len = GetLength();
size_t other_len = str.GetLength();
int result =
wmemcmp(c_str(), str.unterminated_c_str(), std::min(len, other_len));
return result < 0 || (result == 0 && len < other_len);
}
bool WideString::operator<(const WideString& other) const {
return Compare(other) < 0;
}
void WideString::AssignCopy(const wchar_t* pSrcData, size_t nSrcLen) {
AllocBeforeWrite(nSrcLen);
m_pData->CopyContents(pSrcData, nSrcLen);
m_pData->m_nDataLength = nSrcLen;
}
void WideString::ReallocBeforeWrite(size_t nNewLength) {
if (m_pData && m_pData->CanOperateInPlace(nNewLength))
return;
if (nNewLength == 0) {
clear();
return;
}
RetainPtr<StringData> pNewData(StringData::Create(nNewLength));
if (m_pData) {
size_t nCopyLength = std::min(m_pData->m_nDataLength, nNewLength);
pNewData->CopyContents(m_pData->m_String, nCopyLength);
pNewData->m_nDataLength = nCopyLength;
} else {
pNewData->m_nDataLength = 0;
}
pNewData->m_String[pNewData->m_nDataLength] = 0;
m_pData.Swap(pNewData);
}
void WideString::AllocBeforeWrite(size_t nNewLength) {
if (m_pData && m_pData->CanOperateInPlace(nNewLength))
return;
if (nNewLength == 0) {
clear();
return;
}
m_pData.Reset(StringData::Create(nNewLength));
}
void WideString::ReleaseBuffer(size_t nNewLength) {
if (!m_pData)
return;
nNewLength = std::min(nNewLength, m_pData->m_nAllocLength);
if (nNewLength == 0) {
clear();
return;
}
DCHECK_EQ(m_pData->m_nRefs, 1);
m_pData->m_nDataLength = nNewLength;
m_pData->m_String[nNewLength] = 0;
if (m_pData->m_nAllocLength - nNewLength >= 32) {
// Over arbitrary threshold, so pay the price to relocate. Force copy to
// always occur by holding a second reference to the string.
WideString preserve(*this);
ReallocBeforeWrite(nNewLength);
}
}
void WideString::Reserve(size_t len) {
GetBuffer(len);
}
pdfium::span<wchar_t> WideString::GetBuffer(size_t nMinBufLength) {
if (!m_pData) {
if (nMinBufLength == 0)
return pdfium::span<wchar_t>();
m_pData.Reset(StringData::Create(nMinBufLength));
m_pData->m_nDataLength = 0;
m_pData->m_String[0] = 0;
return pdfium::span<wchar_t>(m_pData->m_String, m_pData->m_nAllocLength);
}
if (m_pData->CanOperateInPlace(nMinBufLength))
return pdfium::span<wchar_t>(m_pData->m_String, m_pData->m_nAllocLength);
nMinBufLength = std::max(nMinBufLength, m_pData->m_nDataLength);
if (nMinBufLength == 0)
return pdfium::span<wchar_t>();
RetainPtr<StringData> pNewData(StringData::Create(nMinBufLength));
pNewData->CopyContents(*m_pData);
pNewData->m_nDataLength = m_pData->m_nDataLength;
m_pData.Swap(pNewData);
return pdfium::span<wchar_t>(m_pData->m_String, m_pData->m_nAllocLength);
}
size_t WideString::Delete(size_t index, size_t count) {
if (!m_pData)
return 0;
size_t old_length = m_pData->m_nDataLength;
if (count == 0 || index != pdfium::clamp<size_t>(index, 0, old_length))
return old_length;
size_t removal_length = index + count;
if (removal_length > old_length)
return old_length;
ReallocBeforeWrite(old_length);
size_t chars_to_copy = old_length - removal_length + 1;
wmemmove(m_pData->m_String + index, m_pData->m_String + removal_length,
chars_to_copy);
m_pData->m_nDataLength = old_length - count;
return m_pData->m_nDataLength;
}
void WideString::Concat(const wchar_t* pSrcData, size_t nSrcLen) {
if (!pSrcData || nSrcLen == 0)
return;
if (!m_pData) {
m_pData.Reset(StringData::Create(pSrcData, nSrcLen));
return;
}
if (m_pData->CanOperateInPlace(m_pData->m_nDataLength + nSrcLen)) {
m_pData->CopyContentsAt(m_pData->m_nDataLength, pSrcData, nSrcLen);
m_pData->m_nDataLength += nSrcLen;
return;
}
size_t nConcatLen = std::max(m_pData->m_nDataLength / 2, nSrcLen);
RetainPtr<StringData> pNewData(
StringData::Create(m_pData->m_nDataLength + nConcatLen));
pNewData->CopyContents(*m_pData);
pNewData->CopyContentsAt(m_pData->m_nDataLength, pSrcData, nSrcLen);
pNewData->m_nDataLength = m_pData->m_nDataLength + nSrcLen;
m_pData.Swap(pNewData);
}
intptr_t WideString::ReferenceCountForTesting() const {
return m_pData ? m_pData->m_nRefs : 0;
}
ByteString WideString::ToASCII() const {
ByteString result;
result.Reserve(GetLength());
for (wchar_t wc : *this)
result.InsertAtBack(static_cast<char>(wc & 0x7f));
return result;
}
ByteString WideString::ToLatin1() const {
ByteString result;
result.Reserve(GetLength());
for (wchar_t wc : *this)
result.InsertAtBack(static_cast<char>(wc & 0xff));
return result;
}
ByteString WideString::ToDefANSI() const {
size_t dest_len =
FX_WideCharToMultiByte(FX_CodePage::kDefANSI, AsStringView(), {});
if (!dest_len)
return ByteString();
ByteString bstr;
{
// Span's lifetime must end before ReleaseBuffer() below.
pdfium::span<char> dest_buf = bstr.GetBuffer(dest_len);
FX_WideCharToMultiByte(FX_CodePage::kDefANSI, AsStringView(), dest_buf);
}
bstr.ReleaseBuffer(dest_len);
return bstr;
}
ByteString WideString::ToUTF8() const {
return FX_UTF8Encode(AsStringView());
}
ByteString WideString::ToUTF16LE() const {
if (!m_pData)
return ByteString("\0\0", 2);
ByteString result;
size_t len = m_pData->m_nDataLength;
{
// Span's lifetime must end before ReleaseBuffer() below.
pdfium::span<char> buffer = result.GetBuffer(len * 2 + 2);
for (size_t i = 0; i < len; i++) {
buffer[i * 2] = m_pData->m_String[i] & 0xff;
buffer[i * 2 + 1] = m_pData->m_String[i] >> 8;
}
buffer[len * 2] = 0;
buffer[len * 2 + 1] = 0;
}
result.ReleaseBuffer(len * 2 + 2);
return result;
}
WideString WideString::EncodeEntities() const {
WideString ret = *this;
ret.Replace(L"&", L"&amp;");
ret.Replace(L"<", L"&lt;");
ret.Replace(L">", L"&gt;");
ret.Replace(L"\'", L"&apos;");
ret.Replace(L"\"", L"&quot;");
return ret;
}
WideString WideString::Substr(size_t offset) const {
// Unsigned underflow is well-defined and out-of-range is handled by Substr().
return Substr(offset, GetLength() - offset);
}
WideString WideString::Substr(size_t first, size_t count) const {
if (!m_pData)
return WideString();
if (!IsValidIndex(first))
return WideString();
if (count == 0 || !IsValidLength(count))
return WideString();
if (!IsValidIndex(first + count - 1))
return WideString();
if (first == 0 && count == GetLength())
return *this;
WideString dest;
AllocCopy(dest, count, first);
return dest;
}
WideString WideString::First(size_t count) const {
return Substr(0, count);
}
WideString WideString::Last(size_t count) const {
// Unsigned underflow is well-defined and out-of-range is handled by Substr().
return Substr(GetLength() - count, count);
}
void WideString::AllocCopy(WideString& dest,
size_t nCopyLen,
size_t nCopyIndex) const {
if (nCopyLen == 0)
return;
RetainPtr<StringData> pNewData(
StringData::Create(m_pData->m_String + nCopyIndex, nCopyLen));
dest.m_pData.Swap(pNewData);
}
size_t WideString::Insert(size_t index, wchar_t ch) {
const size_t cur_length = GetLength();
if (!IsValidLength(index))
return cur_length;
const size_t new_length = cur_length + 1;
ReallocBeforeWrite(new_length);
wmemmove(m_pData->m_String + index + 1, m_pData->m_String + index,
new_length - index);
m_pData->m_String[index] = ch;
m_pData->m_nDataLength = new_length;
return new_length;
}
absl::optional<size_t> WideString::Find(wchar_t ch, size_t start) const {
if (!m_pData)
return absl::nullopt;
if (!IsValidIndex(start))
return absl::nullopt;
const wchar_t* pStr =
wmemchr(m_pData->m_String + start, ch, m_pData->m_nDataLength - start);
return pStr ? absl::optional<size_t>(
static_cast<size_t>(pStr - m_pData->m_String))
: absl::nullopt;
}
absl::optional<size_t> WideString::Find(WideStringView subStr,
size_t start) const {
if (!m_pData)
return absl::nullopt;
if (!IsValidIndex(start))
return absl::nullopt;
const wchar_t* pStr =
FX_wcsstr(m_pData->m_String + start, m_pData->m_nDataLength - start,
subStr.unterminated_c_str(), subStr.GetLength());
return pStr ? absl::optional<size_t>(
static_cast<size_t>(pStr - m_pData->m_String))
: absl::nullopt;
}
absl::optional<size_t> WideString::ReverseFind(wchar_t ch) const {
if (!m_pData)
return absl::nullopt;
size_t nLength = m_pData->m_nDataLength;
while (nLength--) {
if (m_pData->m_String[nLength] == ch)
return nLength;
}
return absl::nullopt;
}
void WideString::MakeLower() {
if (IsEmpty())
return;
ReallocBeforeWrite(m_pData->m_nDataLength);
FXSYS_wcslwr(m_pData->m_String);
}
void WideString::MakeUpper() {
if (IsEmpty())
return;
ReallocBeforeWrite(m_pData->m_nDataLength);
FXSYS_wcsupr(m_pData->m_String);
}
size_t WideString::Remove(wchar_t chRemove) {
if (IsEmpty())
return 0;
wchar_t* pstrSource = m_pData->m_String;
wchar_t* pstrEnd = m_pData->m_String + m_pData->m_nDataLength;
while (pstrSource < pstrEnd) {
if (*pstrSource == chRemove)
break;
pstrSource++;
}
if (pstrSource == pstrEnd)
return 0;
ptrdiff_t copied = pstrSource - m_pData->m_String;
ReallocBeforeWrite(m_pData->m_nDataLength);
pstrSource = m_pData->m_String + copied;
pstrEnd = m_pData->m_String + m_pData->m_nDataLength;
wchar_t* pstrDest = pstrSource;
while (pstrSource < pstrEnd) {
if (*pstrSource != chRemove) {
*pstrDest = *pstrSource;
pstrDest++;
}
pstrSource++;
}
*pstrDest = 0;
size_t count = static_cast<size_t>(pstrSource - pstrDest);
m_pData->m_nDataLength -= count;
return count;
}
size_t WideString::Replace(WideStringView pOld, WideStringView pNew) {
if (!m_pData || pOld.IsEmpty())
return 0;
size_t nSourceLen = pOld.GetLength();
size_t nReplacementLen = pNew.GetLength();
size_t count = 0;
const wchar_t* pStart = m_pData->m_String;
wchar_t* pEnd = m_pData->m_String + m_pData->m_nDataLength;
while (true) {
const wchar_t* pTarget =
FX_wcsstr(pStart, static_cast<size_t>(pEnd - pStart),
pOld.unterminated_c_str(), nSourceLen);
if (!pTarget)
break;
count++;
pStart = pTarget + nSourceLen;
}
if (count == 0)
return 0;
size_t nNewLength =
m_pData->m_nDataLength + (nReplacementLen - nSourceLen) * count;
if (nNewLength == 0) {
clear();
return count;
}
RetainPtr<StringData> pNewData(StringData::Create(nNewLength));
pStart = m_pData->m_String;
wchar_t* pDest = pNewData->m_String;
for (size_t i = 0; i < count; i++) {
const wchar_t* pTarget =
FX_wcsstr(pStart, static_cast<size_t>(pEnd - pStart),
pOld.unterminated_c_str(), nSourceLen);
wmemcpy(pDest, pStart, pTarget - pStart);
pDest += pTarget - pStart;
wmemcpy(pDest, pNew.unterminated_c_str(), pNew.GetLength());
pDest += pNew.GetLength();
pStart = pTarget + nSourceLen;
}
wmemcpy(pDest, pStart, pEnd - pStart);
m_pData.Swap(pNewData);
return count;
}
// static
WideString WideString::FromASCII(ByteStringView bstr) {
WideString result;
result.Reserve(bstr.GetLength());
for (char c : bstr)
result.InsertAtBack(static_cast<wchar_t>(c & 0x7f));
return result;
}
// static
WideString WideString::FromLatin1(ByteStringView bstr) {
WideString result;
result.Reserve(bstr.GetLength());
for (char c : bstr)
result.InsertAtBack(static_cast<wchar_t>(c & 0xff));
return result;
}
// static
WideString WideString::FromDefANSI(ByteStringView bstr) {
size_t dest_len = FX_MultiByteToWideChar(FX_CodePage::kDefANSI, bstr, {});
if (!dest_len)
return WideString();
WideString wstr;
{
// Span's lifetime must end before ReleaseBuffer() below.
pdfium::span<wchar_t> dest_buf = wstr.GetBuffer(dest_len);
FX_MultiByteToWideChar(FX_CodePage::kDefANSI, bstr, dest_buf);
}
wstr.ReleaseBuffer(dest_len);
return wstr;
}
// static
WideString WideString::FromUTF8(ByteStringView str) {
return FX_UTF8Decode(str);
}
// static
WideString WideString::FromUTF16LE(const unsigned short* wstr, size_t wlen) {
if (!wstr || wlen == 0)
return WideString();
WideString result;
{
// Span's lifetime must end before ReleaseBuffer() below.
pdfium::span<wchar_t> buf = result.GetBuffer(wlen);
for (size_t i = 0; i < wlen; i++)
buf[i] = wstr[i];
}
result.ReleaseBuffer(wlen);
return result;
}
WideString WideString::FromUTF16BE(const unsigned short* wstr, size_t wlen) {
if (!wstr || wlen == 0)
return WideString();
WideString result;
{
// Span's lifetime must end before ReleaseBuffer() below.
pdfium::span<wchar_t> buf = result.GetBuffer(wlen);
for (size_t i = 0; i < wlen; i++) {
auto wch = wstr[i];
wch = (wch >> 8) | (wch << 8);
buf[i] = wch;
}
}
result.ReleaseBuffer(wlen);
return result;
}
void WideString::SetAt(size_t index, wchar_t c) {
DCHECK(IsValidIndex(index));
ReallocBeforeWrite(m_pData->m_nDataLength);
m_pData->m_String[index] = c;
}
int WideString::Compare(const wchar_t* str) const {
if (m_pData)
return str ? wcscmp(m_pData->m_String, str) : 1;
return (!str || str[0] == 0) ? 0 : -1;
}
int WideString::Compare(const WideString& str) const {
if (!m_pData)
return str.m_pData ? -1 : 0;
if (!str.m_pData)
return 1;
size_t this_len = m_pData->m_nDataLength;
size_t that_len = str.m_pData->m_nDataLength;
size_t min_len = std::min(this_len, that_len);
int result = wmemcmp(m_pData->m_String, str.m_pData->m_String, min_len);
if (result != 0)
return result;
if (this_len == that_len)
return 0;
return this_len < that_len ? -1 : 1;
}
int WideString::CompareNoCase(const wchar_t* str) const {
if (m_pData)
return str ? FXSYS_wcsicmp(m_pData->m_String, str) : 1;
return (!str || str[0] == 0) ? 0 : -1;
}
size_t WideString::WStringLength(const unsigned short* str) {
size_t len = 0;
if (str)
while (str[len])
len++;
return len;
}
void WideString::Trim() {
TrimRight(kWideTrimChars);
TrimLeft(kWideTrimChars);
}
void WideString::Trim(wchar_t target) {
wchar_t str[2] = {target, 0};
TrimRight(str);
TrimLeft(str);
}
void WideString::Trim(WideStringView targets) {
TrimRight(targets);
TrimLeft(targets);
}
void WideString::TrimLeft() {
TrimLeft(kWideTrimChars);
}
void WideString::TrimLeft(wchar_t target) {
wchar_t str[2] = {target, 0};
TrimLeft(str);
}
void WideString::TrimLeft(WideStringView targets) {
if (!m_pData || targets.IsEmpty())
return;
size_t len = GetLength();
if (len == 0)
return;
size_t pos = 0;
while (pos < len) {
size_t i = 0;
while (i < targets.GetLength() &&
targets.CharAt(i) != m_pData->m_String[pos]) {
i++;
}
if (i == targets.GetLength())
break;
pos++;
}
if (!pos)
return;
ReallocBeforeWrite(len);
size_t nDataLength = len - pos;
memmove(m_pData->m_String, m_pData->m_String + pos,
(nDataLength + 1) * sizeof(wchar_t));
m_pData->m_nDataLength = nDataLength;
}
void WideString::TrimRight() {
TrimRight(kWideTrimChars);
}
void WideString::TrimRight(wchar_t target) {
wchar_t str[2] = {target, 0};
TrimRight(str);
}
void WideString::TrimRight(WideStringView targets) {
if (IsEmpty() || targets.IsEmpty())
return;
size_t pos = GetLength();
while (pos && targets.Contains(m_pData->m_String[pos - 1]))
pos--;
if (pos < m_pData->m_nDataLength) {
ReallocBeforeWrite(m_pData->m_nDataLength);
m_pData->m_String[pos] = 0;
m_pData->m_nDataLength = pos;
}
}
int WideString::GetInteger() const {
return m_pData ? FXSYS_wtoi(m_pData->m_String) : 0;
}
std::wostream& operator<<(std::wostream& os, const WideString& str) {
return os.write(str.c_str(), str.GetLength());
}
std::ostream& operator<<(std::ostream& os, const WideString& str) {
os << str.ToUTF8();
return os;
}
std::wostream& operator<<(std::wostream& os, WideStringView str) {
return os.write(str.unterminated_c_str(), str.GetLength());
}
std::ostream& operator<<(std::ostream& os, WideStringView str) {
os << FX_UTF8Encode(str);
return os;
}
} // namespace fxcrt
uint32_t FX_HashCode_GetW(WideStringView str) {
uint32_t dwHashCode = 0;
for (WideStringView::UnsignedType c : str)
dwHashCode = 1313 * dwHashCode + c;
return dwHashCode;
}
uint32_t FX_HashCode_GetLoweredW(WideStringView str) {
uint32_t dwHashCode = 0;
for (wchar_t c : str) // match FXSYS_towlower() arg type.
dwHashCode = 1313 * dwHashCode + FXSYS_towlower(c);
return dwHashCode;
}