// Copyright 2014 The PDFium Authors // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com #include "core/fxcrt/widestring.h" #include #include #include #include #include "core/fxcrt/fx_codepage.h" #include "core/fxcrt/fx_extension.h" #include "core/fxcrt/fx_safe_types.h" #include "core/fxcrt/fx_system.h" #include "core/fxcrt/string_pool_template.h" #include "third_party/base/check.h" #include "third_party/base/check_op.h" #include "third_party/base/cxx17_backports.h" #include "third_party/base/numerics/safe_math.h" template class fxcrt::StringDataTemplate; template class fxcrt::StringViewTemplate; template class fxcrt::StringPoolTemplate; template struct std::hash; #define FORCE_ANSI 0x10000 #define FORCE_UNICODE 0x20000 #define FORCE_INT64 0x40000 namespace { constexpr wchar_t kWideTrimChars[] = L"\x09\x0a\x0b\x0c\x0d\x20"; const wchar_t* FX_wcsstr(const wchar_t* haystack, size_t haystack_len, const wchar_t* needle, size_t needle_len) { if (needle_len > haystack_len || needle_len == 0) return nullptr; const wchar_t* end_ptr = haystack + haystack_len - needle_len; while (haystack <= end_ptr) { size_t i = 0; while (true) { if (haystack[i] != needle[i]) break; i++; if (i == needle_len) return haystack; } haystack++; } return nullptr; } absl::optional GuessSizeForVSWPrintf(const wchar_t* pFormat, va_list argList) { size_t nMaxLen = 0; for (const wchar_t* pStr = pFormat; *pStr != 0; pStr++) { if (*pStr != '%' || *(pStr = pStr + 1) == '%') { ++nMaxLen; continue; } int iWidth = 0; for (; *pStr != 0; pStr++) { if (*pStr == '#') { nMaxLen += 2; } else if (*pStr == '*') { iWidth = va_arg(argList, int); } else if (*pStr != '-' && *pStr != '+' && *pStr != '0' && *pStr != ' ') { break; } } if (iWidth == 0) { iWidth = FXSYS_wtoi(pStr); while (FXSYS_IsDecimalDigit(*pStr)) ++pStr; } if (iWidth < 0 || iWidth > 128 * 1024) return absl::nullopt; uint32_t nWidth = static_cast(iWidth); int iPrecision = 0; if (*pStr == '.') { pStr++; if (*pStr == '*') { iPrecision = va_arg(argList, int); pStr++; } else { iPrecision = FXSYS_wtoi(pStr); while (FXSYS_IsDecimalDigit(*pStr)) ++pStr; } } if (iPrecision < 0 || iPrecision > 128 * 1024) return absl::nullopt; uint32_t nPrecision = static_cast(iPrecision); int nModifier = 0; if (*pStr == L'I' && *(pStr + 1) == L'6' && *(pStr + 2) == L'4') { pStr += 3; nModifier = FORCE_INT64; } else { switch (*pStr) { case 'h': nModifier = FORCE_ANSI; pStr++; break; case 'l': nModifier = FORCE_UNICODE; pStr++; break; case 'F': case 'N': case 'L': pStr++; break; } } size_t nItemLen = 0; switch (*pStr | nModifier) { case 'c': case 'C': nItemLen = 2; va_arg(argList, int); break; case 'c' | FORCE_ANSI: case 'C' | FORCE_ANSI: nItemLen = 2; va_arg(argList, int); break; case 'c' | FORCE_UNICODE: case 'C' | FORCE_UNICODE: nItemLen = 2; va_arg(argList, int); break; case 's': { const wchar_t* pstrNextArg = va_arg(argList, const wchar_t*); if (pstrNextArg) { nItemLen = wcslen(pstrNextArg); if (nItemLen < 1) { nItemLen = 1; } } else { nItemLen = 6; } } break; case 'S': { const char* pstrNextArg = va_arg(argList, const char*); if (pstrNextArg) { nItemLen = strlen(pstrNextArg); if (nItemLen < 1) { nItemLen = 1; } } else { nItemLen = 6; } } break; case 's' | FORCE_ANSI: case 'S' | FORCE_ANSI: { const char* pstrNextArg = va_arg(argList, const char*); if (pstrNextArg) { nItemLen = strlen(pstrNextArg); if (nItemLen < 1) { nItemLen = 1; } } else { nItemLen = 6; } } break; case 's' | FORCE_UNICODE: case 'S' | FORCE_UNICODE: { const wchar_t* pstrNextArg = va_arg(argList, wchar_t*); if (pstrNextArg) { nItemLen = wcslen(pstrNextArg); if (nItemLen < 1) { nItemLen = 1; } } else { nItemLen = 6; } } break; } if (nItemLen != 0) { if (nPrecision != 0 && nItemLen > nPrecision) { nItemLen = nPrecision; } if (nItemLen < nWidth) { nItemLen = nWidth; } } else { switch (*pStr) { case 'd': case 'i': case 'u': case 'x': case 'X': case 'o': if (nModifier & FORCE_INT64) { va_arg(argList, int64_t); } else { va_arg(argList, int); } nItemLen = 32; if (nItemLen < nWidth + nPrecision) { nItemLen = nWidth + nPrecision; } break; case 'a': case 'A': case 'e': case 'E': case 'g': case 'G': va_arg(argList, double); nItemLen = 128; if (nItemLen < nWidth + nPrecision) { nItemLen = nWidth + nPrecision; } break; case 'f': if (nWidth + nPrecision > 100) { nItemLen = nPrecision + nWidth + 128; } else { double f; char pszTemp[256]; f = va_arg(argList, double); FXSYS_snprintf(pszTemp, sizeof(pszTemp), "%*.*f", nWidth, nPrecision + 6, f); nItemLen = strlen(pszTemp); } break; case 'p': va_arg(argList, void*); nItemLen = 32; if (nItemLen < nWidth + nPrecision) { nItemLen = nWidth + nPrecision; } break; case 'n': va_arg(argList, int*); break; } } nMaxLen += nItemLen; } nMaxLen += 32; // Fudge factor. return nMaxLen; } // Returns string unless we ran out of space. absl::optional TryVSWPrintf(size_t size, const wchar_t* pFormat, va_list argList) { if (!size) return absl::nullopt; WideString str; { // Span's lifetime must end before ReleaseBuffer() below. pdfium::span buffer = str.GetBuffer(size); // In the following two calls, there's always space in the WideString // for a terminating NUL that's not included in the span. // For vswprintf(), MSAN won't untaint the buffer on a truncated write's // -1 return code even though the buffer is written. Probably just as well // not to trust the vendor's implementation to write anything anyways. // See https://crbug.com/705912. memset(buffer.data(), 0, (size + 1) * sizeof(wchar_t)); int ret = vswprintf(buffer.data(), size + 1, pFormat, argList); bool bSufficientBuffer = ret >= 0 || buffer[size - 1] == 0; if (!bSufficientBuffer) return absl::nullopt; } str.ReleaseBuffer(str.GetStringLength()); return str; } } // namespace namespace fxcrt { static_assert(sizeof(WideString) <= sizeof(wchar_t*), "Strings must not require more space than pointers"); // static WideString WideString::FormatInteger(int i) { wchar_t wbuf[32]; swprintf(wbuf, std::size(wbuf), L"%d", i); return WideString(wbuf); } // static WideString WideString::FormatV(const wchar_t* format, va_list argList) { va_list argListCopy; va_copy(argListCopy, argList); auto guess = GuessSizeForVSWPrintf(format, argListCopy); va_end(argListCopy); if (!guess.has_value()) { return WideString(); } int maxLen = pdfium::base::checked_cast(guess.value()); while (maxLen < 32 * 1024) { va_copy(argListCopy, argList); absl::optional ret = TryVSWPrintf(static_cast(maxLen), format, argListCopy); va_end(argListCopy); if (ret.has_value()) return ret.value(); maxLen *= 2; } return WideString(); } // static WideString WideString::Format(const wchar_t* pFormat, ...) { va_list argList; va_start(argList, pFormat); WideString ret = FormatV(pFormat, argList); va_end(argList); return ret; } WideString::WideString() = default; WideString::WideString(const WideString& other) : m_pData(other.m_pData) {} WideString::WideString(WideString&& other) noexcept { m_pData.Swap(other.m_pData); } WideString::WideString(const wchar_t* pStr, size_t nLen) { if (nLen) m_pData.Reset(StringData::Create(pStr, nLen)); } WideString::WideString(wchar_t ch) { m_pData.Reset(StringData::Create(1)); m_pData->m_String[0] = ch; } WideString::WideString(const wchar_t* ptr) : WideString(ptr, ptr ? wcslen(ptr) : 0) {} WideString::WideString(WideStringView stringSrc) { if (!stringSrc.IsEmpty()) { m_pData.Reset(StringData::Create(stringSrc.unterminated_c_str(), stringSrc.GetLength())); } } WideString::WideString(WideStringView str1, WideStringView str2) { FX_SAFE_SIZE_T nSafeLen = str1.GetLength(); nSafeLen += str2.GetLength(); size_t nNewLen = nSafeLen.ValueOrDie(); if (nNewLen == 0) return; m_pData.Reset(StringData::Create(nNewLen)); m_pData->CopyContents(str1.unterminated_c_str(), str1.GetLength()); m_pData->CopyContentsAt(str1.GetLength(), str2.unterminated_c_str(), str2.GetLength()); } WideString::WideString(const std::initializer_list& list) { FX_SAFE_SIZE_T nSafeLen = 0; for (const auto& item : list) nSafeLen += item.GetLength(); size_t nNewLen = nSafeLen.ValueOrDie(); if (nNewLen == 0) return; m_pData.Reset(StringData::Create(nNewLen)); size_t nOffset = 0; for (const auto& item : list) { m_pData->CopyContentsAt(nOffset, item.unterminated_c_str(), item.GetLength()); nOffset += item.GetLength(); } } WideString::~WideString() = default; void WideString::clear() { if (m_pData && m_pData->CanOperateInPlace(0)) { m_pData->m_nDataLength = 0; return; } m_pData.Reset(); } WideString& WideString::operator=(const wchar_t* str) { if (!str || !str[0]) clear(); else AssignCopy(str, wcslen(str)); return *this; } WideString& WideString::operator=(WideStringView str) { if (str.IsEmpty()) clear(); else AssignCopy(str.unterminated_c_str(), str.GetLength()); return *this; } WideString& WideString::operator=(const WideString& that) { if (m_pData != that.m_pData) m_pData = that.m_pData; return *this; } WideString& WideString::operator=(WideString&& that) noexcept { if (m_pData != that.m_pData) m_pData = std::move(that.m_pData); return *this; } WideString& WideString::operator+=(const wchar_t* str) { if (str) Concat(str, wcslen(str)); return *this; } WideString& WideString::operator+=(wchar_t ch) { Concat(&ch, 1); return *this; } WideString& WideString::operator+=(const WideString& str) { if (str.m_pData) Concat(str.m_pData->m_String, str.m_pData->m_nDataLength); return *this; } WideString& WideString::operator+=(WideStringView str) { if (!str.IsEmpty()) Concat(str.unterminated_c_str(), str.GetLength()); return *this; } bool WideString::operator==(const wchar_t* ptr) const { if (!m_pData) return !ptr || !ptr[0]; if (!ptr) return m_pData->m_nDataLength == 0; return wcslen(ptr) == m_pData->m_nDataLength && wmemcmp(ptr, m_pData->m_String, m_pData->m_nDataLength) == 0; } bool WideString::operator==(WideStringView str) const { if (!m_pData) return str.IsEmpty(); return m_pData->m_nDataLength == str.GetLength() && wmemcmp(m_pData->m_String, str.unterminated_c_str(), str.GetLength()) == 0; } bool WideString::operator==(const WideString& other) const { if (m_pData == other.m_pData) return true; if (IsEmpty()) return other.IsEmpty(); if (other.IsEmpty()) return false; return other.m_pData->m_nDataLength == m_pData->m_nDataLength && wmemcmp(other.m_pData->m_String, m_pData->m_String, m_pData->m_nDataLength) == 0; } bool WideString::operator<(const wchar_t* ptr) const { return Compare(ptr) < 0; } bool WideString::operator<(WideStringView str) const { if (!m_pData && !str.unterminated_c_str()) return false; if (c_str() == str.unterminated_c_str()) return false; size_t len = GetLength(); size_t other_len = str.GetLength(); int result = wmemcmp(c_str(), str.unterminated_c_str(), std::min(len, other_len)); return result < 0 || (result == 0 && len < other_len); } bool WideString::operator<(const WideString& other) const { return Compare(other) < 0; } void WideString::AssignCopy(const wchar_t* pSrcData, size_t nSrcLen) { AllocBeforeWrite(nSrcLen); m_pData->CopyContents(pSrcData, nSrcLen); m_pData->m_nDataLength = nSrcLen; } void WideString::ReallocBeforeWrite(size_t nNewLength) { if (m_pData && m_pData->CanOperateInPlace(nNewLength)) return; if (nNewLength == 0) { clear(); return; } RetainPtr pNewData(StringData::Create(nNewLength)); if (m_pData) { size_t nCopyLength = std::min(m_pData->m_nDataLength, nNewLength); pNewData->CopyContents(m_pData->m_String, nCopyLength); pNewData->m_nDataLength = nCopyLength; } else { pNewData->m_nDataLength = 0; } pNewData->m_String[pNewData->m_nDataLength] = 0; m_pData.Swap(pNewData); } void WideString::AllocBeforeWrite(size_t nNewLength) { if (m_pData && m_pData->CanOperateInPlace(nNewLength)) return; if (nNewLength == 0) { clear(); return; } m_pData.Reset(StringData::Create(nNewLength)); } void WideString::ReleaseBuffer(size_t nNewLength) { if (!m_pData) return; nNewLength = std::min(nNewLength, m_pData->m_nAllocLength); if (nNewLength == 0) { clear(); return; } DCHECK_EQ(m_pData->m_nRefs, 1); m_pData->m_nDataLength = nNewLength; m_pData->m_String[nNewLength] = 0; if (m_pData->m_nAllocLength - nNewLength >= 32) { // Over arbitrary threshold, so pay the price to relocate. Force copy to // always occur by holding a second reference to the string. WideString preserve(*this); ReallocBeforeWrite(nNewLength); } } void WideString::Reserve(size_t len) { GetBuffer(len); } pdfium::span WideString::GetBuffer(size_t nMinBufLength) { if (!m_pData) { if (nMinBufLength == 0) return pdfium::span(); m_pData.Reset(StringData::Create(nMinBufLength)); m_pData->m_nDataLength = 0; m_pData->m_String[0] = 0; return pdfium::span(m_pData->m_String, m_pData->m_nAllocLength); } if (m_pData->CanOperateInPlace(nMinBufLength)) return pdfium::span(m_pData->m_String, m_pData->m_nAllocLength); nMinBufLength = std::max(nMinBufLength, m_pData->m_nDataLength); if (nMinBufLength == 0) return pdfium::span(); RetainPtr pNewData(StringData::Create(nMinBufLength)); pNewData->CopyContents(*m_pData); pNewData->m_nDataLength = m_pData->m_nDataLength; m_pData.Swap(pNewData); return pdfium::span(m_pData->m_String, m_pData->m_nAllocLength); } size_t WideString::Delete(size_t index, size_t count) { if (!m_pData) return 0; size_t old_length = m_pData->m_nDataLength; if (count == 0 || index != pdfium::clamp(index, 0, old_length)) return old_length; size_t removal_length = index + count; if (removal_length > old_length) return old_length; ReallocBeforeWrite(old_length); size_t chars_to_copy = old_length - removal_length + 1; wmemmove(m_pData->m_String + index, m_pData->m_String + removal_length, chars_to_copy); m_pData->m_nDataLength = old_length - count; return m_pData->m_nDataLength; } void WideString::Concat(const wchar_t* pSrcData, size_t nSrcLen) { if (!pSrcData || nSrcLen == 0) return; if (!m_pData) { m_pData.Reset(StringData::Create(pSrcData, nSrcLen)); return; } if (m_pData->CanOperateInPlace(m_pData->m_nDataLength + nSrcLen)) { m_pData->CopyContentsAt(m_pData->m_nDataLength, pSrcData, nSrcLen); m_pData->m_nDataLength += nSrcLen; return; } size_t nConcatLen = std::max(m_pData->m_nDataLength / 2, nSrcLen); RetainPtr pNewData( StringData::Create(m_pData->m_nDataLength + nConcatLen)); pNewData->CopyContents(*m_pData); pNewData->CopyContentsAt(m_pData->m_nDataLength, pSrcData, nSrcLen); pNewData->m_nDataLength = m_pData->m_nDataLength + nSrcLen; m_pData.Swap(pNewData); } intptr_t WideString::ReferenceCountForTesting() const { return m_pData ? m_pData->m_nRefs : 0; } ByteString WideString::ToASCII() const { ByteString result; result.Reserve(GetLength()); for (wchar_t wc : *this) result.InsertAtBack(static_cast(wc & 0x7f)); return result; } ByteString WideString::ToLatin1() const { ByteString result; result.Reserve(GetLength()); for (wchar_t wc : *this) result.InsertAtBack(static_cast(wc & 0xff)); return result; } ByteString WideString::ToDefANSI() const { size_t dest_len = FX_WideCharToMultiByte(FX_CodePage::kDefANSI, AsStringView(), {}); if (!dest_len) return ByteString(); ByteString bstr; { // Span's lifetime must end before ReleaseBuffer() below. pdfium::span dest_buf = bstr.GetBuffer(dest_len); FX_WideCharToMultiByte(FX_CodePage::kDefANSI, AsStringView(), dest_buf); } bstr.ReleaseBuffer(dest_len); return bstr; } ByteString WideString::ToUTF8() const { return FX_UTF8Encode(AsStringView()); } ByteString WideString::ToUTF16LE() const { if (!m_pData) return ByteString("\0\0", 2); ByteString result; size_t len = m_pData->m_nDataLength; { // Span's lifetime must end before ReleaseBuffer() below. pdfium::span buffer = result.GetBuffer(len * 2 + 2); for (size_t i = 0; i < len; i++) { buffer[i * 2] = m_pData->m_String[i] & 0xff; buffer[i * 2 + 1] = m_pData->m_String[i] >> 8; } buffer[len * 2] = 0; buffer[len * 2 + 1] = 0; } result.ReleaseBuffer(len * 2 + 2); return result; } WideString WideString::EncodeEntities() const { WideString ret = *this; ret.Replace(L"&", L"&"); ret.Replace(L"<", L"<"); ret.Replace(L">", L">"); ret.Replace(L"\'", L"'"); ret.Replace(L"\"", L"""); return ret; } WideString WideString::Substr(size_t offset) const { // Unsigned underflow is well-defined and out-of-range is handled by Substr(). return Substr(offset, GetLength() - offset); } WideString WideString::Substr(size_t first, size_t count) const { if (!m_pData) return WideString(); if (!IsValidIndex(first)) return WideString(); if (count == 0 || !IsValidLength(count)) return WideString(); if (!IsValidIndex(first + count - 1)) return WideString(); if (first == 0 && count == GetLength()) return *this; WideString dest; AllocCopy(dest, count, first); return dest; } WideString WideString::First(size_t count) const { return Substr(0, count); } WideString WideString::Last(size_t count) const { // Unsigned underflow is well-defined and out-of-range is handled by Substr(). return Substr(GetLength() - count, count); } void WideString::AllocCopy(WideString& dest, size_t nCopyLen, size_t nCopyIndex) const { if (nCopyLen == 0) return; RetainPtr pNewData( StringData::Create(m_pData->m_String + nCopyIndex, nCopyLen)); dest.m_pData.Swap(pNewData); } size_t WideString::Insert(size_t index, wchar_t ch) { const size_t cur_length = GetLength(); if (!IsValidLength(index)) return cur_length; const size_t new_length = cur_length + 1; ReallocBeforeWrite(new_length); wmemmove(m_pData->m_String + index + 1, m_pData->m_String + index, new_length - index); m_pData->m_String[index] = ch; m_pData->m_nDataLength = new_length; return new_length; } absl::optional WideString::Find(wchar_t ch, size_t start) const { if (!m_pData) return absl::nullopt; if (!IsValidIndex(start)) return absl::nullopt; const wchar_t* pStr = wmemchr(m_pData->m_String + start, ch, m_pData->m_nDataLength - start); return pStr ? absl::optional( static_cast(pStr - m_pData->m_String)) : absl::nullopt; } absl::optional WideString::Find(WideStringView subStr, size_t start) const { if (!m_pData) return absl::nullopt; if (!IsValidIndex(start)) return absl::nullopt; const wchar_t* pStr = FX_wcsstr(m_pData->m_String + start, m_pData->m_nDataLength - start, subStr.unterminated_c_str(), subStr.GetLength()); return pStr ? absl::optional( static_cast(pStr - m_pData->m_String)) : absl::nullopt; } absl::optional WideString::ReverseFind(wchar_t ch) const { if (!m_pData) return absl::nullopt; size_t nLength = m_pData->m_nDataLength; while (nLength--) { if (m_pData->m_String[nLength] == ch) return nLength; } return absl::nullopt; } void WideString::MakeLower() { if (IsEmpty()) return; ReallocBeforeWrite(m_pData->m_nDataLength); FXSYS_wcslwr(m_pData->m_String); } void WideString::MakeUpper() { if (IsEmpty()) return; ReallocBeforeWrite(m_pData->m_nDataLength); FXSYS_wcsupr(m_pData->m_String); } size_t WideString::Remove(wchar_t chRemove) { if (IsEmpty()) return 0; wchar_t* pstrSource = m_pData->m_String; wchar_t* pstrEnd = m_pData->m_String + m_pData->m_nDataLength; while (pstrSource < pstrEnd) { if (*pstrSource == chRemove) break; pstrSource++; } if (pstrSource == pstrEnd) return 0; ptrdiff_t copied = pstrSource - m_pData->m_String; ReallocBeforeWrite(m_pData->m_nDataLength); pstrSource = m_pData->m_String + copied; pstrEnd = m_pData->m_String + m_pData->m_nDataLength; wchar_t* pstrDest = pstrSource; while (pstrSource < pstrEnd) { if (*pstrSource != chRemove) { *pstrDest = *pstrSource; pstrDest++; } pstrSource++; } *pstrDest = 0; size_t count = static_cast(pstrSource - pstrDest); m_pData->m_nDataLength -= count; return count; } size_t WideString::Replace(WideStringView pOld, WideStringView pNew) { if (!m_pData || pOld.IsEmpty()) return 0; size_t nSourceLen = pOld.GetLength(); size_t nReplacementLen = pNew.GetLength(); size_t count = 0; const wchar_t* pStart = m_pData->m_String; wchar_t* pEnd = m_pData->m_String + m_pData->m_nDataLength; while (true) { const wchar_t* pTarget = FX_wcsstr(pStart, static_cast(pEnd - pStart), pOld.unterminated_c_str(), nSourceLen); if (!pTarget) break; count++; pStart = pTarget + nSourceLen; } if (count == 0) return 0; size_t nNewLength = m_pData->m_nDataLength + (nReplacementLen - nSourceLen) * count; if (nNewLength == 0) { clear(); return count; } RetainPtr pNewData(StringData::Create(nNewLength)); pStart = m_pData->m_String; wchar_t* pDest = pNewData->m_String; for (size_t i = 0; i < count; i++) { const wchar_t* pTarget = FX_wcsstr(pStart, static_cast(pEnd - pStart), pOld.unterminated_c_str(), nSourceLen); wmemcpy(pDest, pStart, pTarget - pStart); pDest += pTarget - pStart; wmemcpy(pDest, pNew.unterminated_c_str(), pNew.GetLength()); pDest += pNew.GetLength(); pStart = pTarget + nSourceLen; } wmemcpy(pDest, pStart, pEnd - pStart); m_pData.Swap(pNewData); return count; } // static WideString WideString::FromASCII(ByteStringView bstr) { WideString result; result.Reserve(bstr.GetLength()); for (char c : bstr) result.InsertAtBack(static_cast(c & 0x7f)); return result; } // static WideString WideString::FromLatin1(ByteStringView bstr) { WideString result; result.Reserve(bstr.GetLength()); for (char c : bstr) result.InsertAtBack(static_cast(c & 0xff)); return result; } // static WideString WideString::FromDefANSI(ByteStringView bstr) { size_t dest_len = FX_MultiByteToWideChar(FX_CodePage::kDefANSI, bstr, {}); if (!dest_len) return WideString(); WideString wstr; { // Span's lifetime must end before ReleaseBuffer() below. pdfium::span dest_buf = wstr.GetBuffer(dest_len); FX_MultiByteToWideChar(FX_CodePage::kDefANSI, bstr, dest_buf); } wstr.ReleaseBuffer(dest_len); return wstr; } // static WideString WideString::FromUTF8(ByteStringView str) { return FX_UTF8Decode(str); } // static WideString WideString::FromUTF16LE(const unsigned short* wstr, size_t wlen) { if (!wstr || wlen == 0) return WideString(); WideString result; { // Span's lifetime must end before ReleaseBuffer() below. pdfium::span buf = result.GetBuffer(wlen); for (size_t i = 0; i < wlen; i++) buf[i] = wstr[i]; } result.ReleaseBuffer(wlen); return result; } WideString WideString::FromUTF16BE(const unsigned short* wstr, size_t wlen) { if (!wstr || wlen == 0) return WideString(); WideString result; { // Span's lifetime must end before ReleaseBuffer() below. pdfium::span buf = result.GetBuffer(wlen); for (size_t i = 0; i < wlen; i++) { auto wch = wstr[i]; wch = (wch >> 8) | (wch << 8); buf[i] = wch; } } result.ReleaseBuffer(wlen); return result; } void WideString::SetAt(size_t index, wchar_t c) { DCHECK(IsValidIndex(index)); ReallocBeforeWrite(m_pData->m_nDataLength); m_pData->m_String[index] = c; } int WideString::Compare(const wchar_t* str) const { if (m_pData) return str ? wcscmp(m_pData->m_String, str) : 1; return (!str || str[0] == 0) ? 0 : -1; } int WideString::Compare(const WideString& str) const { if (!m_pData) return str.m_pData ? -1 : 0; if (!str.m_pData) return 1; size_t this_len = m_pData->m_nDataLength; size_t that_len = str.m_pData->m_nDataLength; size_t min_len = std::min(this_len, that_len); int result = wmemcmp(m_pData->m_String, str.m_pData->m_String, min_len); if (result != 0) return result; if (this_len == that_len) return 0; return this_len < that_len ? -1 : 1; } int WideString::CompareNoCase(const wchar_t* str) const { if (m_pData) return str ? FXSYS_wcsicmp(m_pData->m_String, str) : 1; return (!str || str[0] == 0) ? 0 : -1; } size_t WideString::WStringLength(const unsigned short* str) { size_t len = 0; if (str) while (str[len]) len++; return len; } void WideString::Trim() { TrimRight(kWideTrimChars); TrimLeft(kWideTrimChars); } void WideString::Trim(wchar_t target) { wchar_t str[2] = {target, 0}; TrimRight(str); TrimLeft(str); } void WideString::Trim(WideStringView targets) { TrimRight(targets); TrimLeft(targets); } void WideString::TrimLeft() { TrimLeft(kWideTrimChars); } void WideString::TrimLeft(wchar_t target) { wchar_t str[2] = {target, 0}; TrimLeft(str); } void WideString::TrimLeft(WideStringView targets) { if (!m_pData || targets.IsEmpty()) return; size_t len = GetLength(); if (len == 0) return; size_t pos = 0; while (pos < len) { size_t i = 0; while (i < targets.GetLength() && targets.CharAt(i) != m_pData->m_String[pos]) { i++; } if (i == targets.GetLength()) break; pos++; } if (!pos) return; ReallocBeforeWrite(len); size_t nDataLength = len - pos; memmove(m_pData->m_String, m_pData->m_String + pos, (nDataLength + 1) * sizeof(wchar_t)); m_pData->m_nDataLength = nDataLength; } void WideString::TrimRight() { TrimRight(kWideTrimChars); } void WideString::TrimRight(wchar_t target) { wchar_t str[2] = {target, 0}; TrimRight(str); } void WideString::TrimRight(WideStringView targets) { if (IsEmpty() || targets.IsEmpty()) return; size_t pos = GetLength(); while (pos && targets.Contains(m_pData->m_String[pos - 1])) pos--; if (pos < m_pData->m_nDataLength) { ReallocBeforeWrite(m_pData->m_nDataLength); m_pData->m_String[pos] = 0; m_pData->m_nDataLength = pos; } } int WideString::GetInteger() const { return m_pData ? FXSYS_wtoi(m_pData->m_String) : 0; } std::wostream& operator<<(std::wostream& os, const WideString& str) { return os.write(str.c_str(), str.GetLength()); } std::ostream& operator<<(std::ostream& os, const WideString& str) { os << str.ToUTF8(); return os; } std::wostream& operator<<(std::wostream& os, WideStringView str) { return os.write(str.unterminated_c_str(), str.GetLength()); } std::ostream& operator<<(std::ostream& os, WideStringView str) { os << FX_UTF8Encode(str); return os; } } // namespace fxcrt uint32_t FX_HashCode_GetW(WideStringView str) { uint32_t dwHashCode = 0; for (WideStringView::UnsignedType c : str) dwHashCode = 1313 * dwHashCode + c; return dwHashCode; } uint32_t FX_HashCode_GetLoweredW(WideStringView str) { uint32_t dwHashCode = 0; for (wchar_t c : str) // match FXSYS_towlower() arg type. dwHashCode = 1313 * dwHashCode + FXSYS_towlower(c); return dwHashCode; }