Qt
Internal/Contributor docs for the Qt SDK. Note: These are NOT official API docs; those are found at https://doc.qt.io/
Loading...
Searching...
No Matches
widestring.h
Go to the documentation of this file.
1// Copyright 2017 The PDFium Authors
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
5// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
6
7#ifndef CORE_FXCRT_WIDESTRING_H_
8#define CORE_FXCRT_WIDESTRING_H_
9
10#include <stdarg.h>
11#include <stddef.h>
12#include <stdint.h>
13
14#include <iosfwd>
15#include <utility>
16
17#include "core/fxcrt/compiler_specific.h"
18#include "core/fxcrt/span.h"
19#include "core/fxcrt/string_template.h"
20
21namespace fxcrt {
22
23class ByteString;
24
25// A mutable string with shared buffers using copy-on-write semantics that
26// avoids the cost of std::string's iterator stability guarantees.
27// TODO(crbug.com/pdfium/2031): Consider switching to `char16_t` instead.
28class WideString : public StringTemplate<wchar_t> {
29 public:
30 [[nodiscard]] static WideString FormatInteger(int i);
31 [[nodiscard]] static WideString Format(const wchar_t* pFormat, ...);
32 [[nodiscard]] static WideString FormatV(const wchar_t* lpszFormat,
33 va_list argList);
34
35 WideString() = default;
36 WideString(const WideString& other) = default;
37
38 // Move-construct a WideString. After construction, |other| is empty.
39 WideString(WideString&& other) noexcept = default;
40
41 ~WideString() = default;
42
43 UNSAFE_BUFFER_USAGE WideString(const wchar_t* pStr, size_t len);
44
45 // Make a one-character string from one wide char.
46 explicit WideString(wchar_t ch);
47
48 // Deliberately implicit to avoid calling on every string literal.
49 // NOLINTNEXTLINE(runtime/explicit)
50 WideString(const wchar_t* ptr);
51
52 // No implicit conversions from byte strings.
53 // NOLINTNEXTLINE(runtime/explicit)
54 WideString(char) = delete;
55
56 explicit WideString(WideStringView str);
58 WideString(const std::initializer_list<WideStringView>& list);
59
64 [[nodiscard]] static WideString FromUTF16LE(pdfium::span<const uint8_t> data);
65 [[nodiscard]] static WideString FromUTF16BE(pdfium::span<const uint8_t> data);
66
67 WideString& operator=(const wchar_t* str);
69 WideString& operator=(const WideString& that);
70
71 // Move-assign a WideString. After assignment, |that| is empty.
72 WideString& operator=(WideString&& that) noexcept;
73
74 WideString& operator+=(const wchar_t* str);
75 WideString& operator+=(wchar_t ch);
76 WideString& operator+=(const WideString& str);
78
79 bool operator==(const wchar_t* ptr) const;
80 bool operator==(WideStringView str) const;
81 bool operator==(const WideString& other) const;
82
83 bool operator!=(const wchar_t* ptr) const { return !(*this == ptr); }
84 bool operator!=(WideStringView str) const { return !(*this == str); }
85 bool operator!=(const WideString& other) const { return !(*this == other); }
86
87 bool operator<(const wchar_t* ptr) const;
88 bool operator<(WideStringView str) const;
89 bool operator<(const WideString& other) const;
90
91 int Compare(const wchar_t* str) const;
92 int Compare(const WideString& str) const;
93 int CompareNoCase(const wchar_t* str) const;
94
95 WideString Substr(size_t offset) const;
96 WideString Substr(size_t first, size_t count) const;
97 WideString First(size_t count) const;
98 WideString Last(size_t count) const;
99
100 void MakeLower();
101 void MakeUpper();
102
103 // Trim a canonical set of characters from the widestring.
104 void TrimWhitespace();
105 void TrimWhitespaceFront();
106 void TrimWhitespaceBack();
107
108 int GetInteger() const;
109
110 bool IsASCII() const { return AsStringView().IsASCII(); }
111 bool EqualsASCII(ByteStringView that) const {
112 return AsStringView().EqualsASCII(that);
113 }
115 return AsStringView().EqualsASCIINoCase(that);
116 }
117
118 ByteString ToASCII() const;
119 ByteString ToLatin1() const;
120 ByteString ToDefANSI() const;
121 ByteString ToUTF8() const;
122
123 // These methods will add \0\0 to the end of the string to represent the
124 // two-byte terminator. These values are part of the string itself, so
125 // GetLength() will include them.
126 ByteString ToUTF16LE() const;
127 ByteString ToUCS2LE() const;
128
129 // Replace the characters &<>'" with HTML entities.
131
132 protected:
133 intptr_t ReferenceCountForTesting() const;
134
135 friend class WideString_Assign_Test;
136 friend class WideString_ConcatInPlace_Test;
137 friend class WideString_Construct_Test;
138 friend class StringPool_WideString_Test;
139};
140
142 return WideString(str1, str2);
143}
144inline WideString operator+(WideStringView str1, const wchar_t* str2) {
145 return WideString(str1, str2);
146}
147inline WideString operator+(const wchar_t* str1, WideStringView str2) {
148 return WideString(str1, str2);
149}
150inline WideString operator+(WideStringView str1, wchar_t ch) {
151 return WideString(str1, WideStringView(ch));
152}
153inline WideString operator+(wchar_t ch, WideStringView str2) {
154 return WideString(WideStringView(ch), str2);
155}
156inline WideString operator+(const WideString& str1, const WideString& str2) {
157 return WideString(str1.AsStringView(), str2.AsStringView());
158}
159inline WideString operator+(const WideString& str1, wchar_t ch) {
160 return WideString(str1.AsStringView(), WideStringView(ch));
161}
162inline WideString operator+(wchar_t ch, const WideString& str2) {
163 return WideString(WideStringView(ch), str2.AsStringView());
164}
165inline WideString operator+(const WideString& str1, const wchar_t* str2) {
166 return WideString(str1.AsStringView(), str2);
167}
168inline WideString operator+(const wchar_t* str1, const WideString& str2) {
169 return WideString(str1, str2.AsStringView());
170}
171inline WideString operator+(const WideString& str1, WideStringView str2) {
172 return WideString(str1.AsStringView(), str2);
173}
174inline WideString operator+(WideStringView str1, const WideString& str2) {
175 return WideString(str1, str2.AsStringView());
176}
177inline bool operator==(const wchar_t* lhs, const WideString& rhs) {
178 return rhs == lhs;
179}
180inline bool operator==(WideStringView lhs, const WideString& rhs) {
181 return rhs == lhs;
182}
183inline bool operator!=(const wchar_t* lhs, const WideString& rhs) {
184 return rhs != lhs;
185}
186inline bool operator!=(WideStringView lhs, const WideString& rhs) {
187 return rhs != lhs;
188}
189inline bool operator<(const wchar_t* lhs, const WideString& rhs) {
190 return rhs.Compare(lhs) > 0;
191}
192
193std::wostream& operator<<(std::wostream& os, const WideString& str);
194std::ostream& operator<<(std::ostream& os, const WideString& str);
195std::wostream& operator<<(std::wostream& os, WideStringView str);
196std::ostream& operator<<(std::ostream& os, WideStringView str);
197
198// This is declared here for use in gtest-based tests but is defined in a test
199// support target. This should not be used in production code. Just use
200// operator<< from above instead.
201// In some cases, gtest will automatically use operator<< as well, but in this
202// case, it needs PrintTo() because WideString looks like a container to gtest.
203void PrintTo(const WideString& str, std::ostream* os);
204
205} // namespace fxcrt
206
208
209uint32_t FX_HashCode_GetW(WideStringView str);
211
212namespace std {
213
214template <>
216 size_t operator()(const WideString& str) const {
217 return FX_HashCode_GetW(str.AsStringView());
218 }
219};
220
221} // namespace std
222
223extern template struct std::hash<WideString>;
224
225#endif // CORE_FXCRT_WIDESTRING_H_
fxcrt::ByteString ByteString
Definition bytestring.h:180
#define DCHECK
Definition check.h:33
CPDF_ArrayLocker(RetainPtr< CPDF_Array > pArray)
const_iterator begin() const
Definition cpdf_array.h:185
const_iterator end() const
Definition cpdf_array.h:189
CPDF_ArrayLocker(const CPDF_Array *pArray)
CPDF_ArrayLocker(RetainPtr< const CPDF_Array > pArray)
size_t size() const
Definition cpdf_array.h:41
void Append(RetainPtr< CPDF_Stream > stream)=delete
bool GetBooleanAt(size_t index, bool bDefault) const
void SetAt(size_t index, RetainPtr< CPDF_Object > object)
RetainPtr< CPDF_Dictionary > GetMutableDictAt(size_t index)
RetainPtr< CPDF_Object > CloneNonCyclic(bool bDirect, std::set< const CPDF_Object * > *pVisited) const override
bool IsEmpty() const
Definition cpdf_array.h:40
RetainPtr< const CPDF_Object > GetDirectObjectAt(size_t index) const
RetainPtr< const CPDF_Stream > GetStreamAt(size_t index) const
Type GetType() const override
CPDF_Array * AsMutableArray() override
RetainPtr< const CPDF_Object > GetObjectAt(size_t index) const
RetainPtr< CPDF_Object > GetMutableObjectAt(size_t index)
std::enable_if<!CanInternStrings< T >::value, RetainPtr< T > >::type AppendNew(Args &&... args)
Definition cpdf_array.h:85
WideString GetUnicodeTextAt(size_t index) const
RetainPtr< CPDF_Array > GetMutableArrayAt(size_t index)
RetainPtr< CPDF_Object > Clone() const override
std::enable_if< CanInternStrings< T >::value, RetainPtr< T > >::type AppendNew(Args &&... args)
Definition cpdf_array.h:94
RetainPtr< const CPDF_Dictionary > GetDictAt(size_t index) const
std::vector< RetainPtr< CPDF_Object > >::const_iterator const_iterator
Definition cpdf_array.h:29
std::enable_if<!CanInternStrings< T >::value, RetainPtr< T > >::type InsertNewAt(size_t index, Args &&... args)
Definition cpdf_array.h:115
bool IsLocked() const
Definition cpdf_array.h:150
RetainPtr< CPDF_Stream > GetMutableStreamAt(size_t index)
bool Contains(const CPDF_Object *pThat) const
void ConvertToIndirectObjectAt(size_t index, CPDF_IndirectObjectHolder *pHolder)
std::optional< size_t > Find(const CPDF_Object *pThat) const
std::enable_if< CanInternStrings< T >::value, RetainPtr< T > >::type InsertNewAt(size_t index, Args &&... args)
Definition cpdf_array.h:124
std::enable_if<!CanInternStrings< T >::value, RetainPtr< T > >::type SetNewAt(size_t index, Args &&... args)
Definition cpdf_array.h:100
bool WriteTo(IFX_ArchiveStream *archive, const CPDF_Encryptor *encryptor) const override
RetainPtr< CPDF_Object > GetMutableDirectObjectAt(size_t index)
CFX_Matrix GetMatrix() const
~CPDF_Array() override
int GetIntegerAt(size_t index) const
void SetAt(size_t index, RetainPtr< CPDF_Stream > stream)=delete
void InsertAt(size_t index, RetainPtr< CPDF_Object > object)
ByteString GetByteStringAt(size_t index) const
std::enable_if< CanInternStrings< T >::value, RetainPtr< T > >::type SetNewAt(size_t index, Args &&... args)
Definition cpdf_array.h:109
void Append(RetainPtr< CPDF_Object > object)
RetainPtr< const CPDF_String > GetStringAt(size_t index) const
RetainPtr< const CPDF_Array > GetArrayAt(size_t index) const
RetainPtr< const CPDF_Number > GetNumberAt(size_t index) const
CFX_FloatRect GetRect() const
void InsertAt(size_t index, RetainPtr< CPDF_Stream > stream)=delete
void RemoveAt(size_t index)
float GetFloatAt(size_t index) const
CPDF_Creator(CPDF_Document *pDoc, RetainPtr< IFX_RetainableWriteStream > archive)
bool SetFileVersion(int32_t fileVersion)
void RemoveSecurity()
bool Create(uint32_t flags)
std::map< ByteString, RetainPtr< CPDF_Object >, std::less<> > DictMap
RetainPtr< const CPDF_Object > GetIndirectObject(uint32_t objnum) const
std::enable_if<!CanInternStrings< T >::value, RetainPtr< T > >::type New(Args &&... args)
RetainPtr< T > NewIndirect(Args &&... args)
RetainPtr< CPDF_Object > GetOrParseIndirectObject(uint32_t objnum)
WeakPtr< ByteStringPool > GetByteStringPool() const
std::enable_if< CanInternStrings< T >::value, RetainPtr< T > >::type New(Args &&... args)
virtual RetainPtr< CPDF_Object > ParseIndirectObject(uint32_t objnum)
RetainPtr< CPDF_Object > GetMutableIndirectObject(uint32_t objnum)
uint32_t AddIndirectObject(RetainPtr< CPDF_Object > pObj)
bool ReplaceIndirectObjectIfHigherGeneration(uint32_t objnum, RetainPtr< CPDF_Object > pObj)
void SetGenNum(uint32_t gennum)
Definition cpdf_object.h:68
RetainPtr< const CPDF_Dictionary > GetDict() const
bool IsInline() const
Definition cpdf_object.h:69
uint32_t GetGenNum() const
Definition cpdf_object.h:67
virtual Type GetType() const =0
virtual WideString GetUnicodeText() const
virtual ByteString GetString() const
RetainPtr< const CPDF_Object > GetDirect() const
uint32_t m_GenNum
bool IsName() const
virtual CPDF_Null * AsMutableNull()
const CPDF_Name * AsName() const
bool IsArray() const
const CPDF_Boolean * AsBoolean() const
virtual void SetString(const ByteString &str)
const CPDF_Null * AsNull() const
bool IsDictionary() const
bool IsStream() const
virtual RetainPtr< CPDF_Reference > MakeReference(CPDF_IndirectObjectHolder *holder) const
RetainPtr< CPDF_Object > GetMutableDirect()
const CPDF_Array * AsArray() const
virtual int GetInteger() const
CPDF_Object()=default
virtual float GetNumber() const
bool IsNull() const
bool IsBoolean() const
uint32_t GetObjNum() const
Definition cpdf_object.h:65
const CPDF_Dictionary * AsDictionary() const
virtual bool WriteTo(IFX_ArchiveStream *archive, const CPDF_Encryptor *encryptor) const =0
RetainPtr< CPDF_Object > CloneDirectObject() const
virtual CPDF_Stream * AsMutableStream()
bool IsString() const
virtual CPDF_Number * AsMutableNumber()
virtual CPDF_Dictionary * AsMutableDictionary()
virtual RetainPtr< CPDF_Object > Clone() const =0
bool IsNumber() const
virtual CPDF_Reference * AsMutableReference()
uint32_t m_ObjNum
CPDF_Object(const CPDF_Object &src)=delete
const CPDF_Stream * AsStream() const
static constexpr uint32_t kInvalidObjNum
Definition cpdf_object.h:52
virtual const CPDF_Object * GetDirectInternal() const
virtual CPDF_Name * AsMutableName()
bool IsReference() const
void SetObjNum(uint32_t objnum)
Definition cpdf_object.h:66
const CPDF_String * AsString() const
uint64_t KeyForCache() const
virtual CPDF_Array * AsMutableArray()
const CPDF_Reference * AsReference() const
virtual RetainPtr< CPDF_Object > CloneNonCyclic(bool bDirect, std::set< const CPDF_Object * > *pVisited) const
virtual CPDF_String * AsMutableString()
const CPDF_Number * AsNumber() const
RetainPtr< CPDF_Dictionary > GetMutableDict()
RetainPtr< CPDF_Object > CloneObjectNonCyclic(bool bDirect) const
virtual const CPDF_Dictionary * GetDictInternal() const
~CPDF_Object() override
virtual CPDF_Boolean * AsMutableBoolean()
virtual FX_FILESIZE CurrentOffset() const =0
static RetainPtr< IFX_SeekableReadStream > CreateFromFilename(const char *filename)
Definition fx_stream.cpp:68
virtual FX_FILESIZE GetPosition()
Definition fx_stream.cpp:80
virtual bool ReadBlockAtOffset(pdfium::span< uint8_t > buffer, FX_FILESIZE offset)=0
virtual bool IsEOF()
Definition fx_stream.cpp:76
virtual bool Flush()=0
virtual FX_FILESIZE GetSize()=0
bool WriteFilesize(FX_FILESIZE size)
Definition fx_stream.cpp:61
bool WriteByte(uint8_t byte)
Definition fx_stream.cpp:50
bool WriteString(ByteStringView str)
Definition fx_stream.cpp:46
virtual ~IFX_WriteStream()=default
bool WriteDWord(uint32_t i)
Definition fx_stream.cpp:54
virtual bool WriteBlock(pdfium::span< const uint8_t > data)=0
static ByteString Format(const char *pFormat,...)
ByteString & operator=(ByteString &&that) noexcept
T * get() const noexcept
UnownedPtr(const UnownedPtr< U > &that)
Definition unowned_ptr.h:99
bool operator==(const UnownedPtr &that) const
operator T*() const noexcept
UnownedPtr(UnownedPtr< U > &&that) noexcept
UnownedPtr & operator=(UnownedPtr< U > &&that) noexcept
constexpr UnownedPtr(const UnownedPtr &that) noexcept=default
constexpr UnownedPtr(T *pObj) noexcept
Definition unowned_ptr.h:84
UnownedPtr & operator=(T *that) noexcept
bool operator==(std::nullptr_t ptr) const
UnownedPtr & operator=(UnownedPtr &&that) noexcept
UnownedPtr & operator=(std::nullptr_t) noexcept
UnownedPtr & operator=(const UnownedPtr< U > &that) noexcept
T * operator->() const
constexpr UnownedPtr() noexcept=default
bool operator<(const UnownedPtr &that) const
UnownedPtr & operator=(const UnownedPtr &that) noexcept=default
T & operator*() const
constexpr UnownedPtr(UnownedPtr &&that) noexcept
Definition unowned_ptr.h:92
constexpr UnownedPtr(std::nullptr_t ptr)
Definition unowned_ptr.h:82
WideString(char)=delete
WideString(const std::initializer_list< WideStringView > &list)
WideString & operator+=(const WideString &str)
WideString(wchar_t ch)
bool operator==(const WideString &other) const
ByteString ToUTF8() const
static WideString Format(const wchar_t *pFormat,...)
UNSAFE_BUFFER_USAGE WideString(const wchar_t *pStr, size_t len)
WideString & operator=(WideString &&that) noexcept
WideString(WideStringView str1, WideStringView str2)
WideString()=default
WideString First(size_t count) const
static WideString FromUTF8(ByteStringView str)
WideString & operator+=(const wchar_t *str)
bool operator==(const wchar_t *ptr) const
WideString & operator+=(wchar_t ch)
bool operator<(WideStringView str) const
bool EqualsASCIINoCase(ByteStringView that) const
Definition widestring.h:114
~WideString()=default
WideString(const WideString &other)=default
static WideString FromDefANSI(ByteStringView str)
int GetInteger() const
int CompareNoCase(const wchar_t *str) const
WideString(const wchar_t *ptr)
static WideString FromLatin1(ByteStringView str)
WideString(WideString &&other) noexcept=default
bool IsASCII() const
Definition widestring.h:110
bool operator==(WideStringView str) const
bool operator!=(const WideString &other) const
Definition widestring.h:85
ByteString ToLatin1() const
intptr_t ReferenceCountForTesting() const
static WideString FromUTF16BE(pdfium::span< const uint8_t > data)
bool operator<(const WideString &other) const
int Compare(const wchar_t *str) const
WideString & operator=(const WideString &that)
WideString EncodeEntities() const
ByteString ToASCII() const
static WideString FromASCII(ByteStringView str)
WideString & operator+=(WideStringView str)
static WideString FromUTF16LE(pdfium::span< const uint8_t > data)
ByteString ToUCS2LE() const
WideString Last(size_t count) const
int Compare(const WideString &str) const
WideString & operator=(const wchar_t *str)
WideString Substr(size_t offset) const
WideString(WideStringView str)
bool operator!=(const wchar_t *ptr) const
Definition widestring.h:83
static WideString FormatV(const wchar_t *lpszFormat, va_list argList)
ByteString ToUTF16LE() const
static WideString FormatInteger(int i)
bool EqualsASCII(ByteStringView that) const
Definition widestring.h:111
ByteString ToDefANSI() const
bool operator<(const wchar_t *ptr) const
WideString Substr(size_t first, size_t count) const
bool operator!=(WideStringView str) const
Definition widestring.h:84
WideString & operator=(WideStringView str)
#define GSL_POINTER
#define TRIVIAL_ABI
#define UNSAFE_BUFFER_USAGE
CPDF_Array * ToArray(CPDF_Object *obj)
Definition cpdf_array.h:198
const CPDF_Array * ToArray(const CPDF_Object *obj)
Definition cpdf_array.h:202
RetainPtr< CPDF_Array > ToArray(RetainPtr< CPDF_Object > obj)
Definition cpdf_array.h:206
#define FPDFCREATE_INCREMENTAL
#define FPDFCREATE_NO_ORIGINAL
void * FX_Random_MT_Start(uint32_t dwSeed)
Definition fx_random.cpp:87
void FX_Random_MT_Close(void *pContext)
pdfium::CheckedNumeric< FX_FILESIZE > FX_SAFE_FILESIZE
constexpr uint32_t FXBSTR_ID(uint8_t c1, uint8_t c2, uint8_t c3, uint8_t c4)
Definition fx_string.h:19
double StringToDouble(WideStringView wsStr)
float StringToFloat(ByteStringView str)
ByteString FX_UTF8Encode(WideStringView wsStr)
Definition fx_string.cpp:68
std::u16string FX_UTF16Encode(WideStringView wsStr)
Definition fx_string.cpp:76
float StringToFloat(WideStringView wsStr)
double StringToDouble(ByteStringView str)
#define FX_FILESIZE
Definition fx_types.h:19
WideString operator+(const wchar_t *str1, WideStringView str2)
Definition widestring.h:147
bool operator==(const wchar_t *lhs, const WideString &rhs)
Definition widestring.h:177
WideString operator+(const WideString &str1, const WideString &str2)
Definition widestring.h:156
StringViewTemplate< wchar_t > WideStringView
WideString operator+(const WideString &str1, WideStringView str2)
Definition widestring.h:171
WideString operator+(const WideString &str1, wchar_t ch)
Definition widestring.h:159
WideString operator+(WideStringView str1, const WideString &str2)
Definition widestring.h:174
std::vector< StrType > Split(const StrType &that, typename StrType::CharType ch)
Definition fx_string.h:36
bool operator!=(WideStringView lhs, const WideString &rhs)
Definition widestring.h:186
StringViewTemplate< char > ByteStringView
bool operator==(WideStringView lhs, const WideString &rhs)
Definition widestring.h:180
bool operator!=(const wchar_t *lhs, const WideString &rhs)
Definition widestring.h:183
WideString operator+(WideStringView str1, const wchar_t *str2)
Definition widestring.h:144
WideString operator+(WideStringView str1, wchar_t ch)
Definition widestring.h:150
void PrintTo(const WideString &str, std::ostream *os)
WideString operator+(WideStringView str1, WideStringView str2)
Definition widestring.h:141
WideString operator+(wchar_t ch, WideStringView str2)
Definition widestring.h:153
WideString operator+(wchar_t ch, const WideString &str2)
Definition widestring.h:162
WideString operator+(const wchar_t *str1, const WideString &str2)
Definition widestring.h:168
bool operator<(const wchar_t *lhs, const WideString &rhs)
Definition widestring.h:189
WideString operator+(const WideString &str1, const wchar_t *str2)
Definition widestring.h:165
UnownedPtr< T > WrapUnowned(T *that)
#define CHECK(cvref)
#define CONSTRUCT_VIA_MAKE_RETAIN
Definition retain_ptr.h:222
fxcrt::ByteStringView ByteStringView
fxcrt::WideStringView WideStringView
static constexpr bool value
size_t operator()(const WideString &str) const
Definition widestring.h:216
#define UNOWNED_PTR_EXCLUSION
fxcrt::WideString WideString
Definition widestring.h:207
uint32_t FX_HashCode_GetLoweredW(WideStringView str)
uint32_t FX_HashCode_GetW(WideStringView str)