forked from OSchip/llvm-project
472 lines
17 KiB
C++
472 lines
17 KiB
C++
//===-- ConstString.h -------------------------------------------*- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLDB_UTILITY_CONSTSTRING_H
|
|
#define LLDB_UTILITY_CONSTSTRING_H
|
|
|
|
#include "llvm/ADT/DenseMapInfo.h"
|
|
#include "llvm/ADT/StringRef.h"
|
|
#include "llvm/Support/FormatVariadic.h"
|
|
#include "llvm/Support/YAMLTraits.h"
|
|
|
|
#include <stddef.h>
|
|
|
|
namespace lldb_private {
|
|
class Stream;
|
|
}
|
|
namespace llvm {
|
|
class raw_ostream;
|
|
}
|
|
|
|
namespace lldb_private {
|
|
|
|
/// \class ConstString ConstString.h "lldb/Utility/ConstString.h"
|
|
/// A uniqued constant string class.
|
|
///
|
|
/// Provides an efficient way to store strings as uniqued strings. After the
|
|
/// strings are uniqued, finding strings that are equal to one another is very
|
|
/// fast as just the pointers need to be compared. It also allows for many
|
|
/// common strings from many different sources to be shared to keep the memory
|
|
/// footprint low.
|
|
///
|
|
/// No reference counting is done on strings that are added to the string
|
|
/// pool, once strings are added they are in the string pool for the life of
|
|
/// the program.
|
|
class ConstString {
|
|
public:
|
|
/// Default constructor
|
|
///
|
|
/// Initializes the string to an empty string.
|
|
ConstString() = default;
|
|
|
|
explicit ConstString(const llvm::StringRef &s);
|
|
|
|
/// Construct with C String value
|
|
///
|
|
/// Constructs this object with a C string by looking to see if the
|
|
/// C string already exists in the global string pool. If it doesn't
|
|
/// exist, it is added to the string pool.
|
|
///
|
|
/// \param[in] cstr
|
|
/// A NULL terminated C string to add to the string pool.
|
|
explicit ConstString(const char *cstr);
|
|
|
|
/// Construct with C String value with max length
|
|
///
|
|
/// Constructs this object with a C string with a length. If \a max_cstr_len
|
|
/// is greater than the actual length of the string, the string length will
|
|
/// be truncated. This allows substrings to be created without the need to
|
|
/// NULL terminate the string as it is passed into this function.
|
|
///
|
|
/// \param[in] cstr
|
|
/// A pointer to the first character in the C string. The C
|
|
/// string can be NULL terminated in a buffer that contains
|
|
/// more characters than the length of the string, or the
|
|
/// string can be part of another string and a new substring
|
|
/// can be created.
|
|
///
|
|
/// \param[in] max_cstr_len
|
|
/// The max length of \a cstr. If the string length of \a cstr
|
|
/// is less than \a max_cstr_len, then the string will be
|
|
/// truncated. If the string length of \a cstr is greater than
|
|
/// \a max_cstr_len, then only max_cstr_len bytes will be used
|
|
/// from \a cstr.
|
|
explicit ConstString(const char *cstr, size_t max_cstr_len);
|
|
|
|
/// C string equality binary predicate function object for ConstString
|
|
/// objects.
|
|
struct StringIsEqual {
|
|
/// C equality test.
|
|
///
|
|
/// Two C strings are equal when they are contained in ConstString objects
|
|
/// when their pointer values are equal to each other.
|
|
///
|
|
/// \return
|
|
/// Returns \b true if the C string in \a lhs is equal to
|
|
/// the C string value in \a rhs, \b false otherwise.
|
|
bool operator()(const char *lhs, const char *rhs) const {
|
|
return lhs == rhs;
|
|
}
|
|
};
|
|
|
|
/// Convert to bool operator.
|
|
///
|
|
/// This allows code to check a ConstString object to see if it contains a
|
|
/// valid string using code such as:
|
|
///
|
|
/// \code
|
|
/// ConstString str(...);
|
|
/// if (str)
|
|
/// { ...
|
|
/// \endcode
|
|
///
|
|
/// \return
|
|
/// /b True this object contains a valid non-empty C string, \b
|
|
/// false otherwise.
|
|
explicit operator bool() const { return !IsEmpty(); }
|
|
|
|
/// Equal to operator
|
|
///
|
|
/// Returns true if this string is equal to the string in \a rhs. This
|
|
/// operation is very fast as it results in a pointer comparison since all
|
|
/// strings are in a uniqued in a global string pool.
|
|
///
|
|
/// \param[in] rhs
|
|
/// Another string object to compare this object to.
|
|
///
|
|
/// \return
|
|
/// true if this object is equal to \a rhs.
|
|
/// false if this object is not equal to \a rhs.
|
|
bool operator==(ConstString rhs) const {
|
|
// We can do a pointer compare to compare these strings since they must
|
|
// come from the same pool in order to be equal.
|
|
return m_string == rhs.m_string;
|
|
}
|
|
|
|
/// Equal to operator against a non-ConstString value.
|
|
///
|
|
/// Returns true if this string is equal to the string in \a rhs. This
|
|
/// overload is usually slower than comparing against a ConstString value.
|
|
/// However, if the rhs string not already a ConstString and it is impractical
|
|
/// to turn it into a non-temporary variable, then this overload is faster.
|
|
///
|
|
/// \param[in] rhs
|
|
/// Another string object to compare this object to.
|
|
///
|
|
/// \return
|
|
/// \b true if this object is equal to \a rhs.
|
|
/// \b false if this object is not equal to \a rhs.
|
|
bool operator==(const char *rhs) const {
|
|
// ConstString differentiates between empty strings and nullptr strings, but
|
|
// StringRef doesn't. Therefore we have to do this check manually now.
|
|
if (m_string == nullptr && rhs != nullptr)
|
|
return false;
|
|
if (m_string != nullptr && rhs == nullptr)
|
|
return false;
|
|
|
|
return GetStringRef() == rhs;
|
|
}
|
|
|
|
/// Not equal to operator
|
|
///
|
|
/// Returns true if this string is not equal to the string in \a rhs. This
|
|
/// operation is very fast as it results in a pointer comparison since all
|
|
/// strings are in a uniqued in a global string pool.
|
|
///
|
|
/// \param[in] rhs
|
|
/// Another string object to compare this object to.
|
|
///
|
|
/// \return
|
|
/// \b true if this object is not equal to \a rhs.
|
|
/// \b false if this object is equal to \a rhs.
|
|
bool operator!=(ConstString rhs) const { return m_string != rhs.m_string; }
|
|
|
|
/// Not equal to operator against a non-ConstString value.
|
|
///
|
|
/// Returns true if this string is not equal to the string in \a rhs. This
|
|
/// overload is usually slower than comparing against a ConstString value.
|
|
/// However, if the rhs string not already a ConstString and it is impractical
|
|
/// to turn it into a non-temporary variable, then this overload is faster.
|
|
///
|
|
/// \param[in] rhs
|
|
/// Another string object to compare this object to.
|
|
///
|
|
/// \return \b true if this object is not equal to \a rhs, false otherwise.
|
|
bool operator!=(const char *rhs) const { return !(*this == rhs); }
|
|
|
|
bool operator<(ConstString rhs) const;
|
|
|
|
/// Get the string value as a C string.
|
|
///
|
|
/// Get the value of the contained string as a NULL terminated C string
|
|
/// value.
|
|
///
|
|
/// If \a value_if_empty is nullptr, then nullptr will be returned.
|
|
///
|
|
/// \return Returns \a value_if_empty if the string is empty, otherwise
|
|
/// the C string value contained in this object.
|
|
const char *AsCString(const char *value_if_empty = nullptr) const {
|
|
return (IsEmpty() ? value_if_empty : m_string);
|
|
}
|
|
|
|
/// Get the string value as a llvm::StringRef
|
|
///
|
|
/// \return
|
|
/// Returns a new llvm::StringRef object filled in with the
|
|
/// needed data.
|
|
llvm::StringRef GetStringRef() const {
|
|
return llvm::StringRef(m_string, GetLength());
|
|
}
|
|
|
|
/// Get the string value as a C string.
|
|
///
|
|
/// Get the value of the contained string as a NULL terminated C string
|
|
/// value. Similar to the ConstString::AsCString() function, yet this
|
|
/// function will always return nullptr if the string is not valid. So this
|
|
/// function is a direct accessor to the string pointer value.
|
|
///
|
|
/// \return
|
|
/// Returns nullptr the string is invalid, otherwise the C string
|
|
/// value contained in this object.
|
|
const char *GetCString() const { return m_string; }
|
|
|
|
/// Get the length in bytes of string value.
|
|
///
|
|
/// The string pool stores the length of the string, so we can avoid calling
|
|
/// strlen() on the pointer value with this function.
|
|
///
|
|
/// \return
|
|
/// Returns the number of bytes that this string occupies in
|
|
/// memory, not including the NULL termination byte.
|
|
size_t GetLength() const;
|
|
|
|
/// Clear this object's state.
|
|
///
|
|
/// Clear any contained string and reset the value to the empty string
|
|
/// value.
|
|
void Clear() { m_string = nullptr; }
|
|
|
|
/// Equal to operator
|
|
///
|
|
/// Returns true if this string is equal to the string in \a rhs. If case
|
|
/// sensitive equality is tested, this operation is very fast as it results
|
|
/// in a pointer comparison since all strings are in a uniqued in a global
|
|
/// string pool.
|
|
///
|
|
/// \param[in] lhs
|
|
/// The Left Hand Side const ConstString object reference.
|
|
///
|
|
/// \param[in] rhs
|
|
/// The Right Hand Side const ConstString object reference.
|
|
///
|
|
/// \param[in] case_sensitive
|
|
/// Case sensitivity. If true, case sensitive equality
|
|
/// will be tested, otherwise character case will be ignored
|
|
///
|
|
/// \return \b true if this object is equal to \a rhs, \b false otherwise.
|
|
static bool Equals(ConstString lhs, ConstString rhs,
|
|
const bool case_sensitive = true);
|
|
|
|
/// Compare two string objects.
|
|
///
|
|
/// Compares the C string values contained in \a lhs and \a rhs and returns
|
|
/// an integer result.
|
|
///
|
|
/// NOTE: only call this function when you want a true string
|
|
/// comparison. If you want string equality use the, use the == operator as
|
|
/// it is much more efficient. Also if you want string inequality, use the
|
|
/// != operator for the same reasons.
|
|
///
|
|
/// \param[in] lhs
|
|
/// The Left Hand Side const ConstString object reference.
|
|
///
|
|
/// \param[in] rhs
|
|
/// The Right Hand Side const ConstString object reference.
|
|
///
|
|
/// \param[in] case_sensitive
|
|
/// Case sensitivity of compare. If true, case sensitive compare
|
|
/// will be performed, otherwise character case will be ignored
|
|
///
|
|
/// \return -1 if lhs < rhs, 0 if lhs == rhs, 1 if lhs > rhs
|
|
static int Compare(ConstString lhs, ConstString rhs,
|
|
const bool case_sensitive = true);
|
|
|
|
/// Dump the object description to a stream.
|
|
///
|
|
/// Dump the string value to the stream \a s. If the contained string is
|
|
/// empty, print \a value_if_empty to the stream instead. If \a
|
|
/// value_if_empty is nullptr, then nothing will be dumped to the stream.
|
|
///
|
|
/// \param[in] s
|
|
/// The stream that will be used to dump the object description.
|
|
///
|
|
/// \param[in] value_if_empty
|
|
/// The value to dump if the string is empty. If nullptr, nothing
|
|
/// will be output to the stream.
|
|
void Dump(Stream *s, const char *value_if_empty = nullptr) const;
|
|
|
|
/// Dump the object debug description to a stream.
|
|
///
|
|
/// \param[in] s
|
|
/// The stream that will be used to dump the object description.
|
|
void DumpDebug(Stream *s) const;
|
|
|
|
/// Test for empty string.
|
|
///
|
|
/// \return
|
|
/// \b true if the contained string is empty.
|
|
/// \b false if the contained string is not empty.
|
|
bool IsEmpty() const { return m_string == nullptr || m_string[0] == '\0'; }
|
|
|
|
/// Test for null string.
|
|
///
|
|
/// \return
|
|
/// \b true if there is no string associated with this instance.
|
|
/// \b false if there is a string associated with this instance.
|
|
bool IsNull() const { return m_string == nullptr; }
|
|
|
|
/// Set the C string value.
|
|
///
|
|
/// Set the string value in the object by uniquing the \a cstr string value
|
|
/// in our global string pool.
|
|
///
|
|
/// If the C string already exists in the global string pool, it finds the
|
|
/// current entry and returns the existing value. If it doesn't exist, it is
|
|
/// added to the string pool.
|
|
///
|
|
/// \param[in] cstr
|
|
/// A NULL terminated C string to add to the string pool.
|
|
void SetCString(const char *cstr);
|
|
|
|
void SetString(const llvm::StringRef &s);
|
|
|
|
/// Set the C string value and its mangled counterpart.
|
|
///
|
|
/// Object files and debug symbols often use mangled string to represent the
|
|
/// linkage name for a symbol, function or global. The string pool can
|
|
/// efficiently store these values and their counterparts so when we run
|
|
/// into another instance of a mangled name, we can avoid calling the name
|
|
/// demangler over and over on the same strings and then trying to unique
|
|
/// them.
|
|
///
|
|
/// \param[in] demangled
|
|
/// The demangled string to correlate with the \a mangled name.
|
|
///
|
|
/// \param[in] mangled
|
|
/// The already uniqued mangled ConstString to correlate the
|
|
/// soon to be uniqued version of \a demangled.
|
|
void SetStringWithMangledCounterpart(llvm::StringRef demangled,
|
|
ConstString mangled);
|
|
|
|
/// Retrieve the mangled or demangled counterpart for a mangled or demangled
|
|
/// ConstString.
|
|
///
|
|
/// Object files and debug symbols often use mangled string to represent the
|
|
/// linkage name for a symbol, function or global. The string pool can
|
|
/// efficiently store these values and their counterparts so when we run
|
|
/// into another instance of a mangled name, we can avoid calling the name
|
|
/// demangler over and over on the same strings and then trying to unique
|
|
/// them.
|
|
///
|
|
/// \param[in] counterpart
|
|
/// A reference to a ConstString object that might get filled in
|
|
/// with the demangled/mangled counterpart.
|
|
///
|
|
/// \return
|
|
/// /b True if \a counterpart was filled in with the counterpart
|
|
/// /b false otherwise.
|
|
bool GetMangledCounterpart(ConstString &counterpart) const;
|
|
|
|
/// Set the C string value with length.
|
|
///
|
|
/// Set the string value in the object by uniquing \a cstr_len bytes
|
|
/// starting at the \a cstr string value in our global string pool. If trim
|
|
/// is true, then \a cstr_len indicates a maximum length of the CString and
|
|
/// if the actual length of the string is less, then it will be trimmed.
|
|
///
|
|
/// If the C string already exists in the global string pool, it finds the
|
|
/// current entry and returns the existing value. If it doesn't exist, it is
|
|
/// added to the string pool.
|
|
///
|
|
/// \param[in] cstr
|
|
/// A NULL terminated C string to add to the string pool.
|
|
///
|
|
/// \param[in] cstr_len
|
|
/// The maximum length of the C string.
|
|
void SetCStringWithLength(const char *cstr, size_t cstr_len);
|
|
|
|
/// Set the C string value with the minimum length between \a fixed_cstr_len
|
|
/// and the actual length of the C string. This can be used for data
|
|
/// structures that have a fixed length to store a C string where the string
|
|
/// might not be NULL terminated if the string takes the entire buffer.
|
|
void SetTrimmedCStringWithLength(const char *cstr, size_t fixed_cstr_len);
|
|
|
|
/// Get the memory cost of this object.
|
|
///
|
|
/// Return the size in bytes that this object takes in memory. This returns
|
|
/// the size in bytes of this object, which does not include any the shared
|
|
/// string values it may refer to.
|
|
///
|
|
/// \return
|
|
/// The number of bytes that this object occupies in memory.
|
|
///
|
|
/// \see ConstString::StaticMemorySize ()
|
|
size_t MemorySize() const { return sizeof(ConstString); }
|
|
|
|
/// Get the size in bytes of the current global string pool.
|
|
///
|
|
/// Reports the size in bytes of all shared C string values, containers and
|
|
/// any other values as a byte size for the entire string pool.
|
|
///
|
|
/// \return
|
|
/// The number of bytes that the global string pool occupies
|
|
/// in memory.
|
|
static size_t StaticMemorySize();
|
|
|
|
protected:
|
|
template <typename T> friend struct ::llvm::DenseMapInfo;
|
|
/// Only used by DenseMapInfo.
|
|
static ConstString FromStringPoolPointer(const char *ptr) {
|
|
ConstString s;
|
|
s.m_string = ptr;
|
|
return s;
|
|
};
|
|
|
|
const char *m_string = nullptr;
|
|
};
|
|
|
|
/// Stream the string value \a str to the stream \a s
|
|
Stream &operator<<(Stream &s, ConstString str);
|
|
|
|
} // namespace lldb_private
|
|
|
|
namespace llvm {
|
|
template <> struct format_provider<lldb_private::ConstString> {
|
|
static void format(const lldb_private::ConstString &CS, llvm::raw_ostream &OS,
|
|
llvm::StringRef Options);
|
|
};
|
|
|
|
/// DenseMapInfo implementation.
|
|
/// \{
|
|
template <> struct DenseMapInfo<lldb_private::ConstString> {
|
|
static inline lldb_private::ConstString getEmptyKey() {
|
|
return lldb_private::ConstString::FromStringPoolPointer(
|
|
DenseMapInfo<const char *>::getEmptyKey());
|
|
}
|
|
static inline lldb_private::ConstString getTombstoneKey() {
|
|
return lldb_private::ConstString::FromStringPoolPointer(
|
|
DenseMapInfo<const char *>::getTombstoneKey());
|
|
}
|
|
static unsigned getHashValue(lldb_private::ConstString val) {
|
|
return DenseMapInfo<const char *>::getHashValue(val.m_string);
|
|
}
|
|
static bool isEqual(lldb_private::ConstString LHS,
|
|
lldb_private::ConstString RHS) {
|
|
return LHS == RHS;
|
|
}
|
|
};
|
|
/// \}
|
|
|
|
namespace yaml {
|
|
template <> struct ScalarTraits<lldb_private::ConstString> {
|
|
static void output(const lldb_private::ConstString &, void *, raw_ostream &);
|
|
static StringRef input(StringRef, void *, lldb_private::ConstString &);
|
|
static QuotingType mustQuote(StringRef S) { return QuotingType::Double; }
|
|
};
|
|
} // namespace yaml
|
|
|
|
inline raw_ostream &operator<<(raw_ostream &os, lldb_private::ConstString s) {
|
|
os << s.GetStringRef();
|
|
return os;
|
|
}
|
|
} // namespace llvm
|
|
|
|
LLVM_YAML_IS_SEQUENCE_VECTOR(lldb_private::ConstString)
|
|
|
|
#endif // LLDB_UTILITY_CONSTSTRING_H
|