forked from OSchip/llvm-project
[ADT] Simplifying hex string parsing so it runs faster in debug modes.
This expands the lookup table statically and avoids routing through methods that contain asserts (like StringRef/std::string element accessors and drop_front) such that performance is more predictable across compilation environments. This was primarily driven by slow debug mode performance but has a large benefit in release builds as well. ``` ssd_mobilenet_v2_face_float (42MB .mlir) Debug/MSVC (old): 5.22s Debug/MSVC (new): 0.16s Release/MSVC (old): 0.81s Release/MSVC (new): 0.02s huggingface_minilm (536MB .mlir) Debug/MSVC (old): 65.31s Debug/MSVC (new): 2.03s Release/MSVC (old): 9.93s Release/MSVC (new): 0.27s ``` Now in debug the time is split evenly between lexString, tryGetFromHex, and element attrs hashing, with the next step to making it faster being to combine the work (incremental hashing during conversion, etc) - but this is at least in the right order of magnitude and retains the original API surface. I have not profiled a build with clang but this is strictly less code and simpler data structures so I'd expect improvements there as well. This also fixes a bug where 0xFF bytes in the input would read out of bounds. Reviewed By: dblaikie, stellaraccident Differential Revision: https://reviews.llvm.org/D112105
This commit is contained in:
parent
539f500e78
commit
2fcffcd0e8
|
@ -67,22 +67,27 @@ inline ArrayRef<uint8_t> arrayRefFromStringRef(StringRef Input) {
|
|||
///
|
||||
/// If \p C is not a valid hex digit, -1U is returned.
|
||||
inline unsigned hexDigitValue(char C) {
|
||||
struct HexTable {
|
||||
unsigned LUT[255] = {};
|
||||
constexpr HexTable() {
|
||||
// Default initialize everything to invalid.
|
||||
for (int i = 0; i < 255; ++i)
|
||||
LUT[i] = ~0U;
|
||||
// Initialize `0`-`9`.
|
||||
for (int i = 0; i < 10; ++i)
|
||||
LUT['0' + i] = i;
|
||||
// Initialize `A`-`F` and `a`-`f`.
|
||||
for (int i = 0; i < 6; ++i)
|
||||
LUT['A' + i] = LUT['a' + i] = 10 + i;
|
||||
}
|
||||
/* clang-format off */
|
||||
static const int16_t LUT[256] = {
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
0, 1, 2, 3, 4, 5, 6, 7, 8, 9, -1, -1, -1, -1, -1, -1, // '0'..'9'
|
||||
-1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, // 'A'..'F'
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, // 'a'..'f'
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
|
||||
};
|
||||
constexpr HexTable Table;
|
||||
return Table.LUT[static_cast<unsigned char>(C)];
|
||||
/* clang-format on */
|
||||
return LUT[static_cast<unsigned char>(C)];
|
||||
}
|
||||
|
||||
/// Checks if character \p C is one of the 10 decimal digits.
|
||||
|
@ -210,24 +215,31 @@ inline bool tryGetFromHex(StringRef Input, std::string &Output) {
|
|||
if (Input.empty())
|
||||
return true;
|
||||
|
||||
Output.reserve((Input.size() + 1) / 2);
|
||||
// If the input string is not properly aligned on 2 nibbles we pad out the
|
||||
// front with a 0 prefix; e.g. `ABC` -> `0ABC`.
|
||||
Output.resize((Input.size() + 1) / 2);
|
||||
char *OutputPtr = const_cast<char *>(Output.data());
|
||||
if (Input.size() % 2 == 1) {
|
||||
uint8_t Hex = 0;
|
||||
if (!tryGetHexFromNibbles('0', Input.front(), Hex))
|
||||
return false;
|
||||
|
||||
Output.push_back(Hex);
|
||||
*OutputPtr++ = Hex;
|
||||
Input = Input.drop_front();
|
||||
}
|
||||
|
||||
assert(Input.size() % 2 == 0);
|
||||
while (!Input.empty()) {
|
||||
// Convert the nibble pairs (e.g. `9C`) into bytes (0x9C).
|
||||
// With the padding above we know the input is aligned and the output expects
|
||||
// exactly half as many bytes as nibbles in the input.
|
||||
size_t InputSize = Input.size();
|
||||
assert(InputSize % 2 == 0);
|
||||
const char *InputPtr = Input.data();
|
||||
for (size_t OutputIndex = 0; OutputIndex < InputSize / 2; ++OutputIndex) {
|
||||
uint8_t Hex = 0;
|
||||
if (!tryGetHexFromNibbles(Input[0], Input[1], Hex))
|
||||
if (!tryGetHexFromNibbles(InputPtr[OutputIndex * 2 + 0], // MSB
|
||||
InputPtr[OutputIndex * 2 + 1], // LSB
|
||||
Hex))
|
||||
return false;
|
||||
|
||||
Output.push_back(Hex);
|
||||
Input = Input.drop_front(2);
|
||||
OutputPtr[OutputIndex] = Hex;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
|
|
@ -91,7 +91,7 @@ TEST(StringExtrasTest, ToAndFromHex) {
|
|||
EXPECT_EQ(EvenData, fromHex(EvenStr));
|
||||
EXPECT_EQ(StringRef(EvenStr).lower(), toHex(EvenData, true));
|
||||
|
||||
std::string InvalidStr = "A5ZX";
|
||||
std::string InvalidStr = "A50\xFF";
|
||||
std::string IgnoredOutput;
|
||||
EXPECT_FALSE(tryGetFromHex(InvalidStr, IgnoredOutput));
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue