Reduce the size of the lexer's data tables.

The lexer uses a matrix of state transition data to parse text. This matrix was highly sparse and contained large runs of zeros and repeated values. I found that by transposing the matrix, it became extremely compressible. In its transposed state, most slices had only 1-3 unique nonzero values. This CL leverages this finding to reduce the matrix data from ~55K to ~10K. A handful of slices do contain a large number of unique values and continue to be represented as plain 16-bit arrays. Some slices contain no data at all and were eliminated entirely. The majority of slices are now represented by a compact two-bit array. Bit pattern 00 always represents zero. Bit patterns 01, 10 and 11 are translated into values v0, v1 and v2, which are stored per slice (bit-packed to save a few extra bytes). This transformation involves a fair amount of bit shifting and masking, but the generated code will be quite efficient: https://godbolt.org/z/eTvjr96ez Change-Id: Iecc67aadd510ccf63b4bcb11ed861d703efefaae Reviewed-on: https://skia-review.googlesource.com/c/skia/+/461356 Auto-Submit: John Stiles <johnstiles@google.com> Reviewed-by: Brian Osman <brianosman@google.com> Commit-Queue: John Stiles <johnstiles@google.com>
2021-10-20 12:40:03 -04:00 · 2021-10-20 12:40:03 -04:00 · 97d9e47e8f
commit 97d9e47e8f
parent dbd3b1b04c
5 changed files with 707 additions and 1439 deletions
--- a/BUILD.gn
+++ b/BUILD.gn
@ -575,10 +575,20 @@ optional("fontmgr_win_gdi") {
 if (skia_lex) {
  skia_executable("sksllex") {
    sources = [
      "src/sksl/lex/DFA.h",
      "src/sksl/lex/DFAState.h",
      "src/sksl/lex/LexUtil.h",
      "src/sksl/lex/Main.cpp",
      "src/sksl/lex/NFA.cpp",
      "src/sksl/lex/NFA.h",
      "src/sksl/lex/NFAState.h",
      "src/sksl/lex/NFAtoDFA.h",
      "src/sksl/lex/RegexNode.cpp",
      "src/sksl/lex/RegexNode.h",
      "src/sksl/lex/RegexParser.cpp",
      "src/sksl/lex/RegexParser.h",
      "src/sksl/lex/TransitionTable.cpp",
      "src/sksl/lex/TransitionTable.h",
    ]
    include_dirs = [ "." ]
  }
--- a/src/sksl/SkSLLexer.cpp
+++ b/src/sksl/SkSLLexer.cpp
--- a/src/sksl/lex/Main.cpp
+++ b/src/sksl/lex/Main.cpp
@ -7,6 +7,7 @@
 #include "src/sksl/lex/NFAtoDFA.h"
 #include "src/sksl/lex/RegexParser.h"
 #include "src/sksl/lex/TransitionTable.h"
 #include <fstream>
 #include <sstream>
@ -30,8 +31,8 @@ static constexpr const char* HEADER =
    " ******************** This file was generated by sksllex. Do not edit. *******************\n"
    " *****************************************************************************************/\n";
-void writeH(const DFA& dfa, const char* lexer, const char* token,
+static void writeH(const DFA& dfa, const char* lexer, const char* token,
-            const std::vector<std::string>& tokens, const char* hPath) {
+                   const std::vector<std::string>& tokens, const char* hPath) {
    std::ofstream out(hPath);
    SkASSERT(out.good());
    out << HEADER;
@ -100,8 +101,8 @@ private:
 )";
 }
-void writeCPP(const DFA& dfa, const char* lexer, const char* token, const char* include,
+static void writeCPP(const DFA& dfa, const char* lexer, const char* token, const char* include,
-              const char* cppPath) {
+                     const char* cppPath) {
    std::ofstream out(cppPath);
    SkASSERT(out.good());
    out << HEADER;
@ -114,7 +115,7 @@ void writeCPP(const DFA& dfa, const char* lexer, const char* token, const char*
    for (const auto& row : dfa.fTransitions) {
        states = std::max(states, row.size());
    }
-    out << "using State = " << (states <= 256 ? "uint8_t" : "int16_t") << ";\n";
+    out << "using State = " << (states <= 256 ? "uint8_t" : "uint16_t") << ";\n";
    // arbitrarily-chosen character which is greater than START_CHAR and should not appear in actual
    // input
    out << "static const uint8_t INVALID_CHAR = 18;";
@ -125,21 +126,8 @@ void writeCPP(const DFA& dfa, const char* lexer, const char* token, const char*
        separator = ", ";
    }
    out << "\n};\n";
-    out << "static const State kTransitions[" << dfa.fTransitions.size() << "]["
+
-                                              << states << "] = {\n";
+    WriteTransitionTable(out, dfa, states);
    for (size_t c = 0; c < dfa.fTransitions.size(); ++c) {
        out << "    {";
        for (size_t j = 0; j < states; ++j) {
            if ((size_t) c < dfa.fTransitions.size() && j < dfa.fTransitions[c].size()) {
                out << " " << dfa.fTransitions[c][j] << ",";
            } else {
                out << " 0,";
            }
        }
        out << " },\n";
    }
    out << "};\n";
    out << "\n";
    out << "static const int8_t kAccepts[" << states << "] = {";
    for (size_t i = 0; i < states; ++i) {
@ -175,7 +163,7 @@ void writeCPP(const DFA& dfa, const char* lexer, const char* token, const char*
        if (c <= 8 || c >= )" << dfa.fCharMappings.size() << R"() {
            c = INVALID_CHAR;
        }
-        State newState = kTransitions[kMappings[c]][state];
+        State newState = get_transition(kMappings[c], state);
        if (!newState) {
            break;
        }
@ -193,8 +181,8 @@ void writeCPP(const DFA& dfa, const char* lexer, const char* token, const char*
 )";
 }
-void process(const char* inPath, const char* lexer, const char* token, const char* hPath,
+static void process(const char* inPath, const char* lexer, const char* token, const char* hPath,
-             const char* cppPath) {
+                    const char* cppPath) {
    NFA nfa;
    std::vector<std::string> tokens;
    tokens.push_back("END_OF_FILE");
--- a/src/sksl/lex/TransitionTable.cpp
+++ b/src/sksl/lex/TransitionTable.cpp
@ -0,0 +1,242 @@
 /*
 * Copyright 2021 Google Inc.
 *
 * Use of this source code is governed by a BSD-style license that can be
 * found in the LICENSE file.
 */
 #include "src/sksl/lex/DFA.h"
 #include "src/sksl/lex/TransitionTable.h"
 #include <array>
 #include <bitset>
 #include <cassert>
 #include <cmath>
 #include <unordered_map>
 #include <unordered_set>
 #include <vector>
 namespace {
 // The number of bits to use per entry in our compact transition table. This is customizable:
 // - 1-bit: reasonable in theory. Doesn't actually pack many slices.
 // - 2-bit: best fit for our data. Packs extremely well.
 // - 4-bit: packs all but one slice, but doesn't save as much space overall.
 // - 8-bit: way too large (an 8-bit LUT plus an 8-bit data table is as big as a 16-bit table)
 // Other values don't divide cleanly into a byte and do not work.
 constexpr int kNumBits = 2;
 // These values are derived from kNumBits and shouldn't need to change.
 constexpr int kNumValues = (1 << kNumBits) - 1;
 constexpr int kDataPerByte = 8 / kNumBits;
 enum IndexType {
    kZero = 0,
    kFullEntry,
    kCompactEntry,
 };
 struct IndexEntry {
    IndexType type;
    int pos;
 };
 struct CompactEntry {
    std::array<int, kNumValues> v = {};
    std::vector<int> data;
 };
 struct FullEntry {
    std::vector<int> data;
 };
 using TransitionSet = std::unordered_set<int>;
 static int add_compact_entry(const TransitionSet& transitionSet,
                             const std::vector<int>& data,
                             std::vector<CompactEntry>* entries) {
    // Create a compact entry with the unique values from the transition set, padded out with zeros
    // and sorted.
    CompactEntry result{};
    assert(transitionSet.size() <= result.v.size());
    std::copy(transitionSet.begin(), transitionSet.end(), result.v.begin());
    std::sort(result.v.begin(), result.v.end());
    // Create a mapping from real values to small values. (0 -> 0, v[0] -> 1, v[1] -> 2, v[2] -> 3)
    std::unordered_map<int, int> translationTable;
    for (size_t index = 0; index < result.v.size(); ++index) {
        translationTable[result.v[index]] = 1 + index;
    }
    translationTable[0] = 0;
    // Convert the real values into small values.
    for (size_t index = 0; index < data.size(); ++index) {
        int value = data[index];
        assert(translationTable.find(value) != translationTable.end());
        result.data.push_back(translationTable[value]);
    }
    // Look for an existing entry that exactly matches this one.
    for (size_t index = 0; index < entries->size(); ++index) {
        if (entries->at(index).v == result.v && entries->at(index).data == result.data) {
            return index;
        }
    }
    // Add this as a new entry.
    entries->push_back(std::move(result));
    return (int)(entries->size() - 1);
 }
 static int add_full_entry(const TransitionSet& transitionMap,
                          const std::vector<int>& data,
                          std::vector<FullEntry>* entries) {
    // Create a full entry with this data.
    FullEntry result{};
    result.data = std::vector<int>(data.begin(), data.end());
    // Look for an existing entry that exactly matches this one.
    for (size_t index = 0; index < entries->size(); ++index) {
        if (entries->at(index).data == result.data) {
            return index;
        }
    }
    // Add this as a new entry.
    entries->push_back(std::move(result));
    return (int)(entries->size() - 1);
 }
 }  // namespace
 void WriteTransitionTable(std::ofstream& out, const DFA& dfa, size_t states) {
    int numTransitions = dfa.fTransitions.size();
    // Assemble our compact and full data tables, and an index into them.
    std::vector<CompactEntry> compactEntries;
    std::vector<FullEntry> fullEntries;
    std::vector<IndexEntry> indices;
    for (size_t s = 0; s < states; ++s) {
        // Copy all the transitions for this state into a flat array, and into a histogram (counting
        // the number of unique state-transition values). Most states only transition to a few
        // possible new states.
        TransitionSet transitionSet;
        std::vector<int> data(numTransitions);
        for (int t = 0; t < numTransitions; ++t) {
            if ((size_t) t < dfa.fTransitions.size() && s < dfa.fTransitions[t].size()) {
                int value = dfa.fTransitions[t][s];
                assert(value >= 0 && value < (int)states);
                data[t] = value;
                transitionSet.insert(value);
            }
        }
        transitionSet.erase(0);
        if (transitionSet.empty()) {
            // This transition table was completely empty (every value was zero). No data needed;
            // zero pages are handled as a special index type.
            indices.push_back(IndexEntry{kZero, 0});
        } else if (transitionSet.size() <= kNumValues) {
            // This table only contained a small number of unique nonzero values.
            // Use a compact representation that squishes each value down to a few bits.
            int index = add_compact_entry(transitionSet, data, &compactEntries);
            indices.push_back(IndexEntry{kCompactEntry, index});
        } else {
            // This table contained a large number of values. We can't compact it.
            int index = add_full_entry(transitionSet, data, &fullEntries);
            indices.push_back(IndexEntry{kFullEntry, index});
        }
    }
    // Find the largest value for each compact-entry slot.
    int maxValue[kNumValues] = {};
    for (const CompactEntry& entry : compactEntries) {
        for (int index=0; index < kNumValues; ++index) {
            maxValue[index] = std::max(maxValue[index], entry.v[index]);
        }
    }
    // Emit all the structs our transition table will use.
    out << "struct IndexEntry {\n"
        << "    uint16_t type : 2;\n"
        << "    uint16_t pos : 14;\n"
        << "};\n"
        << "struct FullEntry {\n"
        << "    State data[" << numTransitions << "];\n"
        << "};\n";
    // Emit the compact-entry structure; minimize the number of bits needed per value.
    out << "struct CompactEntry {\n";
    for (int index=0; index < kNumValues; ++index) {
        if (maxValue[index] > 0) {
            out << "    State v" << index << " : " << int(std::ceil(std::log2(maxValue[index])))
                << ";\n";
        }
    }
    out << "    uint8_t data[" << std::ceil(float(numTransitions) / float(kDataPerByte)) << "];\n"
        << "};\n";
    // Emit the full-table data.
    out << "static constexpr FullEntry kFull[] = {\n";
    for (const FullEntry& entry : fullEntries) {
        out << "    {";
        for (int value : entry.data) {
            out << value << ", ";
        }
        out << "},\n";
    }
    out << "};\n";
    // Emit the compact-table data.
    out << "static constexpr CompactEntry kCompact[] = {\n";
    for (const CompactEntry& entry : compactEntries) {
        out << "    {";
        for (int index=0; index < kNumValues; ++index) {
            if (maxValue[index] > 0) {
                out << entry.v[index] << ", ";
            }
        }
        out << "{";
        unsigned int shiftBits = 0, combinedBits = 0;
        for (int index = 0; index < numTransitions; index++) {
            combinedBits |= entry.data[index] << shiftBits;
            shiftBits += kNumBits;
            assert(shiftBits <= 8);
            if (shiftBits == 8) {
                out << combinedBits << ", ";
                shiftBits = 0;
                combinedBits = 0;
            }
        }
        if (shiftBits > 0) {
            // Flush any partial values.
            out << combinedBits;
        }
        out << "}},\n";
    }
    out << "};\n"
        << "static constexpr IndexEntry kIndices[] = {\n";
    for (const IndexEntry& entry : indices) {
        out << "    {" << entry.type << ", " << entry.pos << "},\n";
    }
    out << "};\n"
        << "State get_transition(int transition, int state) {\n"
        << "    IndexEntry index = kIndices[state];\n"
        << "    if (index.type == 0) { return 0; }\n"
        << "    if (index.type == 1) { return kFull[index.pos].data[transition]; }\n"
        << "    const CompactEntry& entry = kCompact[index.pos];\n"
        << "    int value = entry.data[transition >> " << std::log2(kDataPerByte) << "];\n"
        << "    value >>= " << kNumBits << " * (transition & " << kDataPerByte - 1 << ");\n"
        << "    value &= " << kNumValues << ";\n"
        << "    State table[] = {0";
    for (int index=0; index < kNumValues; ++index) {
        if (maxValue[index] > 0) {
            out << ", entry.v" << index;
        } else {
            out << ", 0";
        }
    }
    out << "};\n"
        << "    return table[value];\n"
        << "}\n";
 }
--- a/src/sksl/lex/TransitionTable.h
+++ b/src/sksl/lex/TransitionTable.h
@ -0,0 +1,17 @@
 /*
 * Copyright 2021 Google Inc.
 *
 * Use of this source code is governed by a BSD-style license that can be
 * found in the LICENSE file.
 */
 #ifndef SKSL_TRANSITIONTABLE
 #define SKSL_TRANSITIONTABLE
 #include <fstream>
 struct DFA;
 void WriteTransitionTable(std::ofstream& out, const DFA& dfa, size_t states);
 #endif // SKSL_TRANSITIONTABLE