move final_id_to_literal into build_context

This commit is contained in:
Justin Viiret 2017-01-31 13:11:04 +11:00 committed by Matthew Barr
parent a0260c0362
commit a83b7cb348
2 changed files with 50 additions and 45 deletions

View File

@ -243,6 +243,9 @@ struct build_context : boost::noncopyable {
/** \brief Global bitmap of groups that can be squashed. */ /** \brief Global bitmap of groups that can be squashed. */
rose_group squashable_groups = 0; rose_group squashable_groups = 0;
/** \brief Mapping from final ID to the set of literals it is used for. */
map<u32, flat_set<u32>> final_id_to_literal;
}; };
/** \brief subengine info including built engine and /** \brief subengine info including built engine and
@ -2500,10 +2503,11 @@ void fillInSomRevNfas(RoseEngine *engine, const SomSlotManager &ssm,
static static
vector<const rose_literal_info *> vector<const rose_literal_info *>
getLiteralInfoByFinalId(const RoseBuildImpl &build, u32 final_id) { getLiteralInfoByFinalId(const RoseBuildImpl &build, const build_context &bc,
u32 final_id) {
vector<const rose_literal_info *> out; vector<const rose_literal_info *> out;
const auto &final_id_to_literal = build.final_id_to_literal; const auto &final_id_to_literal = bc.final_id_to_literal;
assert(contains(final_id_to_literal, final_id)); assert(contains(final_id_to_literal, final_id));
const auto &lits = final_id_to_literal.find(final_id)->second; const auto &lits = final_id_to_literal.find(final_id)->second;
@ -4154,9 +4158,10 @@ void addPredBlocks(build_context &bc, map<u32, RoseProgram> &pred_blocks,
} }
static static
void makePushDelayedInstructions(const RoseBuildImpl &build, u32 final_id, void makePushDelayedInstructions(const RoseBuildImpl &build,
const build_context &bc, u32 final_id,
RoseProgram &program) { RoseProgram &program) {
const auto &lit_infos = getLiteralInfoByFinalId(build, final_id); const auto &lit_infos = getLiteralInfoByFinalId(build, bc, final_id);
const auto &arb_lit_info = **lit_infos.begin(); const auto &arb_lit_info = **lit_infos.begin();
if (arb_lit_info.delayed_ids.empty()) { if (arb_lit_info.delayed_ids.empty()) {
return; return;
@ -4177,9 +4182,10 @@ void makePushDelayedInstructions(const RoseBuildImpl &build, u32 final_id,
} }
static static
rose_group getFinalIdGroupsUnion(const RoseBuildImpl &build, u32 final_id) { rose_group getFinalIdGroupsUnion(const RoseBuildImpl &build,
assert(contains(build.final_id_to_literal, final_id)); const build_context &bc, u32 final_id) {
const auto &lit_infos = getLiteralInfoByFinalId(build, final_id); assert(contains(bc.final_id_to_literal, final_id));
const auto &lit_infos = getLiteralInfoByFinalId(build, bc, final_id);
rose_group groups = 0; rose_group groups = 0;
for (const auto &li : lit_infos) { for (const auto &li : lit_infos) {
@ -4189,9 +4195,10 @@ rose_group getFinalIdGroupsUnion(const RoseBuildImpl &build, u32 final_id) {
} }
static static
void makeGroupCheckInstruction(const RoseBuildImpl &build, u32 final_id, void makeGroupCheckInstruction(const RoseBuildImpl &build,
const build_context &bc, u32 final_id,
RoseProgram &program) { RoseProgram &program) {
rose_group groups = getFinalIdGroupsUnion(build, final_id); rose_group groups = getFinalIdGroupsUnion(build, bc, final_id);
if (!groups) { if (!groups) {
return; return;
} }
@ -4201,8 +4208,7 @@ void makeGroupCheckInstruction(const RoseBuildImpl &build, u32 final_id,
static static
void makeCheckLitMaskInstruction(const RoseBuildImpl &build, build_context &bc, void makeCheckLitMaskInstruction(const RoseBuildImpl &build, build_context &bc,
u32 final_id, RoseProgram &program) { u32 final_id, RoseProgram &program) {
assert(contains(build.final_id_to_literal, final_id)); const auto &lit_infos = getLiteralInfoByFinalId(build, bc, final_id);
const auto &lit_infos = getLiteralInfoByFinalId(build, final_id);
assert(!lit_infos.empty()); assert(!lit_infos.empty());
if (!lit_infos.front()->requires_benefits) { if (!lit_infos.front()->requires_benefits) {
@ -4211,8 +4217,8 @@ void makeCheckLitMaskInstruction(const RoseBuildImpl &build, build_context &bc,
vector<LookEntry> look; vector<LookEntry> look;
assert(build.final_id_to_literal.at(final_id).size() == 1); assert(bc.final_id_to_literal.at(final_id).size() == 1);
u32 lit_id = *build.final_id_to_literal.at(final_id).begin(); u32 lit_id = *bc.final_id_to_literal.at(final_id).begin();
const ue2_literal &s = build.literals.right.at(lit_id).s; const ue2_literal &s = build.literals.right.at(lit_id).s;
DEBUG_PRINTF("building mask for lit %u (final id %u) %s\n", lit_id, DEBUG_PRINTF("building mask for lit %u (final id %u) %s\n", lit_id,
final_id, dumpString(s).c_str()); final_id, dumpString(s).c_str());
@ -4230,16 +4236,17 @@ void makeCheckLitMaskInstruction(const RoseBuildImpl &build, build_context &bc,
} }
static static
void makeGroupSquashInstruction(const RoseBuildImpl &build, u32 final_id, void makeGroupSquashInstruction(const RoseBuildImpl &build,
const build_context &bc, u32 final_id,
RoseProgram &program) { RoseProgram &program) {
assert(contains(build.final_id_to_literal, final_id)); assert(contains(bc.final_id_to_literal, final_id));
const auto &lit_infos = getLiteralInfoByFinalId(build, final_id); const auto &lit_infos = getLiteralInfoByFinalId(build, bc, final_id);
if (!lit_infos.front()->squash_group) { if (!lit_infos.front()->squash_group) {
return; return;
} }
rose_group groups = getFinalIdGroupsUnion(build, final_id); rose_group groups = getFinalIdGroupsUnion(build, bc, final_id);
if (!groups) { if (!groups) {
return; return;
} }
@ -4266,8 +4273,8 @@ static
void makeRecordAnchoredInstruction(const RoseBuildImpl &build, void makeRecordAnchoredInstruction(const RoseBuildImpl &build,
build_context &bc, u32 final_id, build_context &bc, u32 final_id,
RoseProgram &program) { RoseProgram &program) {
assert(contains(build.final_id_to_literal, final_id)); assert(contains(bc.final_id_to_literal, final_id));
const auto &lit_ids = build.final_id_to_literal.at(final_id); const auto &lit_ids = bc.final_id_to_literal.at(final_id);
// Must be anchored. // Must be anchored.
assert(!lit_ids.empty()); assert(!lit_ids.empty());
@ -4321,7 +4328,7 @@ void makeCheckLitEarlyInstruction(const RoseBuildImpl &build, build_context &bc,
return; return;
} }
const auto &lit_ids = build.final_id_to_literal.at(final_id); const auto &lit_ids = bc.final_id_to_literal.at(final_id);
if (lit_ids.empty()) { if (lit_ids.empty()) {
return; return;
} }
@ -4367,7 +4374,7 @@ void makeCheckLiteralInstruction(const RoseBuildImpl &build,
DEBUG_PRINTF("final_id %u, long lit threshold %zu\n", final_id, DEBUG_PRINTF("final_id %u, long lit threshold %zu\n", final_id,
bc.longLitLengthThreshold); bc.longLitLengthThreshold);
const auto &lits = build.final_id_to_literal.at(final_id); const auto &lits = bc.final_id_to_literal.at(final_id);
if (lits.size() != 1) { if (lits.size() != 1) {
// final_id sharing is only allowed for literals that are short enough // final_id sharing is only allowed for literals that are short enough
// to not require any additional confirm work. // to not require any additional confirm work.
@ -4464,11 +4471,11 @@ RoseProgram buildLitInitialProgram(RoseBuildImpl &build, build_context &bc,
// delayed literals, as their groups may be switched off; ordinarily, we // delayed literals, as their groups may be switched off; ordinarily, we
// can trust the HWLM matcher. // can trust the HWLM matcher.
if (hasDelayedLiteral(build, lit_edges)) { if (hasDelayedLiteral(build, lit_edges)) {
makeGroupCheckInstruction(build, final_id, program); makeGroupCheckInstruction(build, bc, final_id, program);
} }
// Add instructions for pushing delayed matches, if there are any. // Add instructions for pushing delayed matches, if there are any.
makePushDelayedInstructions(build, final_id, program); makePushDelayedInstructions(build, bc, final_id, program);
// Add pre-check for early literals in the floating table. // Add pre-check for early literals in the floating table.
makeCheckLitEarlyInstruction(build, bc, final_id, lit_edges, program); makeCheckLitEarlyInstruction(build, bc, final_id, lit_edges, program);
@ -4521,7 +4528,7 @@ RoseProgram buildLiteralProgram(RoseBuildImpl &build, build_context &bc,
RoseProgram root_block; RoseProgram root_block;
// Literal may squash groups. // Literal may squash groups.
makeGroupSquashInstruction(build, final_id, root_block); makeGroupSquashInstruction(build, bc, final_id, root_block);
// Literal may be anchored and need to be recorded. // Literal may be anchored and need to be recorded.
makeRecordAnchoredInstruction(build, bc, final_id, root_block); makeRecordAnchoredInstruction(build, bc, final_id, root_block);
@ -4581,7 +4588,7 @@ u32 buildDelayRebuildProgram(RoseBuildImpl &build, build_context &bc,
RoseProgram program; RoseProgram program;
for (const auto &final_id : final_ids) { for (const auto &final_id : final_ids) {
const auto &lit_infos = getLiteralInfoByFinalId(build, final_id); const auto &lit_infos = getLiteralInfoByFinalId(build, bc, final_id);
const auto &arb_lit_info = **lit_infos.begin(); const auto &arb_lit_info = **lit_infos.begin();
if (arb_lit_info.delayed_ids.empty()) { if (arb_lit_info.delayed_ids.empty()) {
continue; // No delayed IDs, no work to do. continue; // No delayed IDs, no work to do.
@ -4590,7 +4597,7 @@ u32 buildDelayRebuildProgram(RoseBuildImpl &build, build_context &bc,
RoseProgram prog; RoseProgram prog;
makeCheckLiteralInstruction(build, bc, final_id, prog); makeCheckLiteralInstruction(build, bc, final_id, prog);
makeCheckLitMaskInstruction(build, bc, final_id, prog); makeCheckLitMaskInstruction(build, bc, final_id, prog);
makePushDelayedInstructions(build, final_id, prog); makePushDelayedInstructions(build, bc, final_id, prog);
program.add_block(move(prog)); program.add_block(move(prog));
} }
@ -4650,7 +4657,7 @@ rose_literal_id getFragment(const rose_literal_id &lit) {
} }
static static
rose_group getGroups(const RoseBuildImpl &build, const set<u32> &lit_ids) { rose_group getGroups(const RoseBuildImpl &build, const flat_set<u32> &lit_ids) {
rose_group groups = 0; rose_group groups = 0;
for (auto lit_id : lit_ids) { for (auto lit_id : lit_ids) {
auto &info = build.literal_info.at(lit_id); auto &info = build.literal_info.at(lit_id);
@ -4660,7 +4667,8 @@ rose_group getGroups(const RoseBuildImpl &build, const set<u32> &lit_ids) {
} }
static static
map<u32, LitFragment> groupByFragment(const RoseBuildImpl &build) { map<u32, LitFragment> groupByFragment(const RoseBuildImpl &build,
const build_context &bc) {
u32 frag_id = 0; u32 frag_id = 0;
map<u32, LitFragment> final_to_frag; map<u32, LitFragment> final_to_frag;
@ -4671,7 +4679,7 @@ map<u32, LitFragment> groupByFragment(const RoseBuildImpl &build) {
map<rose_literal_id, FragmentInfo> frag_info; map<rose_literal_id, FragmentInfo> frag_info;
for (const auto &m : build.final_id_to_literal) { for (const auto &m : bc.final_id_to_literal) {
u32 final_id = m.first; u32 final_id = m.first;
const auto &lit_ids = m.second; const auto &lit_ids = m.second;
assert(!lit_ids.empty()); assert(!lit_ids.empty());
@ -4762,7 +4770,7 @@ u32 buildDelayPrograms(RoseBuildImpl &build, build_context &bc) {
vector<u32> programs; vector<u32> programs;
for (u32 final_id = build.delay_base_id; for (u32 final_id = build.delay_base_id;
final_id < build.final_id_to_literal.size(); final_id++) { final_id < bc.final_id_to_literal.size(); final_id++) {
u32 offset = writeLiteralProgram(build, bc, {final_id}, lit_edge_map); u32 offset = writeLiteralProgram(build, bc, {final_id}, lit_edge_map);
programs.push_back(offset); programs.push_back(offset);
} }
@ -5143,11 +5151,11 @@ u32 buildEagerQueueIter(const set<u32> &eager, u32 leftfixBeginQueue,
} }
static static
void allocateFinalIdToSet(RoseBuildImpl &build, const set<u32> &lits, void allocateFinalIdToSet(RoseBuildImpl &build, build_context &bc,
u32 *next_final_id) { const set<u32> &lits, u32 *next_final_id) {
const auto &g = build.g; const auto &g = build.g;
auto &literal_info = build.literal_info; auto &literal_info = build.literal_info;
auto &final_id_to_literal = build.final_id_to_literal; auto &final_id_to_literal = bc.final_id_to_literal;
/* We can allocate the same final id to multiple literals of the same type /* We can allocate the same final id to multiple literals of the same type
* if they share the same vertex set and trigger the same delayed literal * if they share the same vertex set and trigger the same delayed literal
@ -5262,13 +5270,13 @@ bool isUsedLiteral(const RoseBuildImpl &build, u32 lit_id) {
/** \brief Allocate final literal IDs for all literals. */ /** \brief Allocate final literal IDs for all literals. */
static static
void allocateFinalLiteralId(RoseBuildImpl &build) { void allocateFinalLiteralId(RoseBuildImpl &build, build_context &bc) {
set<u32> anch; set<u32> anch;
set<u32> norm; set<u32> norm;
set<u32> delay; set<u32> delay;
/* undelayed ids come first */ /* undelayed ids come first */
assert(build.final_id_to_literal.empty()); assert(bc.final_id_to_literal.empty());
u32 next_final_id = 0; u32 next_final_id = 0;
for (u32 i = 0; i < build.literal_info.size(); i++) { for (u32 i = 0; i < build.literal_info.size(); i++) {
assert(!build.hasFinalId(i)); assert(!build.hasFinalId(i));
@ -5296,15 +5304,15 @@ void allocateFinalLiteralId(RoseBuildImpl &build) {
} }
/* normal lits */ /* normal lits */
allocateFinalIdToSet(build, norm, &next_final_id); allocateFinalIdToSet(build, bc, norm, &next_final_id);
/* next anchored stuff */ /* next anchored stuff */
build.anchored_base_id = next_final_id; build.anchored_base_id = next_final_id;
allocateFinalIdToSet(build, anch, &next_final_id); allocateFinalIdToSet(build, bc, anch, &next_final_id);
/* delayed ids come last */ /* delayed ids come last */
build.delay_base_id = next_final_id; build.delay_base_id = next_final_id;
allocateFinalIdToSet(build, delay, &next_final_id); allocateFinalIdToSet(build, bc, delay, &next_final_id);
} }
static static
@ -5418,12 +5426,12 @@ aligned_unique_ptr<RoseEngine> RoseBuildImpl::buildFinalEngine(u32 minWidth) {
historyRequired); historyRequired);
DEBUG_PRINTF("longLitLengthThreshold=%zu\n", longLitLengthThreshold); DEBUG_PRINTF("longLitLengthThreshold=%zu\n", longLitLengthThreshold);
allocateFinalLiteralId(*this); build_context bc;
final_to_frag_map = groupByFragment(*this); allocateFinalLiteralId(*this, bc);
final_to_frag_map = groupByFragment(*this, bc);
auto anchored_dfas = buildAnchoredDfas(*this); auto anchored_dfas = buildAnchoredDfas(*this);
build_context bc;
bc.floatingMinLiteralMatchOffset = bc.floatingMinLiteralMatchOffset =
findMinFloatingLiteralMatch(*this, anchored_dfas); findMinFloatingLiteralMatch(*this, anchored_dfas);
bc.longLitLengthThreshold = longLitLengthThreshold; bc.longLitLengthThreshold = longLitLengthThreshold;
@ -5710,7 +5718,7 @@ aligned_unique_ptr<RoseEngine> RoseBuildImpl::buildFinalEngine(u32 minWidth) {
engine->lastByteHistoryIterOffset = lastByteOffset; engine->lastByteHistoryIterOffset = lastByteOffset;
engine->delay_count = engine->delay_count =
verify_u32(final_id_to_literal.size() - delay_base_id); verify_u32(bc.final_id_to_literal.size() - delay_base_id);
engine->delay_fatbit_size = fatbit_size(engine->delay_count); engine->delay_fatbit_size = fatbit_size(engine->delay_count);
engine->delay_base_id = delay_base_id; engine->delay_base_id = delay_base_id;
engine->anchored_base_id = anchored_base_id; engine->anchored_base_id = anchored_base_id;

View File

@ -593,9 +593,6 @@ public:
* overlap calculation in history assignment. */ * overlap calculation in history assignment. */
std::map<u32, rose_literal_id> anchoredLitSuffix; std::map<u32, rose_literal_id> anchoredLitSuffix;
std::map<u32, std::set<u32> > final_id_to_literal; /* final literal id to
* literal id */
std::map<u32, LitFragment> final_to_frag_map; std::map<u32, LitFragment> final_to_frag_map;
unordered_set<left_id> transient; unordered_set<left_id> transient;