Browse Source

perf: reserved size of the hash map

legacy
Dnomd343 3 months ago
parent
commit
c30c5d910e
  1. 6
      src/core/benchmark/fast_cal.cc
  2. 2
      src/core/fast_cal/fast_cal.h
  3. 49
      src/core/fast_cal/internal/fast_cal.cc

6
src/core/benchmark/fast_cal.cc

@ -11,9 +11,9 @@ static void FastCalBenchmark(benchmark::State &state) {
auto code = CommonCode::unsafe_create(0x1A9BF0C00).to_raw_code(); auto code = CommonCode::unsafe_create(0x1A9BF0C00).to_raw_code();
for (auto _ : state) { for (auto _ : state) {
// auto fc = FastCal(code); auto fc = FastCal(code);
// benchmark::DoNotOptimize(fc.solve()); benchmark::DoNotOptimize(fc.demo());
benchmark::DoNotOptimize(FastCal_demo(code)); // benchmark::DoNotOptimize(FastCal_demo(code));
} }
} }

2
src/core/fast_cal/fast_cal.h

@ -44,6 +44,8 @@ public:
RawCode target(const match_t &match); RawCode target(const match_t &match);
std::vector<RawCode> target_multi(const match_t &match); std::vector<RawCode> target_multi(const match_t &match);
RawCode demo();
/// static BFS search functions /// static BFS search functions
static std::vector<RawCode> resolve(const RawCode &start); static std::vector<RawCode> resolve(const RawCode &start);
static std::vector<std::vector<RawCode>> to_furthest(const RawCode &start); static std::vector<std::vector<RawCode>> to_furthest(const RawCode &start);

49
src/core/fast_cal/internal/fast_cal.cc

@ -1,9 +1,13 @@
#include <algorithm> #include <algorithm>
#include <iostream>
#include "utils/common.h" #include "utils/common.h"
#include "fast_cal/fast_cal.h" #include "fast_cal/fast_cal.h"
#include "raw_code/raw_code.h" #include "raw_code/raw_code.h"
#include "group/group.h"
FastCal::FastCal(const RawCode &code) { FastCal::FastCal(const RawCode &code) {
this->root = (uint64_t)code; this->root = (uint64_t)code;
} }
@ -21,6 +25,51 @@ RawCode FastCal::solve() {
return FastCal::target(resolved); return FastCal::target(resolved);
} }
/// Experimental BFS search used to measure how the hash-map reserve size affects speed.
///
/// Starting from `root`, cases are expanded in queue order through `MaskMover`. The search
/// stops at the first dequeued case whose 3-bit field at index 0xD equals `BLOCK_2x2`.
///
/// @return The first matching case (built with `RawCode::unsafe_create`), or `FC_NOT_FOUND`
///         when the queue drains without any match.
RawCode FastCal::demo() {
    // Reset the case table as well as the queue: entries left over from an earlier search on
    // this object would make `emplace(root, ...)` a no-op and cause every neighbour to be
    // treated as already visited, ending the search prematurely.
    cases.clear();

    // max_group_size = 25955
    // auto reserve = klotski::cases::GroupUnion::from_raw_code(RawCode::unsafe_create(root)).max_group_size();
    cases.reserve(25955); // FAST !!! (about 5ms)
    // cases.reserve(32768); // SLOW !!! (about 50ms)
    // TODO: using prime number!

    std::queue<fast_cal_t*>{}.swap(cache); // drop any pending work from a previous run
    cache.emplace(&cases.emplace(root, fast_cal_t {
        .code = root,
        .mask = 0,
        .last = nullptr, // without parent node
    }).first->second);

    auto core = MaskMover(
        [this](uint64_t code, uint64_t mask) { // callback invoked for each generated case
            auto current = cases.find(code);
            if (current != cases.end()) { // find existed case
                current->second.mask |= mask; // update mask info
                return;
            }
            cache.emplace(&cases.emplace(code, fast_cal_t { // record new case
                .code = code,
                .mask = mask,
                .last = cache.front(), // link parent case (the case being expanded right now)
            }).first->second);
        }
    );

    constexpr int target_shift = 3 * 0xD; // bit offset of the 3-bit field at index 0xD
    constexpr uint64_t field_mask = 0b111; // width of a single field

    while (!cache.empty()) {
        // The front element stays in the queue while it is expanded, because the callback
        // above reads `cache.front()` to link new cases to their parent.
        const fast_cal_t *head = cache.front();
        if (((head->code >> target_shift) & field_mask) == BLOCK_2x2) {
            return RawCode::unsafe_create(head->code); // match target
        }
        core.next_cases(head->code, head->mask);
        cache.pop();
    }
    return FC_NOT_FOUND; // target not found
}
std::vector<RawCode> FastCal::solve_multi() { std::vector<RawCode> FastCal::solve_multi() {
return FastCal::target_multi(resolved); return FastCal::target_multi(resolved);
} }

Loading…
Cancel
Save