// AdventOfCode/2022/day6.cpp
//
// 163 lines
// 4.5 KiB
// C++

#include <bit>
#include <chrono>
#include <cinttypes>
#include <cstddef>
#include <exception>
#include <fstream>
#include <iostream>
#include <string>
#include <utility>
#include <vector>
// Number of positions find_first_unique_runs evaluates per inner-loop pass; also echoed by main.
constexpr size_t BATCH_SIZE = 64;
// Number of such batches needed to cover a 4096-entry mask buffer.
constexpr size_t BATCH_NUM = 4096 / BATCH_SIZE;
// Reports whether the `length` bytes of *s ending just before index `right`
// (i.e. the half-open range [right - length, right)) are pairwise distinct.
//
// s      - buffer to inspect; it is only read, never copied.
// right  - exclusive end index of the window.
// length - number of bytes in the window.
//
// Returns false when the window does not fit inside the buffer (right < length
// or right > s->size()). An empty window (length == 0) counts as unique.
bool substring_unique_copyless(std::vector<uint8_t> *s, size_t right, size_t length) {
    const std::vector<uint8_t> &bytes = *s;

    // Without this guard `right - length` wraps around for right < length, the
    // loops below are skipped, and a window that does not exist is reported unique.
    if (length > right || right > bytes.size()) {
        return false;
    }

    // Compare every byte against each later byte of the window.
    for (size_t i = right - length; i < right; i++) {
        for (size_t j = i + 1; j < right; j++) {
            if (bytes[i] == bytes[j]) {
                return false;
            }
        }
    }
    return true;
}
// Finds the first position at which the preceding `num` bytes of *s are all distinct.
//
// s    - buffer to scan.
// num  - window length that must consist of distinct bytes.
// skip - smallest end position to consider; values below `num` are raised to
//        `num`, because no complete window can end earlier than that.
//
// Returns the exclusive end index of the first qualifying window (the number of
// bytes consumed up to and including the window), or 0 when there is none.
size_t find_first_unique_run(std::vector<uint8_t> *s, size_t num, size_t skip) {
    const size_t first_end = skip < num ? num : skip;

    // `right` is an exclusive end, so s->size() itself is a valid candidate:
    // it denotes the window made of the final `num` bytes.
    for (size_t right = first_end; right <= s->size(); right++) {
        if (substring_unique_copyless(s, right, num)) {
            return right;
        }
    }
    return 0;
}
std::pair<size_t, size_t> find_first_unique_runs(std::vector<uint8_t> *s) {
size_t four = 0;
size_t fourteen = 0;
uint32_t masks[4096];
uint32_t scratch_masks[BATCH_SIZE];
uint8_t scratch_masks_bits[BATCH_SIZE];
for (int i=0; i<4096; i++) {
masks[i] = 1 << ((*s)[i]-'a');
}
// Turn masks into masks2. Indices are now +1.
for (int i=0; i<4095; i++) {
masks[i] |= masks[i+1];
}
for (int batch=1; batch<BATCH_NUM; batch++) {
for (int i=0; i<BATCH_SIZE; i++) {
int idx = batch*BATCH_SIZE + i;
scratch_masks[i] = masks[idx] | masks[idx-2];
scratch_masks_bits[i] = std::popcount(scratch_masks[i]);
}
for (int i=0; i<BATCH_SIZE; i++) {
if (scratch_masks_bits[i] == 4) {
four = batch*BATCH_SIZE + i;
goto four_found;
}
}
}
four_found:
// Turn masks2 into masks4. Indices are now +3.
for (int i=four; i<4093; i++) {
masks[i] |= masks[i+2];
}
// Turn masks4 into masks8. Indices are now +7.
for (int i=fourteen; i<4089; i++) {
masks[i] |= masks[i+4];
}
for (int batch=(four/BATCH_SIZE); batch<BATCH_NUM; batch++) {
for (int i=0; i<BATCH_SIZE; i++) {
int idx = batch*BATCH_SIZE + i;
scratch_masks[i] = masks[idx] | masks[idx-6];
scratch_masks_bits[i] = std::popcount(scratch_masks[i]);
}
for (int i=0; i<BATCH_SIZE; i++) {
if (scratch_masks_bits[i] == 14) {
fourteen = batch*BATCH_SIZE + i;
goto fourteen_found;
}
}
}
fourteen_found:
return std::pair<size_t, size_t>(four+2, fourteen+8);
}
// Locates the first run of 4 distinct letters and the first run of 14 distinct
// letters with a sliding XOR of one-bit letter masks.
//
// Each byte maps to a single bit ('a' -> bit 0 ... 'z' -> bit 25; any other
// byte, e.g. a trailing newline, maps to 0). XOR-ing the masks of a window
// cancels letters that occur an even number of times, so the popcount equals
// the window width exactly when every byte is a different letter.
//
// s - input buffer; scanned in full, whatever its length.
//
// Returns {count4, count14}: the number of bytes consumed up to and including
// the first 4-letter / 14-letter window of distinct letters. Either value is 0
// when no such window exists.
std::pair<size_t, size_t> find_first_unique_runs_xor(std::vector<uint8_t> *s) {
    const std::vector<uint8_t> &bytes = *s;
    const size_t size = bytes.size();

    // Unsigned subtraction wraps for bytes below 'a', so one comparison rejects
    // everything outside 'a'..'z' and the shift amount is always in range.
    auto letter_bit = [&bytes](size_t pos) -> uint32_t {
        const unsigned letter = static_cast<unsigned>(bytes[pos]) - static_cast<unsigned>('a');
        return letter < 26u ? (uint32_t{1} << letter) : uint32_t{0};
    };

    // Returns the smallest exclusive end position >= first_end whose preceding
    // `width` bytes are distinct letters, or 0 if there is none.
    auto first_marker = [&](size_t width, size_t first_end) -> size_t {
        if (first_end < width || first_end > size) {
            return 0;
        }
        uint32_t parity = 0;
        for (size_t pos = first_end - width; pos < first_end; pos++) {
            parity ^= letter_bit(pos);
        }
        for (size_t end = first_end;; end++) {
            // Test before sliding so the very first window is not skipped.
            if (static_cast<size_t>(std::popcount(parity)) == width) {
                return end;
            }
            if (end == size) {
                return 0;
            }
            // Slide by one: add the entering byte, cancel the leaving one.
            parity ^= letter_bit(end) ^ letter_bit(end - width);
        }
    };

    const size_t four = first_marker(4, 4);
    if (four == 0) {
        // Every 14-letter marker contains a 4-letter marker, so none can exist either.
        return std::pair<size_t, size_t>(0, 0);
    }

    // The first four bytes of a 14-marker are themselves a 4-marker, so it
    // cannot end earlier than 10 bytes after the first 4-marker does.
    const size_t fourteen = first_marker(14, four + 10);
    return std::pair<size_t, size_t>(four, fourteen);
}
// Benchmark driver: loads the puzzle input, runs the marker search repeatedly,
// then prints both answers and the elapsed time.
//
// Usage: a.out [filename [iterations]]
//   filename   - input file; defaults to "input/6".
//   iterations - positive repeat count; defaults to 1000000.
// Any other argument count runs with both defaults.
//
// Returns 0 on success, 1 when the iteration count or the input file is unusable.
int main(int argc, char **argv) {
    size_t iterations = 1000000;
    const char *filename = "input/6";

    if (argc == 2 || argc == 3) {  // a.out filename [iterations]
        filename = argv[1];
    }
    if (argc == 3) {  // a.out filename iterations
        try {
            const long long requested = std::stoll(argv[2]);
            // Zero would divide by zero in the per-iteration average below, and a
            // negative value would wrap to an enormous unsigned count.
            if (requested <= 0) {
                std::cerr << "Iteration count must be positive: " << argv[2] << '\n';
                return 1;
            }
            iterations = static_cast<size_t>(requested);
        } catch (const std::exception &) {
            std::cerr << "Invalid iteration count: " << argv[2] << '\n';
            return 1;
        }
    }

    // Open positioned at the end so the file size is known before reading.
    std::ifstream input_file(filename, std::ios::binary | std::ios::ate);
    const std::streamoff eof_position =
        input_file ? static_cast<std::streamoff>(input_file.tellg()) : -1;
    if (eof_position < 0) {
        std::cerr << "Could not open input file: " << filename << '\n';
        return 1;
    }
    std::vector<uint8_t> s(static_cast<size_t>(eof_position));
    input_file.seekg(0, std::ios::beg);
    if (!input_file.read(reinterpret_cast<char *>(s.data()), eof_position)) {
        std::cerr << "Could not read input file: " << filename << '\n';
        return 1;
    }

    // volatile keeps the compiler from discarding the repeated computations.
    size_t volatile four = 0;
    size_t volatile fourteen = 0;

    std::cout << "Running " << iterations << " iterations with batch size " << BATCH_SIZE << ":\n";

    // steady_clock is monotonic, which is what interval measurement needs.
    using bench_clock = std::chrono::steady_clock;
    const auto t0 = bench_clock::now();
    for (size_t i = 0; i < iterations; i++) {
        // Alternative implementations, kept for comparison:
        // four = find_first_unique_run(&s, 4, 4);
        // fourteen = find_first_unique_run(&s, 14, four);
        // auto result = find_first_unique_runs(&s);
        auto result = find_first_unique_runs_xor(&s);
        four = result.first;
        fourteen = result.second;
    }
    const auto t1 = bench_clock::now();

    const auto delta = t1 - t0;
    const auto per_iteration = delta / iterations;

    std::cout << "Part 1: " << four << '\n';
    std::cout << "Part 2: " << fourteen << '\n';
    std::cout << "Completed " << iterations << " iterations in "
              << std::chrono::duration_cast<std::chrono::milliseconds>(delta).count()
              << "ms (~"
              << std::chrono::duration_cast<std::chrono::nanoseconds>(per_iteration).count()
              << "ns each)\n";
    return 0;
}