Faster approach caching precomputed blocks of jump offsets

maneatingape · maneatingape · commit 28b35cb7a1ab · 2024-09-13T21:14:41.000+02:00
diff --git a/README.md b/README.md
@@ -53,7 +53,7 @@ Place input files in `input/yearYYYY/dayDD.txt` including leading zeroes. For ex
 ## Performance
 
 Benchmarks are measured using the built-in `cargo bench` tool run on an [Apple M2 Max][apple-link].
-All 225 solutions from 2023 to 2015 complete sequentially in **594 milliseconds**.
+All 225 solutions from 2023 to 2015 complete sequentially in **581 milliseconds**.
 Interestingly 84% of the total time is spent on just 9 solutions.
 Performance is reasonable even on older hardware, for example a 2011 MacBook Pro with an
 [Intel i7-2720QM][intel-link] processor takes 3.5 seconds to run the same 225 solutions.
@@ -68,7 +68,7 @@ Performance is reasonable even on older hardware, for example a 2011 MacBook Pro
 | [2020](#2020) | 272 |
 | [2019](#2019) | 16 |
 | [2018](#2018) | 35 |
-| [2017](#2017) | 102 |
+| [2017](#2017) | 89 |
 | [2016](#2016) | 120 |
 | [2015](#2015) | 24 |
 
@@ -274,7 +274,7 @@ Performance is reasonable even on older hardware, for example a 2011 MacBook Pro
 | 2 | [Corruption Checksum](https://adventofcode.com/2017/day/2) | [Source](src/year2017/day02.rs) | 2 |
 | 3 | [Spiral Memory](https://adventofcode.com/2017/day/3) | [Source](src/year2017/day03.rs) | 2 |
 | 4 | [High-Entropy Passphrases](https://adventofcode.com/2017/day/4) | [Source](src/year2017/day04.rs) | 98 |
-| 5 | [A Maze of Twisty Trampolines, All Alike](https://adventofcode.com/2017/day/5) | [Source](src/year2017/day05.rs) | 36000 |
+| 5 | [A Maze of Twisty Trampolines, All Alike](https://adventofcode.com/2017/day/5) | [Source](src/year2017/day05.rs) | 22000 |
 | 6 | [Memory Reallocation](https://adventofcode.com/2017/day/6) | [Source](src/year2017/day06.rs) | 81 |
 | 7 | [Recursive Circus](https://adventofcode.com/2017/day/7) | [Source](src/year2017/day07.rs) | 93 |
 | 8 | [I Heard You Like Registers](https://adventofcode.com/2017/day/8) | [Source](src/year2017/day08.rs) | 47 |
diff --git a/docs/pie-2017.svg b/docs/pie-2017.svg
@@ -2,9 +2,9 @@
 %%{init: {"themeVariables": { "pie1": "#7cb5ec", "pie2": "#90ed7d", "pie3": "#f7a35c", "pie4": "#c6cdd5"}}}%%
 pie
     title Year 2017 benchmark time by % of total
-    "Day 5" : 36000
     "Day 22" : 36000
     "Day 15" : 26000
+    "Day 5" : 22000
     "Others" : 5387
 -->
 <svg viewBox="0 0 1350 450" preserveAspectRatio="xMidYMin" xmlns="http://www.w3.org/2000/svg">
@@ -17,30 +17,31 @@ pie
 	</style>
 	<g transform="translate(675,225)">
 		<circle class="pieOuterCircle" cx="0" cy="0" r="186"/>
-		<path class="pieCircle" d="M0,-185A185,185,0,0,1,150.884,107.047L0,0Z" fill="#7cb5ec"/>
-		<path class="pieCircle" d="M150.884,107.047A185,185,0,0,1,-174.612,61.119L0,0Z" fill="#90ed7d"/>
-		<path class="pieCircle" d="M-174.612,61.119A185,185,0,0,1,-59.49,-175.174L0,0Z" fill="#f7a35c"/>
-		<path class="pieCircle" d="M-59.49,-175.174A185,185,0,0,1,0,-185L0,0Z" fill="#c6cdd5"/>
-		<text class="slice" style="text-anchor: middle;" transform="translate(123.27022509526007,-63.68684404933184)">35%</text>
-		<text class="slice" style="text-anchor: middle;" transform="translate(-19.385509928176543,137.38909893009915)">35%</text>
-		<text class="slice" style="text-anchor: middle;" transform="translate(-124.73386631798299,-60.77026487820792)">25%</text>
-		<text class="slice" style="text-anchor: middle;" transform="translate(-22.611149862440893,-136.89520956519348)">5%</text>
+		<path class="pieCircle" d="M0,-185A185,185,0,0,1,106.145,151.52L0,0Z" fill="#7cb5ec"/>
+		<path class="pieCircle" d="M106.145,151.52A185,185,0,0,1,-173.51,64.181L0,0Z" fill="#90ed7d"/>
+		<path class="pieCircle" d="M-173.51,64.181A185,185,0,0,1,-68.39,-171.895L0,0Z" fill="#f7a35c"/>
+		<path class="pieCircle" d="M-68.39,-171.895A185,185,0,0,1,0,-185L0,0Z" fill="#c6cdd5"/>
+		<text class="slice" style="text-anchor: middle;" transform="translate(132.3236843880879,-41.737334006398854)">40%</text>
+		<text class="slice" style="text-anchor: middle;" transform="translate(-41.36279061783987,132.44123999836583)">29%</text>
+		<text class="slice" style="text-anchor: middle;" transform="translate(-126.75198587075634,-56.440203559338684)">25%</text>
+		<text class="slice" style="text-anchor: middle;" transform="translate(-26.113057520486457,-136.27057909516552)">6%</text>
 		<text class="pieTitleText" x="0" y="-200">Year 2017 benchmark time by % of total</text>
 		<g transform="translate(216,-44)">
 			<rect height="18" style="fill: rgb(124, 181, 236); stroke: rgb(124, 181, 236);" width="18"/>
-			<text x="22" y="14">Day 5</text>
+			<text x="22" y="14">Day 22</text>
 		</g>
 		<g transform="translate(216,-22)">
 			<rect height="18" style="fill: rgb(144, 237, 125); stroke: rgb(144, 237, 125);" width="18"/>
-			<text x="22" y="14">Day 22</text>
+			<text x="22" y="14">Day 15</text>
 		</g>
 		<g transform="translate(216,0)">
 			<rect height="18" style="fill: rgb(247, 163, 92); stroke: rgb(247, 163, 92);" width="18"/>
-			<text x="22" y="14">Day 15</text>
+			<text x="22" y="14">Day 5</text>
 		</g>
 		<g transform="translate(216,22)">
 			<rect height="18" style="fill: rgb(198, 205, 213); stroke: rgb(198, 205, 213);" width="18"/>
 			<text x="22" y="14">Others</text>
 		</g>
 	</g>
+	</g>
 </svg>
diff --git a/docs/pie-all.svg b/docs/pie-all.svg
@@ -4,9 +4,9 @@ pie
 	title Each year benchmark time by % of total
 	"Year 2020" : 272
 	"Year 2016" : 120
-    "Year 2017" : 102
-    "Year 2018" : 35
+    "Year 2017" : 89
 	"Years 2015, 2019, 2021, 2022, 2023" : 65
+    "Year 2018" : 35
 -->
 <svg viewBox="0 0 1350 450" preserveAspectRatio="xMidYMin" xmlns="http://www.w3.org/2000/svg">
 	<style>
@@ -18,16 +18,16 @@ pie
 	</style>
 	<g transform="translate(675,225)">
 		<circle class="pieOuterCircle" cx="0" cy="0" r="186"/>
-		<path class="pieCircle" d="M0,-185A185,185,0,0,1,48.354,178.569L0,0Z" fill="#7cb5ec"/>
-		<path class="pieCircle" d="M48.354,178.569A185,185,0,0,1,-156.159,99.194L0,0Z" fill="#90ed7d"/>
-		<path class="pieCircle" d="M-156.159,99.194A185,185,0,0,1,-161.184,-90.8L0,0Z" fill="#f7a35c"/>
-		<path class="pieCircle" d="M-161.184,-90.8A185,185,0,0,1,-66.937,-172.466L0,0Z" fill="#e4d354"/>
-		<path class="pieCircle" d="M-66.937,-172.466A185,185,0,0,1,0,-185L0,0Z" fill="#e4c4fb"/>
-		<text class="slice" style="text-anchor: middle;" transform="translate(137.53890821276758,-18.292381683091275)">46%</text>
-		<text class="slice" style="text-anchor: middle;" transform="translate(-50.20277472318857,129.3493096622196)">20%</text>
-		<text class="slice" style="text-anchor: middle;" transform="translate(-138.7014885169856,3.6687304578717295)">17%</text>
-		<text class="slice" style="text-anchor: middle;" transform="translate(-90.86192683490827,-104.86025344165337)">11%</text>
-		<text class="slice" style="text-anchor: middle;" transform="translate(-25.537675935439314,-136.37957914518026)">6%</text>
+		<path class="pieCircle" d="M0,-185A185,185,0,0,1,36.766,181.31L0,0Z" fill="#7cb5ec"/>
+		<path class="pieCircle" d="M36.766,181.31A185,185,0,0,1,-164.677,84.3L0,0Z" fill="#90ed7d"/>
+		<path class="pieCircle" d="M-164.677,84.3A185,185,0,0,1,-163.288,-86.96L0,0Z" fill="#f7a35c"/>
+		<path class="pieCircle" d="M-163.288,-86.96A185,185,0,0,1,-68.363,-171.905L0,0Z" fill="#e4d354"/>
+		<path class="pieCircle" d="M-68.363,-171.905A185,185,0,0,1,0,-185L0,0Z" fill="#e4c4fb"/>
+		<text class="slice" style="text-anchor: middle;" transform="translate(138.05636380255447,-13.856511596239887)">47%</text>
+		<text class="slice" style="text-anchor: middle;" transform="translate(-60.201368802561184,125.00943042146065)">21%</text>
+		<text class="slice" style="text-anchor: middle;" transform="translate(-138.74543615786084,-1.1253645475836986)">15%</text>
+		<text class="slice" style="text-anchor: middle;" transform="translate(-92.52549393814081,-103.39533583050577)">11%</text>
+		<text class="slice" style="text-anchor: middle;" transform="translate(-26.10232465364791,-136.27263535895813)">6%</text>
 		<text class="pieTitleText" x="0" y="-200">Each year benchmark time by % of total</text>
 		<g transform="translate(216,-55)">
 			<rect height="18" style="fill: rgb(124, 181, 236); stroke: rgb(124, 181, 236);" width="18"/>
diff --git a/src/year2017/day05.rs b/src/year2017/day05.rs
@@ -1,40 +1,105 @@
 //! # A Maze of Twisty Trampolines, All Alike
+//!
+//! Part one brute forces the jumps. For part two we can make an observation that the jump offsets
+//! will eventually flip flop between 2 and 3 starting from the beginning, for example:
+//!
+//! ```none
+//!     2 3 2 3 -1
+//! ```
+//!
+//! The twos and threes can be represented in binary compact form, using 0 for 2 and 1 for 3:
+//!
+//! ```none
+//!     0101
+//! ```
+//!
+//! We then precompute all possible combinations for blocks of size 16, using this to accelerate
+//! part two.
 use crate::util::parse::*;
 
+const WIDTH: usize = 16;
+const LENGTH: usize = 1 << WIDTH;
+
 pub fn parse(input: &str) -> Vec<i32> {
     input.iter_signed().collect()
 }
 
-pub fn part1(input: &[i32]) -> u32 {
+/// Brute force implementation.
+pub fn part1(input: &[i32]) -> usize {
     let mut jump = input.to_vec();
+    let mut total = 0;
     let mut index = 0;
-    let mut result = 0;
 
     while index < jump.len() {
         let next = index.wrapping_add(jump[index] as usize);
         jump[index] += 1;
+        total += 1;
         index = next;
-        result += 1;
     }
 
-    result
+    total
 }
 
-pub fn part2(input: &[i32]) -> u32 {
+#[expect(clippy::needless_range_loop)]
+pub fn part2(input: &[i32]) -> usize {
     let mut jump = input.to_vec();
+    let mut total = 0;
     let mut index = 0;
-    let mut result = 0;
+
+    let mut fine = 0;
+    let mut coarse = 0;
+    let mut compact = Vec::new();
+    let mut cache = vec![[(0_u16, 0_u8, 0_u8); LENGTH]; WIDTH];
+
+    // Precompute all possible combinations. For each binary starting number we can start at any
+    // offset from 0..16.
+    for i in 0..WIDTH {
+        for j in 0..LENGTH {
+            let mut offset = i as u16;
+            let mut value = j as u16;
+            let mut steps = 0;
+
+            while offset < 16 {
+                value ^= 1 << offset;
+                steps += 1;
+                offset += 3 - ((value >> offset) & 1);
+            }
+
+            cache[i][j] = (value, steps, offset as u8 - i as u8);
+        }
+    }
 
     while index < jump.len() {
-        let next = index.wrapping_add(jump[index] as usize);
-        if jump[index] < 3 {
-            jump[index] += 1;
+        if index < coarse {
+            // Index lies within precomputed blocks.
+            let base = index / 16;
+            let offset = index % 16;
+            let value = compact[base] as usize;
+            let (next, steps, delta) = cache[offset][value];
+
+            compact[base] = next;
+            total += steps as usize;
+            index += delta as usize;
         } else {
-            jump[index] -= 1;
+            // Fall back to part one approach.
+            let next = index.wrapping_add(jump[index] as usize);
+            jump[index] += if jump[index] == 3 { -1 } else { 1 };
+            total += 1;
+
+            // The frontier of twos and threes advances through the jump offsets.
+            // Each time it crosses a block of 16 add to the compact binary representation.
+            if jump[index] == 2 && index == fine {
+                fine += 1;
+                if fine % 16 == 0 {
+                    let value = (coarse..fine).rev().fold(0, |acc, i| (acc << 1) | (jump[i] & 1));
+                    coarse = fine;
+                    compact.push(value as u16);
+                }
+            }
+
+            index = next;
         }
-        index = next;
-        result += 1;
     }
 
-    result
+    total
 }