From 96eb963b9032003c60886673fc631a1b2493ce2c Mon Sep 17 00:00:00 2001 From: Ken Hoover Date: Mon, 9 Sep 2024 16:09:04 -0700 Subject: [PATCH 1/5] 3x speedup of the distance transform. By avoiding checked adds and instead manually iterating over the correct windows of `RoomXY`s, we obtain a 3x speedup over the naive `filter_map`-based implementation. --- src/algorithms/distance_transform.rs | 215 ++++++++++++++++++++------- 1 file changed, 159 insertions(+), 56 deletions(-) diff --git a/src/algorithms/distance_transform.rs b/src/algorithms/distance_transform.rs index 141ac42..259fb8f 100644 --- a/src/algorithms/distance_transform.rs +++ b/src/algorithms/distance_transform.rs @@ -1,11 +1,13 @@ // Heavily based on https://github.com/Screeps-Tutorials/Screeps-Tutorials/blob/Master/basePlanningAlgorithms/distanceTransform.js use screeps::{ - self, - constants::{extra::ROOM_SIZE, Direction}, + constants::extra::ROOM_SIZE, local::{LocalCostMatrix, LocalRoomTerrain, RoomXY}, + RoomCoordinate, }; +use crate::room_coordinate::{range_exclusive, range_inclusive}; + /// Provides a Cost Matrix with values equal to the Chebyshev distance from any /// wall terrain. This does *not* calculate based on constructed walls, only /// terrain walls. @@ -29,67 +31,168 @@ pub fn chebyshev_distance_transform_from_terrain( /// This allows for calculating the distance transform from an arbitrary set of /// positions. Other position values in the initial Cost Matrix should be /// initialized to 255 (u8::MAX) to ensure the calculations work correctly. -pub fn chebyshev_distance_transform_from_cost_matrix( - initial_cm: LocalCostMatrix, -) -> LocalCostMatrix { - // Copy the initial cost matrix into the output cost matrix - let mut cm = initial_cm.clone(); - +pub fn chebyshev_distance_transform_from_cost_matrix(mut cm: LocalCostMatrix) -> LocalCostMatrix { + let zero = RoomCoordinate::new(0).unwrap(); + let one = RoomCoordinate::new(1).unwrap(); + let forty_eight = RoomCoordinate::new(ROOM_SIZE - 2).unwrap(); + let forty_nine = RoomCoordinate::new(ROOM_SIZE - 1).unwrap(); + let windowing_vec: Vec<_> = range_inclusive(zero, forty_nine).collect(); // Pass 1: Top-to-Bottom, Left-to-Right - for x in 0..ROOM_SIZE { - for y in 0..ROOM_SIZE { - let current_position = unsafe { RoomXY::unchecked_new(x, y) }; + // Phase A: first column + range_inclusive(one, forty_nine) + .map(|y| RoomXY { x: zero, y }) + .fold(cm.get(RoomXY { x: zero, y: zero }), |top, xy| { + let val = cm.get(xy).min(top.saturating_add(1)); + cm.set(xy, val); + val + }); - // The distance to the closest wall is the minimum of the current position value - // and all of its neighbors. However, since we're going TTB:LTR, we - // can ignore tiles we know we haven't visited yet: TopRight, Right, - // BottomRight, and Bottom. We could include them and their default - // max values should get ignored, but why waste the processing cycles? - let min_value = [ - Direction::Top, - Direction::TopLeft, - Direction::Left, - Direction::BottomLeft, - ] - .into_iter() - .filter_map(|dir| current_position.checked_add_direction(dir)) - .map(|position| cm.get(position)) - .min() - .map(|x| x.saturating_add(1)) - .map(|x| x.min(cm.get(current_position))) - .unwrap_or_else(|| cm.get(current_position)); - - cm.set(current_position, min_value); - } - } + // Phase B: the rest + range_inclusive(one, forty_nine) + .zip(range_inclusive(zero, forty_eight)) + .for_each(|(current_x, left_x)| { + let initial_top = cm + .get(RoomXY { + x: current_x, + y: zero, + }) + .min( + cm.get(RoomXY { x: left_x, y: zero }) + .min(cm.get(RoomXY { x: left_x, y: one })) + .saturating_add(1), + ); + cm.set( + RoomXY { + x: current_x, + y: zero, + }, + initial_top, + ); + let final_top = range_exclusive(zero, forty_nine) + .map(|y| RoomXY { x: current_x, y }) + .zip(windowing_vec.windows(3)) + .fold(initial_top, |top, (current_xy, lefts)| { + let val = lefts + .iter() + .copied() + .map(|y| RoomXY { x: left_x, y }) + .map(|xy| cm.get(xy)) + .min() + .unwrap() + .min(top) + .saturating_add(1) + .min(cm.get(current_xy)); + cm.set(current_xy, val); + val + }); + cm.set( + RoomXY { + x: current_x, + y: forty_nine, + }, + cm.get(RoomXY { + x: current_x, + y: forty_nine, + }) + .min( + final_top + .min(cm.get(RoomXY { + x: left_x, + y: forty_eight, + })) + .min(cm.get(RoomXY { + x: left_x, + y: forty_nine, + })) + .saturating_add(1), + ), + ); + }); // Pass 2: Bottom-to-Top, Right-to-Left - for x in (0..ROOM_SIZE).rev() { - for y in (0..ROOM_SIZE).rev() { - let current_position = unsafe { RoomXY::unchecked_new(x, y) }; - - // The same logic as with Pass 1 applies here, we're just going BTT:RTL instead, - // so the neighbors we ignore are: BottomLeft, Left, TopLeft, and - // Top. - let min_value = [ - Direction::Bottom, - Direction::Right, - Direction::BottomRight, - Direction::TopRight, - ] - .into_iter() - .filter_map(|dir| current_position.checked_add_direction(dir)) - .map(|position| cm.get(position)) - .min() - .map(|x| x.saturating_add(1)) - .map(|x| x.min(cm.get(current_position))) - .unwrap_or_else(|| cm.get(current_position)); + // Phase A: last column + range_inclusive(zero, forty_eight) + .map(|y| RoomXY { x: forty_nine, y }) + .fold( + cm.get(RoomXY { + x: forty_nine, + y: forty_nine, + }), + |bottom, xy| { + let val = cm.get(xy).min(bottom.saturating_add(1)); + cm.set(xy, val); + val + }, + ); - cm.set(current_position, min_value); - } - } + // Phase B: the rest + range_inclusive(zero, forty_eight) + .rev() + .zip(range_inclusive(one, forty_nine).rev()) + .for_each(|(current_x, right_x)| { + let initial_bottom = cm + .get(RoomXY { + x: current_x, + y: forty_nine, + }) + .min( + cm.get(RoomXY { + x: right_x, + y: forty_nine, + }) + .min(cm.get(RoomXY { + x: right_x, + y: forty_eight, + })) + .saturating_add(1), + ); + cm.set( + RoomXY { + x: current_x, + y: forty_nine, + }, + initial_bottom, + ); + let final_bottom = range_exclusive(zero, forty_nine) + .rev() + .map(|y| RoomXY { x: current_x, y }) + .zip(windowing_vec.windows(3).rev()) + .fold(initial_bottom, |bottom, (current_xy, rights)| { + let val = rights + .iter() + .copied() + .map(|y| RoomXY { x: right_x, y }) + .map(|xy| cm.get(xy)) + .min() + .unwrap() + .min(bottom) + .saturating_add(1) + .min(cm.get(current_xy)); + cm.set(current_xy, val); + val + }); + cm.set( + RoomXY { + x: current_x, + y: zero, + }, + cm.get(RoomXY { + x: current_x, + y: zero, + }) + .min( + final_bottom + .min(cm.get(RoomXY { + x: right_x, + y: zero, + })) + .min(cm.get(RoomXY { x: right_x, y: one })) + .saturating_add(1), + ), + ); + }); cm } From d96a1e6a73fc92bccfbb8389f6d9da5741761091 Mon Sep 17 00:00:00 2001 From: Ken Hoover Date: Mon, 9 Sep 2024 16:10:47 -0700 Subject: [PATCH 2/5] Import formatting --- src/algorithms/distance_transform.rs | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/algorithms/distance_transform.rs b/src/algorithms/distance_transform.rs index 259fb8f..2bd0f0e 100644 --- a/src/algorithms/distance_transform.rs +++ b/src/algorithms/distance_transform.rs @@ -2,8 +2,7 @@ use screeps::{ constants::extra::ROOM_SIZE, - local::{LocalCostMatrix, LocalRoomTerrain, RoomXY}, - RoomCoordinate, + local::{LocalCostMatrix, LocalRoomTerrain, RoomCoordinate, RoomXY}, }; use crate::room_coordinate::{range_exclusive, range_inclusive}; From ea510a3336564b5286e8f5d176170a23627cd30a Mon Sep 17 00:00:00 2001 From: Ken Hoover Date: Mon, 9 Sep 2024 16:33:55 -0700 Subject: [PATCH 3/5] Squeeze some more performance out. Get rid of the windowing vector, map to the array of surrounding y- coordinates. --- src/algorithms/distance_transform.rs | 32 ++++++++++++++++++---------- 1 file changed, 21 insertions(+), 11 deletions(-) diff --git a/src/algorithms/distance_transform.rs b/src/algorithms/distance_transform.rs index 2bd0f0e..7bfacd0 100644 --- a/src/algorithms/distance_transform.rs +++ b/src/algorithms/distance_transform.rs @@ -35,7 +35,6 @@ pub fn chebyshev_distance_transform_from_cost_matrix(mut cm: LocalCostMatrix) -> let one = RoomCoordinate::new(1).unwrap(); let forty_eight = RoomCoordinate::new(ROOM_SIZE - 2).unwrap(); let forty_nine = RoomCoordinate::new(ROOM_SIZE - 1).unwrap(); - let windowing_vec: Vec<_> = range_inclusive(zero, forty_nine).collect(); // Pass 1: Top-to-Bottom, Left-to-Right // Phase A: first column @@ -69,12 +68,18 @@ pub fn chebyshev_distance_transform_from_cost_matrix(mut cm: LocalCostMatrix) -> initial_top, ); let final_top = range_exclusive(zero, forty_nine) - .map(|y| RoomXY { x: current_x, y }) - .zip(windowing_vec.windows(3)) + .map(|y| { + (RoomXY { x: current_x, y }, unsafe { + [ + RoomCoordinate::unchecked_new(y.u8() - 1), + y, + RoomCoordinate::unchecked_new(y.u8() + 1), + ] + }) + }) .fold(initial_top, |top, (current_xy, lefts)| { let val = lefts - .iter() - .copied() + .into_iter() .map(|y| RoomXY { x: left_x, y }) .map(|xy| cm.get(xy)) .min() @@ -155,13 +160,18 @@ pub fn chebyshev_distance_transform_from_cost_matrix(mut cm: LocalCostMatrix) -> initial_bottom, ); let final_bottom = range_exclusive(zero, forty_nine) - .rev() - .map(|y| RoomXY { x: current_x, y }) - .zip(windowing_vec.windows(3).rev()) - .fold(initial_bottom, |bottom, (current_xy, rights)| { + .map(|y| { + (RoomXY { x: current_x, y }, unsafe { + [ + RoomCoordinate::unchecked_new(y.u8() - 1), + y, + RoomCoordinate::unchecked_new(y.u8() + 1), + ] + }) + }) + .rfold(initial_bottom, |bottom, (current_xy, rights)| { let val = rights - .iter() - .copied() + .into_iter() .map(|y| RoomXY { x: right_x, y }) .map(|xy| cm.get(xy)) .min() From 85d916d15f81633f703fb6fdc63d3aed462b7831 Mon Sep 17 00:00:00 2001 From: Ken Hoover Date: Mon, 9 Sep 2024 19:02:35 -0700 Subject: [PATCH 4/5] Fixes bug in chebyshev dt, adds manhattan dt --- benches/distance_transform.rs | 10 ++- src/algorithms/distance_transform.rs | 128 ++++++++++++++++++++++++++- 2 files changed, 135 insertions(+), 3 deletions(-) diff --git a/benches/distance_transform.rs b/benches/distance_transform.rs index f1b0777..9676b7e 100644 --- a/benches/distance_transform.rs +++ b/benches/distance_transform.rs @@ -9,7 +9,13 @@ mod benches { #[bench] fn bench_chebyshev_distance_transform(b: &mut Bencher) { - let terrain = LocalRoomTerrain::new_from_bits(Box::new([0; 2500])); - b.iter(|| black_box(chebyshev_distance_transform_from_terrain(&terrain))); + let mut terrain = LocalRoomTerrain::new_from_bits(Box::new([0; 2500])); + b.iter(|| black_box(chebyshev_distance_transform_from_terrain(&*black_box(&mut terrain)))); + } + + #[bench] + fn bench_manhattan_distance_transform(b: &mut Bencher) { + let mut terrain = LocalRoomTerrain::new_from_bits(Box::new([0; 2500])); + b.iter(|| black_box(manhattan_distance_transform_from_terrain(&*black_box(&mut terrain)))); } } diff --git a/src/algorithms/distance_transform.rs b/src/algorithms/distance_transform.rs index 7bfacd0..378c001 100644 --- a/src/algorithms/distance_transform.rs +++ b/src/algorithms/distance_transform.rs @@ -119,7 +119,7 @@ pub fn chebyshev_distance_transform_from_cost_matrix(mut cm: LocalCostMatrix) -> // Phase A: last column range_inclusive(zero, forty_eight) .map(|y| RoomXY { x: forty_nine, y }) - .fold( + .rfold( cm.get(RoomXY { x: forty_nine, y: forty_nine, @@ -205,3 +205,129 @@ pub fn chebyshev_distance_transform_from_cost_matrix(mut cm: LocalCostMatrix) -> cm } + +/// Provides a Cost Matrix with values equal to the Manhattan distance from any +/// wall terrain. This does *not* calculate based on constructed walls, only +/// terrain walls. +pub fn manhattan_distance_transform_from_terrain( + room_terrain: &LocalRoomTerrain, +) -> LocalCostMatrix { + let mut initial_cm = LocalCostMatrix::new(); + + for (xy, cm_val) in initial_cm.iter_mut() { + *cm_val = match room_terrain.get_xy(xy) { + screeps::constants::Terrain::Wall => 0, + _ => u8::MAX, + }; + } + manhattan_distance_transform_from_cost_matrix(initial_cm) +} + +/// Provides a Cost Matrix with values equal to the Manhattan distance from any +/// position in the provided initial Cost Matrix with a value set to 0. +/// +/// This allows for calculating the distance transform from an arbitrary set of +/// positions. Other position values in the initial Cost Matrix should be +/// initialized to 255 (u8::MAX) to ensure the calculations work correctly. +pub fn manhattan_distance_transform_from_cost_matrix(mut cm: LocalCostMatrix) -> LocalCostMatrix { + let zero = RoomCoordinate::new(0).unwrap(); + let one = RoomCoordinate::new(1).unwrap(); + let forty_eight = RoomCoordinate::new(ROOM_SIZE - 2).unwrap(); + let forty_nine = RoomCoordinate::new(ROOM_SIZE - 1).unwrap(); + // Pass 1: Top-to-Bottom, Left-to-Right + + // Phase A: first column + range_inclusive(one, forty_nine) + .map(|y| RoomXY { x: zero, y }) + .fold(cm.get(RoomXY { x: zero, y: zero }), |top, xy| { + let val = cm.get(xy).min(top.saturating_add(1)); + cm.set(xy, val); + val + }); + + // Phase B: the rest + range_inclusive(one, forty_nine) + .zip(range_inclusive(zero, forty_eight)) + .for_each(|(current_x, left_x)| { + let initial_top = cm + .get(RoomXY { + x: current_x, + y: zero, + }) + .min(cm.get(RoomXY { x: left_x, y: zero }).saturating_add(1)); + cm.set( + RoomXY { + x: current_x, + y: zero, + }, + initial_top, + ); + range_inclusive(one, forty_nine) + .map(|y| (RoomXY { x: current_x, y }, RoomXY { x: left_x, y })) + .fold(initial_top, |top, (current_xy, left_xy)| { + let val = cm + .get(left_xy) + .min(top) + .saturating_add(1) + .min(cm.get(current_xy)); + cm.set(current_xy, val); + val + }); + }); + + // Pass 2: Bottom-to-Top, Right-to-Left + + // Phase A: last column + range_inclusive(zero, forty_eight) + .map(|y| RoomXY { x: forty_nine, y }) + .rfold( + cm.get(RoomXY { + x: forty_nine, + y: forty_nine, + }), + |bottom, xy| { + let val = cm.get(xy).min(bottom.saturating_add(1)); + cm.set(xy, val); + val + }, + ); + + // Phase B: the rest + range_inclusive(zero, forty_eight) + .rev() + .zip(range_inclusive(one, forty_nine).rev()) + .for_each(|(current_x, right_x)| { + let initial_bottom = cm + .get(RoomXY { + x: current_x, + y: forty_nine, + }) + .min( + cm.get(RoomXY { + x: right_x, + y: forty_nine, + }) + .saturating_add(1), + ); + cm.set( + RoomXY { + x: current_x, + y: forty_nine, + }, + initial_bottom, + ); + range_inclusive(zero, forty_eight) + .map(|y| (RoomXY { x: current_x, y }, RoomXY { x: right_x, y })) + .rfold(initial_bottom, |bottom, (current_xy, right_xy)| { + let val = cm + .get(right_xy) + .min(bottom) + .saturating_add(1) + .min(cm.get(current_xy)); + cm.set(current_xy, val); + val + }); + }); + + cm +} From 9b7421f87fe219347759b7498e776d2ce29b40fb Mon Sep 17 00:00:00 2001 From: Ken Hoover Date: Mon, 9 Sep 2024 19:11:24 -0700 Subject: [PATCH 5/5] Fix fmt --- benches/distance_transform.rs | 12 ++++++++++-- 1 file changed, 10 insertions(+), 2 deletions(-) diff --git a/benches/distance_transform.rs b/benches/distance_transform.rs index 9676b7e..aaa7622 100644 --- a/benches/distance_transform.rs +++ b/benches/distance_transform.rs @@ -10,12 +10,20 @@ mod benches { #[bench] fn bench_chebyshev_distance_transform(b: &mut Bencher) { let mut terrain = LocalRoomTerrain::new_from_bits(Box::new([0; 2500])); - b.iter(|| black_box(chebyshev_distance_transform_from_terrain(&*black_box(&mut terrain)))); + b.iter(|| { + black_box(chebyshev_distance_transform_from_terrain(&*black_box( + &mut terrain, + ))) + }); } #[bench] fn bench_manhattan_distance_transform(b: &mut Bencher) { let mut terrain = LocalRoomTerrain::new_from_bits(Box::new([0; 2500])); - b.iter(|| black_box(manhattan_distance_transform_from_terrain(&*black_box(&mut terrain)))); + b.iter(|| { + black_box(manhattan_distance_transform_from_terrain(&*black_box( + &mut terrain, + ))) + }); } }