diff --git a/.devcontainer/postCreate.sh b/.devcontainer/postCreate.sh
index fdfd6c4..4c7490e 100755
--- a/.devcontainer/postCreate.sh
+++ b/.devcontainer/postCreate.sh
@@ -10,7 +10,7 @@ pip install -e . || { echo "Failed to install the current directory as a package
 pip install -e ./fast-pysf || { echo "Failed to install ./fast-pysf as a package"; exit 1; }
 
 # Set the display environment variable for GUI applications based on the host OS
-if [[ $HOST_OS == *"Windows"* ]]; then
+if [[ "$HOST_OS" == *"Windows"* ]]; then
     # We are in Windows
     echo "export DISPLAY=host.docker.internal:0.0" >> ~/.bashrc || { echo "Failed to set DISPLAY environment variable for Windows"; exit 1; }
 else
diff --git a/.gitignore b/.gitignore
index 3a7a5fe..79c59bc 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,18 +1,19 @@
-__pycache__/
-.scannerwork
-.pytest_cache
 *.c
+*.egg-info
 *.o
 *.so
-profile.json
+*training*.zip
+.pytest_cache
+.scannerwork
+__pycache__/
 build
-*.egg-info
 file.log
-profiles
-model
 images
+logs
+model
+profile.json
+profiles
 pysf_tests
 pysocialforce
-logs
-*training*.zip
+recordings/*.pkl
 wandb
\ No newline at end of file
diff --git a/examples/demo_offensive.py b/examples/demo_offensive.py
index 59fd510..55caa4b 100644
--- a/examples/demo_offensive.py
+++ b/examples/demo_offensive.py
@@ -9,7 +9,7 @@ def training():
     env_config = EnvSettings(
         sim_config=SimulationSettings(difficulty=0, ped_density_by_difficulty=[0.02]),
         robot_config=BicycleDriveSettings(radius=0.5, max_accel=3.0, allow_backwards=True))
-    env = RobotEnv(env_config, debug=True)
+    env = RobotEnv(env_config, debug=True, recording_enabled=True)
 
     model = PPO.load("./model/run_043", env=env)
     obs = env.reset()
diff --git a/recordings/README.md b/recordings/README.md
new file mode 100644
index 0000000..5445a56
--- /dev/null
+++ b/recordings/README.md
@@ -0,0 +1,4 @@
+# Recordings
+
+The folder where recordings are stored by default.
+Recordings are listed in `.gitignore`, so they are not committed to the repository.
diff --git a/robot_sf/gym_env/robot_env.py b/robot_sf/gym_env/robot_env.py
index 57bb655..7bb481e 100644
--- a/robot_sf/gym_env/robot_env.py
+++ b/robot_sf/gym_env/robot_env.py
@@ -1,234 +1,291 @@
-"""
-`robot_env.py` is a module that defines the simulation environment for a robot or multiple robots.
-It includes classes and protocols for defining the robot's state, actions, and
-observations within the environment.
-
-`RobotEnv`: A class that represents the robot's environment. It inherits from `VectorEnv`
-from the `gymnasium` library, which is a base class for environments that operate over
-vectorized actions and observations. It includes methods for stepping through the environment,
-resetting it, rendering it, and closing it.
-It also defines the action and observation spaces for the robot.
-""" - -from typing import Tuple, Callable -from copy import deepcopy - -import numpy as np - -from gymnasium import Env -from gymnasium.utils import seeding - -from robot_sf.robot.robot_state import RobotState -from robot_sf.gym_env.env_config import EnvSettings -from robot_sf.sensor.range_sensor import lidar_ray_scan - -from robot_sf.render.sim_view import ( - SimulationView, - VisualizableAction, - VisualizableSimState) -from robot_sf.sim.simulator import init_simulators -from robot_sf.gym_env.reward import simple_reward -from robot_sf.gym_env.env_util import init_collision_and_sensors, init_spaces - -Vec2D = Tuple[float, float] -PolarVec2D = Tuple[float, float] -RobotPose = Tuple[Vec2D, float] - - -class RobotEnv(Env): - """ - Representing a Gymnasium environment for training a self-driving robot - with reinforcement learning. - """ - - def __init__( - self, - env_config: EnvSettings = EnvSettings(), - reward_func: Callable[[dict], float] = simple_reward, - debug: bool = False - ): - """ - Initialize the Robot Environment. - - Parameters: - - env_config (EnvSettings): Configuration for environment settings. - - reward_func (Callable[[dict], float]): Reward function that takes - a dictionary as input and returns a float as reward. - - debug (bool): If True, enables debugging information such as - visualizations. - """ - - # Environment configuration details - self.env_config = env_config - - # Extract first map definition; currently only supports using the first map - map_def = env_config.map_pool.choose_random_map() - - # Initialize spaces based on the environment configuration and map - self.action_space, self.observation_space, orig_obs_space = \ - init_spaces(env_config, map_def) - - # Assign the reward function and debug flag - self.reward_func = reward_func - self.debug = debug - - # Initialize simulator with a random start position - self.simulator = init_simulators( - env_config, - map_def, - random_start_pos=True - )[0] - - # Delta time per simulation step and maximum episode time - d_t = env_config.sim_config.time_per_step_in_secs - max_ep_time = env_config.sim_config.sim_time_in_secs - - # Initialize collision detectors and sensor data processors - occupancies, sensors = init_collision_and_sensors( - self.simulator, - env_config, - orig_obs_space - ) - - # Setup initial state of the robot - self.state = RobotState( - self.simulator.robot_navs[0], - occupancies[0], - sensors[0], - d_t, - max_ep_time) - - # Store last action executed by the robot - self.last_action = None - - # If in debug mode, create a simulation view to visualize the state - if debug: - self.sim_ui = SimulationView( - scaling=10, - map_def=map_def, - obstacles=map_def.obstacles, - robot_radius=env_config.robot_config.radius, - ped_radius=env_config.sim_config.ped_radius, - goal_radius=env_config.sim_config.goal_radius) - - # Display the simulation UI - self.sim_ui.show() - - def step(self, action): - """ - Execute one time step within the environment. - - Parameters: - - action: Action to be executed. - - Returns: - - obs: Observation after taking the action. - - reward: Calculated reward for the taken action. - - term: Boolean indicating if the episode has terminated. - - info: Additional information as dictionary. 
- """ - # Process the action through the simulator - action = self.simulator.robots[0].parse_action(action) - self.last_action = action - # Perform simulation step - self.simulator.step_once([action]) - # Get updated observation - obs = self.state.step() - # Fetch metadata about the current state - meta = self.state.meta_dict() - # Determine if the episode has reached terminal state - term = self.state.is_terminal - # Compute the reward using the provided reward function - reward = self.reward_func(meta) - return obs, reward, term, {"step": meta["step"], "meta": meta} - - def reset(self): - """ - Reset the environment state to start a new episode. - - Returns: - - obs: The initial observation after resetting the environment. - """ - # Reset internal simulator state - self.simulator.reset_state() - # Reset the environment's state and return the initial observation - obs = self.state.reset() - return obs - - def render(self): - """ - Render the environment visually if in debug mode. - - Raises RuntimeError if debug mode is not enabled. - """ - if not self.sim_ui: - raise RuntimeError( - 'Debug mode is not activated! Consider setting ' - 'debug=True!') - - # Prepare action visualization, if any action was executed - action = None if not self.last_action else VisualizableAction( - self.simulator.robot_poses[0], - self.last_action, - self.simulator.goal_pos[0]) - - # Robot position and LIDAR scanning visualization preparation - robot_pos = self.simulator.robot_poses[0][0] - distances, directions = lidar_ray_scan( - self.simulator.robot_poses[0], - self.state.occupancy, - self.env_config.lidar_config) - - # Construct ray vectors for visualization - ray_vecs = zip( - np.cos(directions) * distances, - np.sin(directions) * distances - ) - ray_vecs_np = np.array([[ - [robot_pos[0], robot_pos[1]], - [robot_pos[0] + x, robot_pos[1] + y] - ] for x, y in ray_vecs] - ) - - # Prepare pedestrian action visualization - ped_actions = zip( - self.simulator.pysf_sim.peds.pos(), - self.simulator.pysf_sim.peds.pos() + - self.simulator.pysf_sim.peds.vel() * 2) - ped_actions_np = np.array([[pos, vel] for pos, vel in ped_actions]) - - # Package the state for visualization - state = VisualizableSimState( - self.state.timestep, action, self.simulator.robot_poses[0], - deepcopy(self.simulator.ped_pos), ray_vecs_np, ped_actions_np) - - # Execute rendering of the state through the simulation UI - self.sim_ui.render(state) - - def seed(self, seed=None): - """ - Set the seed for this env's random number generator(s). - - Note: - Some environments use multiple pseudorandom number generators. - We want to capture all such seeds used in order to ensure that - there aren't accidental correlations between multiple generators. - - Returns: - list: Returns the list of seeds used in this env's random - number generators. The first value in the list should be the - "main" seed, or the value which a reproducer should pass to - 'seed'. Often, the main seed equals the provided 'seed', but - this won't be true if seed=None, for example. - - TODO: validate this method - """ - self.np_random, seed = seeding.np_random(seed) - return [seed] - - def exit(self): - """ - Clean up and exit the simulation UI, if it exists. - """ - if self.sim_ui: - self.sim_ui.exit() +""" +`robot_env.py` is a module that defines the simulation environment for a robot or multiple robots. +It includes classes and protocols for defining the robot's state, actions, and +observations within the environment. 
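+It also provides optional recording of simulation states for later playback
+(see the `recording_enabled` flag and `robot_sf.render.playback_recording`).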
+
+`RobotEnv`: A class that represents the robot's environment. It inherits from `Env`
+from the `gymnasium` library, which is the base class for single-agent environments.
+It includes methods for stepping through the environment,
+resetting it, rendering it, and closing it.
+It also defines the action and observation spaces for the robot.
+"""
+
+import os
+import datetime
+from typing import Tuple, Callable, List
+from copy import deepcopy
+import pickle
+
+import loguru
+import numpy as np
+
+from gymnasium import Env
+from gymnasium.utils import seeding
+
+from robot_sf.robot.robot_state import RobotState
+from robot_sf.gym_env.env_config import EnvSettings
+from robot_sf.sensor.range_sensor import lidar_ray_scan
+
+from robot_sf.render.sim_view import (
+    SimulationView,
+    VisualizableAction,
+    VisualizableSimState)
+from robot_sf.sim.simulator import init_simulators
+from robot_sf.gym_env.reward import simple_reward
+from robot_sf.gym_env.env_util import init_collision_and_sensors, init_spaces
+
+logger = loguru.logger
+
+Vec2D = Tuple[float, float]
+PolarVec2D = Tuple[float, float]
+RobotPose = Tuple[Vec2D, float]
+
+
+class RobotEnv(Env):
+    """
+    Representing a Gymnasium environment for training a self-driving robot
+    with reinforcement learning.
+    """
+
+    def __init__(
+            self,
+            env_config: EnvSettings = EnvSettings(),
+            reward_func: Callable[[dict], float] = simple_reward,
+            debug: bool = False,
+            recording_enabled: bool = False
+            ):
+        """
+        Initialize the Robot Environment.
+
+        Parameters:
+        - env_config (EnvSettings): Configuration for environment settings.
+        - reward_func (Callable[[dict], float]): Reward function that takes
+          a dictionary as input and returns a float as reward.
+        - debug (bool): If True, enables debugging information such as
+          visualizations.
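+        - recording_enabled (bool): If True, each simulation step is stored
+          as a VisualizableSimState so the episode can be saved via
+          `save_recording` and played back later.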
+ """ + + # Environment configuration details + self.env_config = env_config + + # Extract first map definition; currently only supports using the first map + self.map_def = env_config.map_pool.choose_random_map() + + # Initialize spaces based on the environment configuration and map + self.action_space, self.observation_space, orig_obs_space = \ + init_spaces(env_config, self.map_def) + + # Assign the reward function and debug flag + self.reward_func = reward_func + self.debug = debug + + # Initialize the list to store recorded states + self.recorded_states: List[VisualizableSimState] = [] + self.recording_enabled = recording_enabled + + # Initialize simulator with a random start position + self.simulator = init_simulators( + env_config, + self.map_def, + random_start_pos=True + )[0] + + # Delta time per simulation step and maximum episode time + d_t = env_config.sim_config.time_per_step_in_secs + max_ep_time = env_config.sim_config.sim_time_in_secs + + # Initialize collision detectors and sensor data processors + occupancies, sensors = init_collision_and_sensors( + self.simulator, + env_config, + orig_obs_space + ) + + # Setup initial state of the robot + self.state = RobotState( + self.simulator.robot_navs[0], + occupancies[0], + sensors[0], + d_t, + max_ep_time) + + # Store last action executed by the robot + self.last_action = None + + # If in debug mode, create a simulation view to visualize the state + if debug: + self.sim_ui = SimulationView( + scaling=10, + map_def=self.map_def, + obstacles=self.map_def.obstacles, + robot_radius=env_config.robot_config.radius, + ped_radius=env_config.sim_config.ped_radius, + goal_radius=env_config.sim_config.goal_radius) + + # Display the simulation UI + self.sim_ui.show() + + def step(self, action): + """ + Execute one time step within the environment. + + Parameters: + - action: Action to be executed. + + Returns: + - obs: Observation after taking the action. + - reward: Calculated reward for the taken action. + - term: Boolean indicating if the episode has terminated. + - info: Additional information as dictionary. + """ + # Process the action through the simulator + action = self.simulator.robots[0].parse_action(action) + self.last_action = action + # Perform simulation step + self.simulator.step_once([action]) + # Get updated observation + obs = self.state.step() + # Fetch metadata about the current state + meta = self.state.meta_dict() + # Determine if the episode has reached terminal state + term = self.state.is_terminal + # Compute the reward using the provided reward function + reward = self.reward_func(meta) + + # if recording is enabled, record the state + if self.recording_enabled: + self.record() + + return obs, reward, term, {"step": meta["step"], "meta": meta} + + def reset(self): + """ + Reset the environment state to start a new episode. + + Returns: + - obs: The initial observation after resetting the environment. 
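+
+        If recording is enabled, the states recorded so far are written to a
+        pickle file via `save_recording` before the recording list is cleared.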
+        """
+        # Reset internal simulator state
+        self.simulator.reset_state()
+        # Reset the environment's state and return the initial observation
+        obs = self.state.reset()
+
+        # if recording is enabled, save the recording and reset the state list
+        if self.recording_enabled:
+            self.save_recording()
+
+        return obs
+
+    def _prepare_visualizable_state(self):
+        # Prepare action visualization, if any action was executed
+        action = None if not self.last_action else VisualizableAction(
+            self.simulator.robot_poses[0],
+            self.last_action,
+            self.simulator.goal_pos[0])
+
+        # Robot position and LIDAR scanning visualization preparation
+        robot_pos = self.simulator.robot_poses[0][0]
+        distances, directions = lidar_ray_scan(
+            self.simulator.robot_poses[0],
+            self.state.occupancy,
+            self.env_config.lidar_config)
+
+        # Construct ray vectors for visualization
+        ray_vecs = zip(
+            np.cos(directions) * distances,
+            np.sin(directions) * distances
+        )
+        ray_vecs_np = np.array([[
+            [robot_pos[0], robot_pos[1]],
+            [robot_pos[0] + x, robot_pos[1] + y]
+        ] for x, y in ray_vecs]
+        )
+
+        # Prepare pedestrian action visualization
+        ped_actions = zip(
+            self.simulator.pysf_sim.peds.pos(),
+            self.simulator.pysf_sim.peds.pos() +
+            self.simulator.pysf_sim.peds.vel() * 2)
+        ped_actions_np = np.array([[pos, vel] for pos, vel in ped_actions])
+
+        # Package the state for visualization
+        state = VisualizableSimState(
+            self.state.timestep, action, self.simulator.robot_poses[0],
+            deepcopy(self.simulator.ped_pos), ray_vecs_np, ped_actions_np)
+
+        return state
+
+    def render(self):
+        """
+        Render the environment visually if in debug mode.
+
+        Raises RuntimeError if debug mode is not enabled.
+        """
+        if not self.sim_ui:
+            raise RuntimeError(
+                'Debug mode is not activated! Consider setting '
+                'debug=True!')
+
+        state = self._prepare_visualizable_state()
+
+        # Execute rendering of the state through the simulation UI
+        self.sim_ui.render(state)
+
+    def record(self):
+        """
+        Records the current state as visualizable state and stores it in the list.
+        """
+        state = self._prepare_visualizable_state()
+        self.recorded_states.append(state)
+
+    def save_recording(self, filename: str = None):
+        """
+        Save the recorded states to a file.
+        filename: str, must end with *.pkl
+        Resets the recorded states list at the end.
+        """
+        if filename is None:
+            now = datetime.datetime.now()
+            filename = f'recordings/{now.strftime("%Y-%m-%d_%H-%M-%S")}.pkl'
+
+        # only save if there are recorded states
+        if len(self.recorded_states) == 0:
+            logger.warning("No states recorded, skipping save")
+            # TODO: First env.reset will always have no recorded states
+            return
+
+        os.makedirs(os.path.dirname(filename), exist_ok=True)
+
+        with open(filename, 'wb') as f: # write binary
+            pickle.dump((self.recorded_states, self.map_def), f)
+            logger.info(f"Recording saved to {filename}")
+        logger.info("Reset state list")
+        self.recorded_states = []
+
+    def seed(self, seed=None):
+        """
+        Set the seed for this env's random number generator(s).
+
+        Note:
+            Some environments use multiple pseudorandom number generators.
+            We want to capture all such seeds used in order to ensure that
+            there aren't accidental correlations between multiple generators.
+
+        Returns:
+            list: Returns the list of seeds used in this env's random
+            number generators. The first value in the list should be the
+            "main" seed, or the value which a reproducer should pass to
+            'seed'. Often, the main seed equals the provided 'seed', but
+            this won't be true if seed=None, for example.
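+
+        Note: newer Gymnasium versions seed the RNG through `reset(seed=...)`;
+        this method mirrors the legacy Gym interface.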
+
+        TODO: validate this method
+        """
+        self.np_random, seed = seeding.np_random(seed)
+        return [seed]
+
+    def exit(self):
+        """
+        Clean up and exit the simulation UI, if it exists.
+        """
+        if self.sim_ui:
+            self.sim_ui.exit()
diff --git a/robot_sf/render/playback_recording.py b/robot_sf/render/playback_recording.py
new file mode 100644
index 0000000..a3d945b
--- /dev/null
+++ b/robot_sf/render/playback_recording.py
@@ -0,0 +1,49 @@
+"""
+Play back a recorded list of states.
+"""
+import os
+import pickle
+from typing import List, Tuple
+import loguru
+from robot_sf.render.sim_view import (
+    SimulationView,
+    VisualizableSimState
+    )
+from robot_sf.nav.map_config import MapDefinition
+
+logger = loguru.logger
+
+
+def load_states(filename: str) -> Tuple[List[VisualizableSimState], MapDefinition]:
+    """
+    Load a pickled recording and return its states and map definition.
+    """
+    # Check if the file is empty
+    if os.path.getsize(filename) == 0:
+        logger.error(f"File {filename} is empty")
+        raise ValueError(f"File {filename} is empty, nothing to load")
+
+    logger.info(f"Loading states from {filename}")
+    with open(filename, 'rb') as f:  # rb = read binary
+        states, map_def = pickle.load(f)
+    logger.info(f"Loaded {len(states)} states")
+    return states, map_def
+
+def visualize_states(
+        states: List[VisualizableSimState],
+        map_def: MapDefinition
+        ):
+    """
+    Use the SimulationView to render a list of states
+    on the recorded map definition.
+    """
+    sim_view = SimulationView(map_def=map_def)
+    for state in states:
+        sim_view.render(state)
+
+def load_states_and_visualize(filename: str):
+    """
+    Load a list of states from a file and visualize them.
+    """
+    states, map_def = load_states(filename)
+    visualize_states(states, map_def)
diff --git a/robot_sf/render/sim_view.py b/robot_sf/render/sim_view.py
index 58b9521..5ea957e 100644
--- a/robot_sf/render/sim_view.py
+++ b/robot_sf/render/sim_view.py
@@ -211,6 +211,7 @@ def clear(self):
 
     def render(self, state: VisualizableSimState):
         sleep(0.01) # limit UI update rate to 100 fps
+        # TODO: make the sleep time configurable
 
         # info: event handling needs to be processed
         # in the main thread to access UI resources
diff --git a/test_pygame/README.md b/test_pygame/README.md
new file mode 100644
index 0000000..fc31028
--- /dev/null
+++ b/test_pygame/README.md
@@ -0,0 +1,3 @@
+# Pygame-specific tests that cannot be run in the CI
+
+Pygame cannot be tested in the CI because it requires a display to be present. These tests are meant to be run locally.
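+
+For example, the tests in this folder can be run locally (assuming `pytest` is
+installed in the active environment) with:
+
+```sh
+python -m pytest test_pygame/
+```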
diff --git a/test_pygame/recordings/2024-06-04_08-39-59.pkl b/test_pygame/recordings/2024-06-04_08-39-59.pkl
new file mode 100644
index 0000000..8610bca
Binary files /dev/null and b/test_pygame/recordings/2024-06-04_08-39-59.pkl differ
diff --git a/test_pygame/test_load_and_visualize_states.py b/test_pygame/test_load_and_visualize_states.py
new file mode 100644
index 0000000..d751818
--- /dev/null
+++ b/test_pygame/test_load_and_visualize_states.py
@@ -0,0 +1,16 @@
+"""
+Load a recording and play it back.
+"""
+import loguru
+
+
+from robot_sf.render.playback_recording import load_states_and_visualize
+
+logger = loguru.logger
+
+def test_load_and_visualize_states():
+    logger.info("Testing load and visualize states")
+    test_file = "test_pygame/recordings/2024-06-04_08-39-59.pkl"
+
+    # Load the states from the file
+    load_states_and_visualize(test_file)
diff --git a/tests/test_recording.py b/tests/test_recording.py
new file mode 100644
index 0000000..7186a69
--- /dev/null
+++ b/tests/test_recording.py
@@ -0,0 +1,33 @@
+import os
+import pickle
+
+from robot_sf.gym_env.robot_env import RobotEnv, VisualizableSimState
+
+def test_recording():
+    env = RobotEnv(
+        recording_enabled=True
+    )
+    env.reset()
+
+    # Run the simulation for a few timesteps
+    for _ in range(10):
+        action = env.action_space.sample()  # sample a random action from the action space
+        env.step(action)
+
+    # Trigger saving the recording (reset() writes the recorded states to disk)
+    env.reset()
+
+    # Check that the file was created
+    filename = max(
+        os.listdir('recordings'), key=lambda x: os.path.getctime(os.path.join('recordings', x)))
+    assert os.path.exists(os.path.join('recordings', filename))
+
+    # Load the recording; the file stores a (states, map_definition) tuple
+    with open(os.path.join('recordings', filename), 'rb') as f:
+        recorded_states, _map_def = pickle.load(f)
+
+    # Check that the recording has the correct length
+    assert len(recorded_states) == 10
+
+    # Check that the recorded states are instances of VisualizableSimState
+    assert all(isinstance(state, VisualizableSimState) for state in recorded_states)
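+
+    # Clean up the recording created by this test so repeated runs do not
+    # accumulate files (assumption: removing the newest recording is safe here)
+    os.remove(os.path.join('recordings', filename))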