From f11c797a69ef0aab69f3b868b9831a90b4ec7bd6 Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Mon, 23 Feb 2026 15:45:52 +0300
Subject: [PATCH 01/15] Migrate to gymnasium >= 1.0 and modernize build tooling

- Use `env.unwrapped` for pogema-specific attributes (gymnasium >= 1.0 removed Wrapper.__getattr__ forwarding)
- Replace flake8 with ruff, migrate CI to uv
- Remove stale setup.py, requirements.txt, build.sh, local_build.sh
- Misc pyproject.toml cleanup (numpy bound, classifiers, requires-python)
- Port GridConfig's root validator to pydantic v2 `model_validator` (pydantic >= 2.12.5)
---
 .github/workflows/CI.yml                  |  26 ++---
 build.sh                                  |   3 -
 local_build.sh                            |   1 -
 pogema/envs.py                            |   2 +-
 pogema/grid_config.py                     | 133 +++++++++++++---------
 pogema/integrations/make_pogema.py        |   2 +-
 pogema/integrations/pettingzoo.py         |   6 +-
 pogema/integrations/pymarl.py             |  10 +-
 pogema/integrations/sample_factory.py     |   2 +-
 pogema/svg_animation/animation_wrapper.py |  23 ++--
 pogema/wrappers/metrics.py                |  22 ++--
 pogema/wrappers/multi_time_limit.py       |   4 +-
 pogema/wrappers/persistence.py            |  20 ++--
 pyproject.toml                            |  53 +++++++++
 requirements.txt                          |   6 -
 setup.py                                  |  53 ---------
 tests/test_grid.py                        |   4 +-
 tests/test_integrations.py                |   6 +-
 tests/test_pogema_env.py                  |  12 +-
 19 files changed, 198 insertions(+), 190 deletions(-)
 delete mode 100644 build.sh
 delete mode 100644 local_build.sh
 create mode 100644 pyproject.toml
 delete mode 100644 requirements.txt
 delete mode 100644 setup.py

diff --git a/.github/workflows/CI.yml b/.github/workflows/CI.yml
index 7e9132b..b04db17 100644
--- a/.github/workflows/CI.yml
+++ b/.github/workflows/CI.yml
@@ -16,25 +16,17 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version: ["3.8", "3.9", "3.10", "3.11", "3.12"]
+        python-version: ["3.10", "3.11", "3.12", "3.13", "3.14"]
 
     steps:
-    - uses: actions/checkout@v2
+    - uses: actions/checkout@v4
+    - name: Install uv
+      uses: astral-sh/setup-uv@v4
     - name: Set up Python ${{ matrix.python-version }}
-      uses: actions/setup-python@v2
-      with:
-        python-version: ${{ matrix.python-version }}
+      run: uv python install ${{ matrix.python-version }}
     - name: Install dependencies
-      run: |
-        python -m pip install --upgrade pip
-        python -m pip install flake8 pytest
-        if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
-    - name: Lint with flake8
-      run: |
-        # stop the build if there are Python syntax errors or undefined names
-        flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics
-        # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
-        flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
+      run: uv sync --extra test --extra dev
+    - name: Lint with ruff
+      run: uv run ruff check .
     - name: Test with pytest
-      run: |
-        PYTHONPATH=. pytest -s
+      run: uv run pytest -s
diff --git a/build.sh b/build.sh
deleted file mode 100644
index b1024db..0000000
--- a/build.sh
+++ /dev/null
@@ -1,3 +0,0 @@
-rm -rf dist/
-python3 -m build
-python3 -m twine upload dist/*
diff --git a/local_build.sh b/local_build.sh
deleted file mode 100644
index ddcd346..0000000
--- a/local_build.sh
+++ /dev/null
@@ -1 +0,0 @@
-pip3 install --no-cache-dir .
\ No newline at end of file
diff --git a/pogema/envs.py b/pogema/envs.py
index c7c5d74..dd4d1c9 100644
--- a/pogema/envs.py
+++ b/pogema/envs.py
@@ -464,7 +464,7 @@ def _make_pogema(grid_config):
         raise KeyError(f'Unknown on_target option: {grid_config.on_target}')
 
     env = MultiTimeLimit(env, grid_config.max_episode_steps)
-    if env.grid_config.persistent:
+    if grid_config.persistent:
         env = PersistentWrapper(env)
     else:
         # adding metrics wrappers
diff --git a/pogema/grid_config.py b/pogema/grid_config.py
index 77cf63e..ff18c23 100644
--- a/pogema/grid_config.py
+++ b/pogema/grid_config.py
@@ -1,13 +1,13 @@
 import sys
 from typing import Optional, Union
-from pydantic import validator, root_validator
+from pydantic import validator, model_validator
 
 from pogema.utils import CommonSettings
 
 from typing_extensions import Literal
 
 
-class GridConfig(CommonSettings, ):
+class GridConfig(CommonSettings):
     on_target: Literal['finish', 'nothing', 'restart'] = 'finish'
     seed: Optional[int] = None
     width: Optional[int] = None
@@ -24,52 +31,69 @@ class GridConfig(CommonSettings, ):
     persistent: bool = False
     observation_type: Literal['POMAPF', 'MAPF', 'default'] = 'default'
     map: Optional[Union[list, str]] = None
-
     map_name: Optional[str] = None
-
-    integration: Literal['SampleFactory', 'PyMARL', 'rllib', 'gymnasium', 'PettingZoo'] = None
+    integration: Optional[Literal['SampleFactory', 'PyMARL', 'rllib', 'gymnasium', 'PettingZoo']] = None
     max_episode_steps: int = 64
     auto_reset: Optional[bool] = None
 
-    @root_validator
-    def validate_dimensions_and_positions(cls, values):
-        width_provided = values.get('width') is not None
-        height_provided = values.get('height') is not None
-        
+    @model_validator(mode='after')
+    def validate_dimensions_and_positions(cls, model):
+        # Use getattr for safe access, with default fallback
+        width = getattr(model, 'width', None)
+        height = getattr(model, 'height', None)
+        size = getattr(model, 'size', 8)
+
+        width_provided = width is not None and width > 0
+        height_provided = height is not None and height > 0
+
         if width_provided and not height_provided:
-            raise ValueError("Invalid dimension configuration. Please provide height.")
-        elif not width_provided and height_provided:
-            raise ValueError("Invalid dimension configuration. Please provide width.")
-        
+            raise ValueError("Invalid dimension configuration: width provided but height missing.")
+        if height_provided and not width_provided:
+            raise ValueError("Invalid dimension configuration: height provided but width missing.")
+
         if not width_provided and not height_provided:
-            values['width'] = values.get('size', 8)
-            values['height'] = values.get('size', 8)
-        if 'size' not in values or values.get('size') != max(values.get('width'), values.get('height')):
-            values['size'] = max(values.get('width'), values.get('height'))
-        
-
-        width = values.get('width')
-        height = values.get('height')
-        
-        if width is not None and height is not None:
-            agents_xy = values.get('agents_xy')
-            if agents_xy is not None:
-                cls.check_positions(agents_xy, width, height)
-
-            targets_xy = values.get('targets_xy')
-            if targets_xy is not None:
-                first_element = targets_xy[0]
-                if isinstance(first_element[0], (list, tuple)):
-                    for agent_goals in targets_xy:
-                        cls.check_positions(agent_goals, width, height)
-                else:
-                    cls.check_positions(targets_xy, width, height)
-        
-        return values
+            fallback_size = size if size >= 2 else 8
+            width = fallback_size
+            height = fallback_size
+
+        if width <= 0:
+            width = 8
+        if height <= 0:
+            height = 8
+
+        size = max(width, height, 2)
+
+        setattr(model, 'width', width)
+        setattr(model, 'height', height)
+        setattr(model, 'size', size)
+
+        if not (1 <= width <= 4096):
+            raise ValueError(f"width must be in [1, 4096], got {width}")
+        if not (1 <= height <= 4096):
+            raise ValueError(f"height must be in [1, 4096], got {height}")
+        if not (2 <= size <= 4096):
+            raise ValueError(f"size must be in [2, 4096], got {size}")
+
+        # Validate positions
+        agents_xy = getattr(model, 'agents_xy', None)
+        targets_xy = getattr(model, 'targets_xy', None)
+
+        if agents_xy is not None:
+            cls.check_positions(agents_xy, width, height)
+
+        if targets_xy is not None:
+            first_element = targets_xy[0]
+            if isinstance(first_element[0], (list, tuple)):
+                for agent_goals in targets_xy:
+                    cls.check_positions(agent_goals, width, height)
+            else:
+                cls.check_positions(targets_xy, width, height)
+
+        return model
 
     @validator('seed')
     def seed_initialization(cls, v):
-        assert v is None or (0 <= v < sys.maxsize), "seed must be in [0, " + str(sys.maxsize) + ']'
+        assert v is None or (0 <= v < sys.maxsize), f"seed must be in [0, {sys.maxsize})"
         return v
 
     @staticmethod
@@ -99,7 +123,7 @@ def density_restrictions(cls, v):
         return v
 
     @validator('agents_xy')
-    def agents_xy_validation(cls, v, values):
+    def agents_xy_validation(cls, v):
         if v is not None:
             if not isinstance(v, (list, tuple)):
                 raise ValueError("agents_xy must be a list")
@@ -115,11 +139,11 @@ def targets_xy_validation(cls, v, values):
         if v is not None:
             if not v or not isinstance(v, (list, tuple)):
                 raise ValueError("targets_xy must be a list")
-            
+
             first_element = v[0]
             if not isinstance(first_element, (list, tuple)):
                 raise ValueError("Invalid targets_xy format")
-            
+
             if isinstance(first_element[0], (list, tuple)):
                 for agent_goals in v:
                     if not isinstance(agent_goals, (list, tuple)) or len(agent_goals) < 2:
@@ -132,7 +156,10 @@ def targets_xy_validation(cls, v, values):
             else:
                 on_target = values.get('on_target', 'finish')
                 if on_target == 'restart':
-                    raise ValueError("on_target='restart' requires goal sequences, not single goals. Use format: targets_xy: [[[x1,y1],[x2,y2]], [[x3,y3],[x4,y4]]]")
+                    raise ValueError(
+                        "on_target='restart' requires goal sequences, not single goals. "
+                        "Use format: targets_xy: [[[x1,y1],[x2,y2]], [[x3,y3],[x4,y4]]]"
+                    )
                 for position in v:
                     if not isinstance(position, (list, tuple)) or len(position) != 2:
                         raise ValueError("Position must be a list/tuple of length 2")
@@ -188,14 +215,14 @@ def map_validation(cls, v, values):
                     'targets_xy') is None) and possible_agents_xy and possible_targets_xy:
                 values['possible_agents_xy'] = possible_agents_xy
                 values['possible_targets_xy'] = possible_targets_xy
-        
+
         height = len(v)
         width = 0
         area = 0
         for line in v:
             width = max(width, len(line))
             area += len(line)
-        
+
         values['size'] = max(width, height)
         values['width'] = width
         values['height'] = height
@@ -203,13 +230,13 @@ def map_validation(cls, v, values):
 
         return v
 
-    @validator('possible_agents_xy')
-    def possible_agents_xy_validation(cls, v):
-        return v
-
-    @validator('possible_targets_xy')
-    def possible_targets_xy_validation(cls, v):
-        return v
+    # @validator('possible_agents_xy')
+    # def possible_agents_xy_validation(cls, v):
+    #     return v
+    #
+    # @validator('possible_targets_xy')
+    # def possible_targets_xy_validation(cls, v):
+    #     return v
 
     @staticmethod
     def str_map_to_list(str_map, free, obstacle):
@@ -266,7 +293,7 @@ def str_map_to_list(str_map, free, obstacle):
 
     def update_config(self, **kwargs):
         current_values = self.dict()
-        
+
         if 'size' in kwargs:
             current_values.pop('width', None)
             current_values.pop('height', None)
@@ -274,6 +301,6 @@ def update_config(self, **kwargs):
             current_values.pop('size', None)
         current_values.update(kwargs)
         new_instance = GridConfig(**current_values)
-        
+
         for field_name, field_value in new_instance.__dict__.items():
             setattr(self, field_name, field_value)
diff --git a/pogema/integrations/make_pogema.py b/pogema/integrations/make_pogema.py
index 83a8b46..9e64901 100644
--- a/pogema/integrations/make_pogema.py
+++ b/pogema/integrations/make_pogema.py
@@ -26,7 +26,7 @@ class SingleAgentWrapper(Wrapper):
 
     def step(self, action):
         observations, rewards, terminated, truncated, infos = self.env.step(
-            [action] + [self.env.action_space.sample() for _ in range(self.get_num_agents() - 1)])
+            [action] + [self.env.action_space.sample() for _ in range(self.unwrapped.get_num_agents() - 1)])
         return observations[0], rewards[0], terminated[0], truncated[0], infos[0]
 
     def reset(self, seed: Optional[int] = None, return_info: bool = True, options: Optional[dict] = None, ):
diff --git a/pogema/integrations/pettingzoo.py b/pogema/integrations/pettingzoo.py
index 41a8792..b2166bd 100644
--- a/pogema/integrations/pettingzoo.py
+++ b/pogema/integrations/pettingzoo.py
@@ -12,13 +12,13 @@ def parallel_env(grid_config: GridConfig = GridConfig()):
 class PogemaParallel:
 
     def state(self):
-        return self.pogema.get_state()
+        return self.pogema.unwrapped.get_state()
 
     def __init__(self, grid_config: GridConfig, render_mode='ansi'):
         self.metadata = {'render_modes': ['ansi'], "name": "pogema"}
         self.render_mode = render_mode
         self.pogema = _make_pogema(grid_config)
-        self.possible_agents = ["player_" + str(r) for r in range(self.pogema.get_num_agents())]
+        self.possible_agents = ["player_" + str(r) for r in range(self.pogema.unwrapped.get_num_agents())]
         self.agent_name_mapping = dict(zip(self.possible_agents, list(range(len(self.possible_agents)))))
         self.agents = None
         self.num_moves = None
@@ -58,7 +58,7 @@ def step(self, actions):
         d_infos = {agent: infos[anm[agent]] for agent in self.agents}
 
         for agent, idx in anm.items():
-            if (not self.pogema.grid.is_active[idx] or all(truncated) or all(terminated)) and agent in self.agents:
+            if (not self.pogema.unwrapped.grid.is_active[idx] or all(truncated) or all(terminated)) and agent in self.agents:
                 self.agents.remove(agent)
 
         return d_observations, d_rewards, d_terminated, d_truncated, d_infos
diff --git a/pogema/integrations/pymarl.py b/pogema/integrations/pymarl.py
index 5a9ec87..f28d6e2 100644
--- a/pogema/integrations/pymarl.py
+++ b/pogema/integrations/pymarl.py
@@ -15,7 +15,7 @@ def __init__(self, grid_config, mh_distance=False):
         self._observations, _ = self.env.reset()
         self.max_episode_steps = gc.max_episode_steps
         self.episode_limit = gc.max_episode_steps
-        self.n_agents = self.env.get_num_agents()
+        self.n_agents = self.env.unwrapped.get_num_agents()
 
         self.spec = None
 
@@ -43,14 +43,14 @@ def get_obs_size(self):
         return len(np.array(self._observations[0]).flatten())
 
     def get_state(self):
-        return self.env.get_state()
+        return self.env.unwrapped.get_state()
 
     def get_state_size(self):
         return len(self.get_state())
 
     def get_avail_actions(self):
         actions = []
-        for i in range(self.env.get_num_agents()):
+        for i in range(self.env.unwrapped.get_num_agents()):
             actions.append(self.get_avail_agent_actions(i))
         return actions
 
@@ -64,7 +64,7 @@ def get_total_actions():
         return 5
 
     def reset(self):
-        self._grid_config = self.env.grid_config
+        self._grid_config = self.env.unwrapped.grid_config
         self._observations, _ = self.env.reset()
         return np.array(self._observations).flatten()
 
@@ -91,4 +91,4 @@ def close(self):
         return
 
     def sample_actions(self):
-        return self.env.sample_actions()
+        return self.env.unwrapped.sample_actions()
diff --git a/pogema/integrations/sample_factory.py b/pogema/integrations/sample_factory.py
index 1152aff..94b6de9 100644
--- a/pogema/integrations/sample_factory.py
+++ b/pogema/integrations/sample_factory.py
@@ -11,7 +11,7 @@ def __init__(self, env):
 
     @property
     def num_agents(self):
-        return self.get_num_agents()
+        return self.unwrapped.get_num_agents()
 
 
 class MetricsForwardingWrapper(Wrapper):
diff --git a/pogema/svg_animation/animation_wrapper.py b/pogema/svg_animation/animation_wrapper.py
index adaa88d..ed7aa33 100644
--- a/pogema/svg_animation/animation_wrapper.py
+++ b/pogema/svg_animation/animation_wrapper.py
@@ -1,6 +1,6 @@
 import os
 from itertools import cycle
-from gymnasium import logger, Wrapper
+from gymnasium import Wrapper
 
 from pogema import GridConfig
 from pogema.svg_animation.animation_drawer import AnimationConfig, SvgSettings, GridHolder, AnimationDrawer
@@ -13,7 +13,7 @@ class AnimationMonitor(Wrapper):
     """
 
     def __init__(self, env, animation_config=AnimationConfig()):
-        self._working_radius = env.grid_config.obs_radius - 1
+        self._working_radius = env.unwrapped.grid_config.obs_radius - 1
         env = PersistentWrapper(env, xy_offset=-self._working_radius)
 
         super().__init__(env)
@@ -43,11 +43,10 @@ def step(self, action):
             if save_tau:
                 if (self._episode_idx + 1) % save_tau or save_tau == 1:
                     if not os.path.exists(self.animation_config.directory):
-                        logger.info(f"Creating pogema monitor directory {self.animation_config.directory}", )
                         os.makedirs(self.animation_config.directory, exist_ok=True)
 
                     path = os.path.join(self.animation_config.directory,
-                                        self.pick_name(self.grid_config, self._episode_idx))
+                                        self.pick_name(self.unwrapped.grid_config, self._episode_idx))
                     self.save_animation(path)
 
         return obs, reward, terminated, truncated, info
@@ -96,23 +95,23 @@ def save_animation(self, name='render.svg', animation_config: AnimationConfig =
         """
         wr = self._working_radius
         if wr > 0:
-            obstacles = self.env.get_obstacles(ignore_borders=False)[wr:-wr, wr:-wr]
+            obstacles = self.unwrapped.get_obstacles(ignore_borders=False)[wr:-wr, wr:-wr]
         else:
-            obstacles = self.env.get_obstacles(ignore_borders=False)
+            obstacles = self.unwrapped.get_obstacles(ignore_borders=False)
         history: list[list[AgentState]] = self.env.decompress_history(self.history)
 
         svg_settings = SvgSettings()
         colors_cycle = cycle(svg_settings.colors)
-        agents_colors = {index: next(colors_cycle) for index in range(self.grid_config.num_agents)}
+        agents_colors = {index: next(colors_cycle) for index in range(self.unwrapped.grid_config.num_agents)}
 
-        for agent_idx in range(self.grid_config.num_agents):
+        for agent_idx in range(self.unwrapped.grid_config.num_agents):
             history[agent_idx].append(history[agent_idx][-1])
 
         episode_length = len(history[0])
         # Change episode length for egocentric environment
-        if animation_config.egocentric_idx is not None and self.grid_config.on_target == 'finish':
+        if animation_config.egocentric_idx is not None and self.unwrapped.grid_config.on_target == 'finish':
             episode_length = history[animation_config.egocentric_idx][-1].step + 1
-            for agent_idx in range(self.grid_config.num_agents):
+            for agent_idx in range(self.unwrapped.grid_config.num_agents):
                 history[agent_idx] = history[agent_idx][:episode_length]
 
         grid_holder = GridHolder(
@@ -120,8 +119,8 @@ def save_animation(self, name='render.svg', animation_config: AnimationConfig =
             obstacles=obstacles,
             episode_length=episode_length,
             history=history,
-            obs_radius=self.grid_config.obs_radius,
-            on_target=self.grid_config.on_target,
+            obs_radius=self.unwrapped.grid_config.obs_radius,
+            on_target=self.unwrapped.grid_config.on_target,
             colors=agents_colors,
             config=animation_config,
             svg_settings=svg_settings
diff --git a/pogema/wrappers/metrics.py b/pogema/wrappers/metrics.py
index c684411..6d09c19 100644
--- a/pogema/wrappers/metrics.py
+++ b/pogema/wrappers/metrics.py
@@ -16,7 +16,7 @@ def step(self, action):
         obs, reward, terminated, truncated, infos = self.env.step(action)
         finished = all(truncated) or all(terminated)
 
-        metric = self._compute_stats(self._current_step, self.was_on_goal, finished)
+        metric = self._compute_stats(self._current_step, self.unwrapped.was_on_goal, finished)
         self._current_step += 1
         if finished:
             self._current_step = 0
@@ -40,7 +40,7 @@ def _compute_stats(self, step, is_on_goal, finished):
             if on_goal:
                 self._solved_instances += 1
         if finished:
-            result = {'avg_throughput': self._solved_instances / self.grid_config.max_episode_steps}
+            result = {'avg_throughput': self._solved_instances / self.unwrapped.grid_config.max_episode_steps}
             self._solved_instances = 0
             return result
 
@@ -56,7 +56,7 @@ class NonDisappearISRMetric(AbstractMetric):
 
     def _compute_stats(self, step, is_on_goal, finished):
         if finished:
-            return {'ISR': float(sum(is_on_goal)) / self.get_num_agents()}
+            return {'ISR': float(sum(is_on_goal)) / self.unwrapped.get_num_agents()}
 
 
 class NonDisappearEpLengthMetric(AbstractMetric):
@@ -69,7 +69,7 @@ def _compute_stats(self, step, is_on_goal, finished):
 class EpLengthMetric(AbstractMetric):
     def __init__(self, env):
         super().__init__(env)
-        self._solve_time = [None for _ in range(self.get_num_agents())]
+        self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
 
     def _compute_stats(self, step, is_on_goal, finished):
         for idx, on_goal in enumerate(is_on_goal):
@@ -78,8 +78,8 @@ def _compute_stats(self, step, is_on_goal, finished):
                     self._solve_time[idx] = step
 
         if finished:
-            result = {'ep_length': sum(self._solve_time) / self.get_num_agents() + 1}
-            self._solve_time = [None for _ in range(self.get_num_agents())]
+            result = {'ep_length': sum(self._solve_time) / self.unwrapped.get_num_agents() + 1}
+            self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
             return result
 
 
@@ -91,7 +91,7 @@ def __init__(self, env):
     def _compute_stats(self, step, is_on_goal, finished):
         self._solved_instances += sum(is_on_goal)
         if finished:
-            results = {'CSR': float(self._solved_instances == self.get_num_agents())}
+            results = {'CSR': float(self._solved_instances == self.unwrapped.get_num_agents())}
             self._solved_instances = 0
             return results
 
@@ -104,7 +104,7 @@ def __init__(self, env):
     def _compute_stats(self, step, is_on_goal, finished):
         self._solved_instances += sum(is_on_goal)
         if finished:
-            results = {'ISR': self._solved_instances / self.get_num_agents()}
+            results = {'ISR': self._solved_instances / self.unwrapped.get_num_agents()}
             self._solved_instances = 0
             return results
 
@@ -112,7 +112,7 @@ def _compute_stats(self, step, is_on_goal, finished):
 class SumOfCostsAndMakespanMetric(AbstractMetric):
     def __init__(self, env):
         super().__init__(env)
-        self._solve_time = [None for _ in range(self.get_num_agents())]
+        self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
 
     def _compute_stats(self, step, is_on_goal, finished):
         for idx, on_goal in enumerate(is_on_goal):
@@ -122,8 +122,8 @@ def _compute_stats(self, step, is_on_goal, finished):
                 self._solve_time[idx] = None
 
         if finished:
-            result = {'SoC': sum(self._solve_time) + self.get_num_agents(), 'makespan': max(self._solve_time) + 1}
-            self._solve_time = [None for _ in range(self.get_num_agents())]
+            result = {'SoC': sum(self._solve_time) + self.unwrapped.get_num_agents(), 'makespan': max(self._solve_time) + 1}
+            self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
             return result
 
 
diff --git a/pogema/wrappers/multi_time_limit.py b/pogema/wrappers/multi_time_limit.py
index b120f71..13c9cc9 100644
--- a/pogema/wrappers/multi_time_limit.py
+++ b/pogema/wrappers/multi_time_limit.py
@@ -6,11 +6,11 @@ def step(self, action):
         observation, reward, terminated, truncated, info = self.env.step(action)
         self._elapsed_steps += 1
         if self._elapsed_steps >= self._max_episode_steps:
-            truncated = [True] * self.get_num_agents()
+            truncated = [True] * self.unwrapped.get_num_agents()
         return observation, reward, terminated, truncated, info
 
     def set_elapsed_steps(self, elapsed_steps):
-        if not self.grid_config.persistent:
+        if not self.unwrapped.grid_config.persistent:
             raise ValueError("Cannot set elapsed steps for non-persistent environment!")
         assert elapsed_steps >= 0
         self._elapsed_steps = elapsed_steps
diff --git a/pogema/wrappers/persistence.py b/pogema/wrappers/persistence.py
index 33df9aa..6658eef 100644
--- a/pogema/wrappers/persistence.py
+++ b/pogema/wrappers/persistence.py
@@ -40,8 +40,8 @@ def __init__(self, env, xy_offset=None):
     def step(self, action):
         result = self.env.step(action)
         self._step += 1
-        for agent_idx in range(self.get_num_agents()):
-            agent_state = self._get_agent_state(self.grid, agent_idx)
+        for agent_idx in range(self.unwrapped.get_num_agents()):
+            agent_state = self._get_agent_state(self.unwrapped.grid, agent_idx)
             if agent_state != self._agent_states[agent_idx][-1]:
                 self._agent_states[agent_idx].append(agent_state)
 
@@ -51,19 +51,19 @@ def step_back(self):
         if self._step <= 0:
             return False
         self._step -= 1
-        self.set_elapsed_steps(self._step)
-        for idx in reversed(range(self.get_num_agents())):
+        self.env.set_elapsed_steps(self._step)
+        for idx in reversed(range(self.unwrapped.get_num_agents())):
 
             if self._step < self._agent_states[idx][-1].step:
                 self._agent_states[idx].pop()
                 state = self._agent_states[idx][-1]
 
                 if state.active:
-                    self.grid.show_agent(idx)
+                    self.unwrapped.grid.show_agent(idx)
                 else:
-                    self.grid.hide_agent(idx)
-                self.grid.move_agent_to_cell(idx, state.x, state.y)
-                self.grid.finishes_xy[idx] = state.tx, state.ty
+                    self.unwrapped.grid.hide_agent(idx)
+                self.unwrapped.grid.move_agent_to_cell(idx, state.x, state.y)
+                self.unwrapped.grid.finishes_xy[idx] = state.tx, state.ty
 
         return True
 
@@ -84,8 +84,8 @@ def reset(self, **kwargs):
         self._step = 0
 
         self._agent_states = []
-        for agent_idx in range(self.get_num_agents()):
-            self._agent_states.append([self._get_agent_state(self.grid, agent_idx)])
+        for agent_idx in range(self.unwrapped.get_num_agents()):
+            self._agent_states.append([self._get_agent_state(self.unwrapped.grid, agent_idx)])
 
         return result
 
diff --git a/pyproject.toml b/pyproject.toml
new file mode 100644
index 0000000..64962e6
--- /dev/null
+++ b/pyproject.toml
@@ -0,0 +1,53 @@
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+
+[project]
+name = "pogema"
+description = "Partially Observable Grid Environment for Multiple Agents"
+readme = "README.md"
+requires-python = ">=3.10,<3.15"
+license = {text = "MIT"}
+authors = [{name = "Alexey Skrynnik", email = "skrynnikalexey@gmail.com"}]
+dynamic = ["version"]
+classifiers = [
+    "Development Status :: 4 - Beta",
+    "License :: OSI Approved :: MIT License",
+    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
+    "Programming Language :: Python :: 3.13",
+    "Programming Language :: Python :: 3.14",
+    "Topic :: Scientific/Engineering :: Artificial Intelligence",
+    "Intended Audience :: Science/Research",
+]
+dependencies = [
+    "gymnasium>=1.2.3",
+    "numpy>=2.0",
+    "pydantic>=2.12.5",
+    "pettingzoo==1.23.1"
+]
+urls = { "Homepage" = "https://github.com/Cognitive-AI-Systems/pogema" }
+
+[project.optional-dependencies]
+test = ["pytest", "pytest-cov", "tabulate"]
+dev = ["ruff"]
+
+[tool.hatch.version]
+path = "pogema/__init__.py"
+
+[tool.hatch.build.targets.wheel]
+packages = ["pogema"]
+
+[tool.hatch.build.targets.sdist]
+include = ["pogema"]
+
+[tool.pytest.ini_options]
+testpaths = ["tests"]
+
+[tool.ruff]
+line-length = 127
+
+[tool.ruff.lint]
+select = ["E", "F"]
+ignore = []
diff --git a/requirements.txt b/requirements.txt
deleted file mode 100644
index 07c5376..0000000
--- a/requirements.txt
+++ /dev/null
@@ -1,6 +0,0 @@
-numpy>1.23.5,<=1.26.4
-pydantic>=1.8.2,<=1.9.1
-pytest>=6.2.5,<=7.1.2
-pettingzoo==1.23.1
-tabulate>=0.8.7,<=0.8.10
-gymnasium==0.28.1
diff --git a/setup.py b/setup.py
deleted file mode 100644
index 81c3327..0000000
--- a/setup.py
+++ /dev/null
@@ -1,53 +0,0 @@
-import codecs
-import os
-import re
-
-from setuptools import setup, find_packages
-
-cur_dir = os.path.abspath(os.path.dirname(__file__))
-with open(os.path.join(cur_dir, 'README.md'), 'rb') as f:
-    lines = [x.decode('utf-8') for x in f.readlines()]
-    lines = ''.join([re.sub('^<.*>\n$', '', x) for x in lines])
-    long_description = lines
-
-
-def read(*parts):
-    with codecs.open(os.path.join(cur_dir, *parts), 'r') as fp:
-        return fp.read()
-
-
-def find_version(*file_paths):
-    version_file = read(*file_paths)
-    version_match = re.search(
-        r"^__version__ = ['\"]([^'\"]*)['\"]",
-        version_file,
-        re.M,
-    )
-    if version_match:
-        return version_match.group(1)
-
-    raise RuntimeError("Unable to find version string.")
-
-
-setup(
-    name='pogema',
-    author='Alexey Skrynnik',
-    license='MIT',
-    version=find_version("pogema", "__init__.py"),
-    description='Partially Observable Grid Environment for Multiple Agents',
-    long_description=long_description,
-    long_description_content_type='text/markdown',
-    url='https://github.com/Cognitive-AI-Systems/pogema',
-    install_requires=[
-        "gymnasium==0.28.1",
-        "numpy>1.23.5,<=1.26.4",
-        "pydantic>=1.8.2,<=1.9.1",
-    ],
-    extras_require={
-
-    },
-    package_dir={'': './'},
-    packages=find_packages(where='./', include='pogema*'),
-    include_package_data=True,
-    python_requires=">=3.8,<3.13"
-)
diff --git a/tests/test_grid.py b/tests/test_grid.py
index f8c5c8f..653112b 100644
--- a/tests/test_grid.py
+++ b/tests/test_grid.py
@@ -181,8 +181,8 @@ def test_custom_starts_and_finishes_random():
     env = pogema_v0(grid_config=grid_config)
     env.reset()
     r = grid_config.obs_radius
-    assert [(x - r, y - r) for x, y in env.grid.positions_xy] == agents_xy and \
-           [(x - r, y - r) for x, y in env.grid.finishes_xy] == targets_xy
+    assert [(x - r, y - r) for x, y in env.unwrapped.grid.positions_xy] == agents_xy and \
+           [(x - r, y - r) for x, y in env.unwrapped.grid.finishes_xy] == targets_xy
 
 
 def test_out_of_bounds_for_custom_positions():
diff --git a/tests/test_integrations.py b/tests/test_integrations.py
index 146a05a..3e727ed 100644
--- a/tests/test_integrations.py
+++ b/tests/test_integrations.py
@@ -23,15 +23,15 @@ def test_sample_factory_integration():
     env = pogema_v0(GridConfig(seed=7, num_agents=4, size=12, integration='SampleFactory'))
     env.reset()
 
-    assert env.num_agents == 4
-    assert env.is_multiagent is True
+    assert env.unwrapped.get_num_agents() == 4
+    assert env.env.is_multiagent is True
 
     # testing auto-reset wrapper
     for _ in range(2):
         dones = [False]
         infos = None
         while True:
-            _, _, terminated, truncated, infos = env.step(env.sample_actions())
+            _, _, terminated, truncated, infos = env.step(env.unwrapped.sample_actions())
             if all(terminated) or all(truncated):
                 break
 
diff --git a/tests/test_pogema_env.py b/tests/test_pogema_env.py
index ad81170..02720e5 100644
--- a/tests/test_pogema_env.py
+++ b/tests/test_pogema_env.py
@@ -60,7 +60,7 @@ def run_episode(grid_config=None, env=None):
 
     results = [[obs, rewards, terminated, truncated, infos]]
     while True:
-        results.append(env.step(env.sample_actions()))
+        results.append(env.step(env.unwrapped.sample_actions()))
         terminated, truncated = results[-1][2], results[-1][3]
         if all(terminated) or all(truncated):
             break
@@ -182,8 +182,8 @@ def test_custom_positions_and_num_agents():
         gc.num_agents = num_agents
         env = pogema_v0(grid_config=gc)
         env.reset()
-        assert num_agents == len(env.get_agents_xy())
-        assert num_agents == len(env.get_targets_xy())
+        assert num_agents == len(env.unwrapped.get_agents_xy())
+        assert num_agents == len(env.unwrapped.get_targets_xy())
 
 
 def test_custom_positions_and_empty_num_agents():
@@ -198,7 +198,7 @@ def test_custom_positions_and_empty_num_agents():
     )
     env = pogema_v0(grid_config=gc)
     env.reset()
-    assert len(gc.agents_xy) == len(env.get_agents_xy())
+    assert len(gc.agents_xy) == len(env.unwrapped.get_agents_xy())
 
 
 def test_persistent_env(num_steps=100):
@@ -217,7 +217,7 @@ def state_repr(observations, rewards, terminates, truncates, infos):
         return np.concatenate([np.array(observations).flatten(), terminates, truncates, np.array(rewards), ])
 
     for current_step in range(num_steps):
-        actions = action_sampler.sample_actions(dim=env.get_num_agents())
+        actions = action_sampler.sample_actions(dim=env.unwrapped.get_num_agents())
         obs, reward, terminated, truncated, info = env.step(actions)
 
         first_run_observations.append(state_repr(obs, reward, terminated, truncated, info))
@@ -233,7 +233,7 @@ def state_repr(observations, rewards, terminates, truncates, infos):
 
     second_run_observations = []
     for current_step in range(num_steps):
-        actions = action_sampler.sample_actions(dim=env.get_num_agents())
+        actions = action_sampler.sample_actions(dim=env.unwrapped.get_num_agents())
         obs, reward, terminated, truncated, info = env.step(actions)
         second_run_observations.append(state_repr(obs, reward, terminated, truncated, info))
         assert np.isclose(first_run_observations[current_step], second_run_observations[current_step]).all()

From 6fc985f616977e0b78236dafd6bdf3a82c585354 Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Mon, 23 Feb 2026 16:37:33 +0300
Subject: [PATCH 02/15] Migrate GridConfig validators to pydantic v2 and fix
 ruff lint errors

---
 pogema/a_star_policy.py                  |   2 +-
 pogema/generator.py                      |   3 +-
 pogema/grid_config.py                    | 175 ++++++++++++-----------
 pogema/svg_animation/animation_drawer.py |   3 +-
 pyproject.toml                           |   4 +-
 tests/test_grid.py                       |  14 +-
 tests/test_integrations.py               |   8 +-
 tests/test_pogema_env.py                 |   4 +-
 8 files changed, 109 insertions(+), 104 deletions(-)

diff --git a/pogema/a_star_policy.py b/pogema/a_star_policy.py
index f143601..0b41a96 100644
--- a/pogema/a_star_policy.py
+++ b/pogema/a_star_policy.py
@@ -99,7 +99,7 @@ def __init__(self, seed=0):
         self._rnd = np.random.default_rng(seed)
 
     def act(self, obs):
-        xy, target_xy, obstacles, agents = obs['xy'], obs['target_xy'], obs['obstacles'], obs['agents']
+        xy, target_xy, obstacles, _ = obs['xy'], obs['target_xy'], obs['obstacles'], obs['agents']
 
 
         if self._saved_xy is not None and h(self._saved_xy, xy) > 1:
diff --git a/pogema/generator.py b/pogema/generator.py
index cb0e3f4..c45b21d 100644
--- a/pogema/generator.py
+++ b/pogema/generator.py
@@ -104,7 +104,8 @@ def placing(order, components, grid, start_id, num_agents):
     return positions_xy, finishes_xy
 
 def generate_from_possible_positions(grid_config: GridConfig):
-    if len(grid_config.possible_agents_xy) < grid_config.num_agents or len(grid_config.possible_targets_xy) < grid_config.num_agents:
+    if (len(grid_config.possible_agents_xy) < grid_config.num_agents or
+            len(grid_config.possible_targets_xy) < grid_config.num_agents):
         raise OverflowError(f"Can't create task. Not enough possible positions for {grid_config.num_agents} agents.")
     rng = np.random.default_rng(grid_config.seed)
     rng.shuffle(grid_config.possible_agents_xy)
diff --git a/pogema/grid_config.py b/pogema/grid_config.py
index ff18c23..c3c055b 100644
--- a/pogema/grid_config.py
+++ b/pogema/grid_config.py
@@ -1,15 +1,6 @@
 import sys
 from typing import Optional, Union
-from pydantic import validator, root_validator
-from pydantic import BaseModel, model_validator
-
-from pogema.utils import CommonSettings
-
-from typing_extensions import Literal
-
-import sys
-from typing import Optional, Union
-from pydantic import validator, model_validator
+from pydantic import field_validator, model_validator
 from pogema.utils import CommonSettings
 from typing_extensions import Literal
 
@@ -36,12 +27,62 @@ class GridConfig(CommonSettings):
     max_episode_steps: int = 64
     auto_reset: Optional[bool] = None
 
+    @model_validator(mode='before')
+    @classmethod
+    def process_map_and_defaults(cls, data):
+        if isinstance(data, dict):
+            # Process string map into list and extract agents/targets
+            map_val = data.get('map')
+            if map_val is not None and isinstance(map_val, str):
+                free = CommonSettings().FREE
+                obstacle = CommonSettings().OBSTACLE
+                map_val, agents_xy, targets_xy, possible_agents_xy, possible_targets_xy = cls.str_map_to_list(
+                    map_val, free, obstacle
+                )
+                if agents_xy and targets_xy and data.get('agents_xy') is not None and data.get(
+                        'targets_xy') is not None:
+                    raise KeyError("""Can't create task. Please provide agents_xy and targets_xy only once.
+                Either with parameters or with a map.""")
+                if (agents_xy or targets_xy) and (possible_agents_xy or possible_targets_xy):
+                    raise KeyError("""Can't create task. Mark either possible locations or precise ones.""")
+                elif agents_xy and targets_xy:
+                    data['agents_xy'] = agents_xy
+                    data['targets_xy'] = targets_xy
+                    data['num_agents'] = len(agents_xy)
+                elif (data.get('agents_xy') is None or data.get(
+                        'targets_xy') is None) and possible_agents_xy and possible_targets_xy:
+                    data['possible_agents_xy'] = possible_agents_xy
+                    data['possible_targets_xy'] = possible_targets_xy
+
+                data['map'] = map_val
+
+            # Compute map-derived dimensions
+            if map_val is not None and not isinstance(map_val, str):
+                height = len(map_val)
+                width = 0
+                area = 0
+                for line in map_val:
+                    width = max(width, len(line))
+                    area += len(line)
+                data['size'] = max(width, height)
+                data['width'] = width
+                data['height'] = height
+                data['density'] = sum([sum(line) for line in map_val]) / area
+
+            # Default num_agents
+            if data.get('num_agents') is None:
+                if data.get('agents_xy'):
+                    data['num_agents'] = len(data['agents_xy'])
+                else:
+                    data['num_agents'] = 1
+
+        return data
+
     @model_validator(mode='after')
-    def validate_dimensions_and_positions(cls, model):
-        # Use getattr for safe access, with default fallback
-        width = getattr(model, 'width', None)
-        height = getattr(model, 'height', None)
-        size = getattr(model, 'size', 8)
+    def validate_dimensions_and_positions(self):
+        width = self.width
+        height = self.height
+        size = self.size
 
         width_provided = width is not None and width > 0
         height_provided = height is not None and height > 0
@@ -63,9 +104,9 @@ def validate_dimensions_and_positions(cls, model):
 
         size = max(width, height, 2)
 
-        setattr(model, 'width', width)
-        setattr(model, 'height', height)
-        setattr(model, 'size', size)
+        self.width = width
+        self.height = height
+        self.size = size
 
         if not (1 <= width <= 4096):
             raise ValueError(f"width must be in [1, 4096], got {width}")
@@ -75,23 +116,24 @@ def validate_dimensions_and_positions(cls, model):
             raise ValueError(f"size must be in [2, 4096], got {size}")
 
         # Validate positions
-        agents_xy = getattr(model, 'agents_xy', None)
-        targets_xy = getattr(model, 'targets_xy', None)
+        agents_xy = self.agents_xy
+        targets_xy = self.targets_xy
 
         if agents_xy is not None:
-            cls.check_positions(agents_xy, width, height)
+            self.check_positions(agents_xy, width, height)
 
         if targets_xy is not None:
             first_element = targets_xy[0]
             if isinstance(first_element[0], (list, tuple)):
                 for agent_goals in targets_xy:
-                    cls.check_positions(agent_goals, width, height)
+                    self.check_positions(agent_goals, width, height)
             else:
-                cls.check_positions(targets_xy, width, height)
+                self.check_positions(targets_xy, width, height)
 
-        return model
+        return self
 
-    @validator('seed')
+    @field_validator('seed')
+    @classmethod
     def seed_initialization(cls, v):
         assert v is None or (0 <= v < sys.maxsize), f"seed must be in [0, {sys.maxsize}]"
         return v
@@ -105,24 +147,29 @@ def _validate_dimension(v, field_name):
                 assert 1 <= v <= 4096, f"{field_name} must be in [1, 4096]"
         return v
 
-    @validator('size')
+    @field_validator('size')
+    @classmethod
     def size_restrictions(cls, v):
         return cls._validate_dimension(v, 'size')
 
-    @validator('width')
+    @field_validator('width')
+    @classmethod
     def width_restrictions(cls, v):
         return cls._validate_dimension(v, 'width')
 
-    @validator('height')
+    @field_validator('height')
+    @classmethod
     def height_restrictions(cls, v):
         return cls._validate_dimension(v, 'height')
 
-    @validator('density')
+    @field_validator('density')
+    @classmethod
     def density_restrictions(cls, v):
         assert 0.0 <= v <= 1, "density must be in [0, 1]"
         return v
 
-    @validator('agents_xy')
+    @field_validator('agents_xy')
+    @classmethod
     def agents_xy_validation(cls, v):
         if v is not None:
             if not isinstance(v, (list, tuple)):
@@ -134,8 +181,9 @@ def agents_xy_validation(cls, v):
                     raise ValueError("Position coordinates must be integers")
         return v
 
-    @validator('targets_xy')
-    def targets_xy_validation(cls, v, values):
+    @field_validator('targets_xy')
+    @classmethod
+    def targets_xy_validation(cls, v, info):
         if v is not None:
             if not v or not isinstance(v, (list, tuple)):
                 raise ValueError("targets_xy must be a list")
@@ -154,7 +202,7 @@ def targets_xy_validation(cls, v, values):
                         if not all(isinstance(coord, int) for coord in position):
                             raise ValueError("Position coordinates must be integers")
             else:
-                on_target = values.get('on_target', 'finish')
+                on_target = info.data.get('on_target', 'finish')
                 if on_target == 'restart':
                     raise ValueError(
                         "on_target='restart' requires goal sequences, not single goals. "
@@ -178,66 +226,27 @@ def check_positions(v, width, height):
             if not (0 <= x < height and 0 <= y < width):
                 raise IndexError(f"Position is out of bounds! {position} is not in [{0}, {height}] x [{0}, {width}]")
 
-
-    @validator('num_agents', always=True)
-    def num_agents_must_be_positive(cls, v, values):
-        if v is None:
-            if values['agents_xy']:
-                v = len(values['agents_xy'])
-            else:
-                v = 1
+    @field_validator('num_agents')
+    @classmethod
+    def num_agents_must_be_positive(cls, v):
         assert 1 <= v <= 10000000, "num_agents must be in [1, 10000000]"
         return v
 
-    @validator('obs_radius')
+    @field_validator('obs_radius')
+    @classmethod
     def obs_radius_must_be_positive(cls, v):
         assert 1 <= v <= 128, "obs_radius must be in [1, 128]"
         return v
 
-    @validator('map', always=True)
-    def map_validation(cls, v, values):
+    @field_validator('map')
+    @classmethod
+    def map_validation(cls, v):
         if v is None:
             return None
-        if isinstance(v, str):
-            v, agents_xy, targets_xy, possible_agents_xy, possible_targets_xy = cls.str_map_to_list(v, values['FREE'],
-                                                                                                    values['OBSTACLE'])
-            if agents_xy and targets_xy and values.get('agents_xy') is not None and values.get(
-                    'targets_xy') is not None:
-                raise KeyError("""Can't create task. Please provide agents_xy and targets_xy only once.
-                Either with parameters or with a map.""")
-            if (agents_xy or targets_xy) and (possible_agents_xy or possible_targets_xy):
-                raise KeyError("""Can't create task. Mark either possible locations or precise ones.""")
-            elif agents_xy and targets_xy:
-                values['agents_xy'] = agents_xy
-                values['targets_xy'] = targets_xy
-                values['num_agents'] = len(agents_xy)
-            elif (values.get('agents_xy') is None or values.get(
-                    'targets_xy') is None) and possible_agents_xy and possible_targets_xy:
-                values['possible_agents_xy'] = possible_agents_xy
-                values['possible_targets_xy'] = possible_targets_xy
-
-        height = len(v)
-        width = 0
-        area = 0
-        for line in v:
-            width = max(width, len(line))
-            area += len(line)
-
-        values['size'] = max(width, height)
-        values['width'] = width
-        values['height'] = height
-        values['density'] = sum([sum(line) for line in v]) / area
-
+        # String maps are already processed in model_validator(mode='before')
+        # At this point v should be a list
         return v
 
-    # @validator('possible_agents_xy')
-    # def possible_agents_xy_validation(cls, v):
-    #     return v
-    #
-    # @validator('possible_targets_xy')
-    # def possible_targets_xy_validation(cls, v):
-    #     return v
-
     @staticmethod
     def str_map_to_list(str_map, free, obstacle):
         obstacles = []
@@ -292,7 +301,7 @@ def str_map_to_list(str_map, free, obstacle):
         return obstacles, agents_xy, targets_xy, possible_agents_xy, possible_targets_xy
 
     def update_config(self, **kwargs):
-        current_values = self.dict()
+        current_values = self.model_dump()
 
         if 'size' in kwargs:
             current_values.pop('width', None)
diff --git a/pogema/svg_animation/animation_drawer.py b/pogema/svg_animation/animation_drawer.py
index 5ccf37d..ff19ae1 100644
--- a/pogema/svg_animation/animation_drawer.py
+++ b/pogema/svg_animation/animation_drawer.py
@@ -84,7 +84,8 @@ def render(self):
              width="{scaled_width}" height="{scaled_height}" viewBox="{" ".join(map(str, view_box))}">'''
 
         definitions = f'''
-        <rect id="obstacle" width="{self.svg_settings.r * 2}" height="{self.svg_settings.r * 2}" fill="{self.svg_settings.obstacle_color}" rx="{self.svg_settings.rx}"/>
+        <rect id="obstacle" width="{self.svg_settings.r * 2}" height="{self.svg_settings.r * 2}" 
+            fill="{self.svg_settings.obstacle_color}" rx="{self.svg_settings.rx}"/>
         <style>
         .line {{stroke: {self.svg_settings.obstacle_color}; stroke-width: {self.svg_settings.stroke_width};}}
         .agent {{r: {self.svg_settings.r};}}
diff --git a/pyproject.toml b/pyproject.toml
index 64962e6..bc282a6 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -25,13 +25,13 @@ dependencies = [
     "gymnasium>=1.2.3",
     "numpy>=2.0",
     "pydantic>=2.12.5",
-    "pettingzoo==1.23.1"
+    "pettingzoo>=1.24.0,<1.25.0"
 ]
 urls = { "Homepage" = "https://github.com/Cognitive-AI-Systems/pogema" }
 
 [project.optional-dependencies]
 test = ["pytest", "pytest-cov", "tabulate"]
-dev = ["ruff"]
+dev = ["ruff", "pytest", "pytest-cov", "tabulate"]
 
 [tool.hatch.version]
 path = "pogema/__init__.py"
diff --git a/tests/test_grid.py b/tests/test_grid.py
index 653112b..23d7220 100644
--- a/tests/test_grid.py
+++ b/tests/test_grid.py
@@ -412,21 +412,21 @@ def test_pogema_lifelong_with_sequences():
     )
     
     env = PogemaLifeLong(grid_config=config)
-    obs = env.reset()
+    env.reset()
     
-    assert env.has_custom_sequences == True
+    assert env.has_custom_sequences is True
     assert np.isclose(env.current_goal_indices, [0, 0]).all()
     
     with warnings.catch_warnings(record=True) as w:
         warnings.simplefilter("always")
         
-        target1 = env._generate_new_target(0)
+        env._generate_new_target(0)
         assert np.isclose(env.current_goal_indices[0], 1)
         
-        target2 = env._generate_new_target(0)
+        env._generate_new_target(0)
         assert np.isclose(env.current_goal_indices[0], 2)
         
-        target3 = env._generate_new_target(0)
+        env._generate_new_target(0)
         assert np.isclose(env.current_goal_indices[0], 0)
         
         cycling_warnings = [warning for warning in w if "completed all 3 provided targets" in str(warning.message)]
@@ -477,9 +477,9 @@ def test_pogema_lifelong_without_sequences():
     )
     
     env = PogemaLifeLong(grid_config=config)
-    obs = env.reset()
+    env.reset()
     
-    assert env.has_custom_sequences == False
+    assert env.has_custom_sequences is False
     
     target = env._generate_new_target(0)
     assert isinstance(target, tuple)
diff --git a/tests/test_integrations.py b/tests/test_integrations.py
index 3e727ed..5719751 100644
--- a/tests/test_integrations.py
+++ b/tests/test_integrations.py
@@ -28,8 +28,7 @@ def test_sample_factory_integration():
 
     # testing auto-reset wrapper
     for _ in range(2):
-        dones = [False]
-        infos = None
+
         while True:
             _, _, terminated, truncated, infos = env.step(env.unwrapped.sample_actions())
             if all(terminated) or all(truncated):
@@ -101,8 +100,7 @@ def test_single_agent_gym_integration():
 
 
 def test_petting_zoo():
-    from pettingzoo.test import api_test, parallel_api_test, render_test
-    # from pettingzoo.test import render_test
+    from pettingzoo.test import api_test, parallel_api_test
 
     gc = GridConfig(num_agents=16, size=16, integration='PettingZoo')
 
@@ -115,7 +113,5 @@ def env(grid_config: GridConfig = GridConfig(num_agents=20, size=16)):
             return parallel_to_aec(pogema_v0(grid_config))
 
         api_test(env(gc), num_cycles=1000, verbose_progress=True)
-        # todo fix this
-        # render_test(lambda: pogema_v0(gc))
     except ImportError:
         pass
diff --git a/tests/test_pogema_env.py b/tests/test_pogema_env.py
index 02720e5..78b9231 100644
--- a/tests/test_pogema_env.py
+++ b/tests/test_pogema_env.py
@@ -1,8 +1,6 @@
-import re
 import time
 
 import numpy as np
-import pytest
 from tabulate import tabulate
 
 from pogema import pogema_v0, AnimationMonitor
@@ -122,7 +120,7 @@ def test_gym_pogema_animation():
                                                 on_target='finish'))
     env = AnimationMonitor(env)
     env.reset()
-    done = False
+
     while True:
         _, _, terminated, truncated, _ = env.step(env.action_space.sample())
         if terminated or truncated:

From beb45313e1111cbd8a8c20aba7c238eb28998d3d Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sat, 28 Feb 2026 13:40:02 +0300
Subject: [PATCH 03/15] Remove PyMARL integration; add PogemaWrapper base
 class with explicit method forwarding (wrappers/base.py); AnimationWrapper
 with enable/disable/save API and zero overhead when inactive; 'soft'
 collision_system by default; border trimming for terminal render

---
 .github/workflows/CI.yml                  |   2 +-
 pogema/__init__.py                        |  10 +-
 pogema/envs.py                            |  39 ++++---
 pogema/grid.py                            |  23 +++-
 pogema/grid_config.py                     |   4 +-
 pogema/integrations/make_pogema.py        |  16 +--
 pogema/integrations/pymarl.py             |  94 ----------------
 pogema/integrations/sample_factory.py     |   8 +-
 pogema/svg_animation/animation_wrapper.py | 121 +++++++--------------
 pogema/wrappers/base.py                   |  92 ++++++++++++++++
 pogema/wrappers/metrics.py                |   9 +-
 pogema/wrappers/multi_time_limit.py       |  19 +++-
 pogema/wrappers/persistence.py            |  40 +++----
 tests/test_integrations.py                |  43 +-------
 tests/test_pogema_env.py                  | 127 +++++++++++++++++++++-
 version_history.MD                        |   2 +-
 16 files changed, 356 insertions(+), 293 deletions(-)
 delete mode 100644 pogema/integrations/pymarl.py
 create mode 100644 pogema/wrappers/base.py

diff --git a/.github/workflows/CI.yml b/.github/workflows/CI.yml
index b04db17..7480784 100644
--- a/.github/workflows/CI.yml
+++ b/.github/workflows/CI.yml
@@ -5,7 +5,7 @@ name: CI
 
 on:
   push:
-    branches: [ main, dev]
+    branches: [ main, dev, pogema-2.0]
   pull_request:
     branches: [ main, dev]
 
diff --git a/pogema/__init__.py b/pogema/__init__.py
index f61b743..1b77cb9 100644
--- a/pogema/__init__.py
+++ b/pogema/__init__.py
@@ -1,8 +1,12 @@
 from gymnasium import register
 from pogema.grid_config import GridConfig
 from pogema.integrations.make_pogema import pogema_v0
-from pogema.svg_animation.animation_wrapper import AnimationMonitor, AnimationConfig
+from pogema.svg_animation.animation_wrapper import AnimationMonitor
+from pogema.svg_animation.animation_drawer import AnimationConfig
 from pogema.a_star_policy import AStarAgent, BatchAStarAgent
+from pogema.wrappers.base import PogemaWrapper
+from pogema.wrappers.animation import AnimationWrapper
+from pogema.wrappers.persistence import PersistentWrapper
 
 __version__ = '1.4.0'
 
@@ -10,7 +14,9 @@
     'GridConfig',
     'pogema_v0',
     'AStarAgent', 'BatchAStarAgent',
-    "AnimationMonitor", "AnimationConfig",
+    "PogemaWrapper",
+    "AnimationWrapper",
+    "PersistentWrapper",
 ]
 
 register(
diff --git a/pogema/envs.py b/pogema/envs.py
index dd4d1c9..0f03883 100644
--- a/pogema/envs.py
+++ b/pogema/envs.py
@@ -10,7 +10,7 @@
     NonDisappearCSRMetric, NonDisappearISRMetric, EpLengthMetric, ISRMetric, CSRMetric, SumOfCostsAndMakespanMetric
 from pogema.wrappers.multi_time_limit import MultiTimeLimit
 from pogema.generator import generate_new_target, generate_from_possible_targets
-from pogema.wrappers.persistence import PersistentWrapper
+from pogema.wrappers.animation import AnimationWrapper
 
 
 class ActionsSampler:
@@ -464,22 +464,29 @@ def _make_pogema(grid_config):
         raise KeyError(f'Unknown on_target option: {grid_config.on_target}')
 
     env = MultiTimeLimit(env, grid_config.max_episode_steps)
+    env = AnimationWrapper(env)
+
     if grid_config.persistent:
-        env = PersistentWrapper(env)
+        warnings.warn(
+            "GridConfig.persistent is deprecated. Use env.enable_animation() instead.",
+            DeprecationWarning,
+            stacklevel=3,
+        )
+        env.enable_animation()
+
+    # adding metrics wrappers
+    if grid_config.on_target == 'restart':
+        env = LifeLongAverageThroughputMetric(env)
+    elif grid_config.on_target == 'nothing':
+        env = NonDisappearISRMetric(env)
+        env = NonDisappearCSRMetric(env)
+        env = NonDisappearEpLengthMetric(env)
+        env = SumOfCostsAndMakespanMetric(env)
+    elif grid_config.on_target == 'finish':
+        env = ISRMetric(env)
+        env = CSRMetric(env)
+        env = EpLengthMetric(env)
     else:
-        # adding metrics wrappers
-        if grid_config.on_target == 'restart':
-            env = LifeLongAverageThroughputMetric(env)
-        elif grid_config.on_target == 'nothing':
-            env = NonDisappearISRMetric(env)
-            env = NonDisappearCSRMetric(env)
-            env = NonDisappearEpLengthMetric(env)
-            env = SumOfCostsAndMakespanMetric(env)
-        elif grid_config.on_target == 'finish':
-            env = ISRMetric(env)
-            env = CSRMetric(env)
-            env = EpLengthMetric(env)
-        else:
-            raise KeyError(f'Unknown on_target option: {grid_config.on_target}')
+        raise KeyError(f'Unknown on_target option: {grid_config.on_target}')
 
     return env
diff --git a/pogema/grid.py b/pogema/grid.py
index 604b861..63aef77 100644
--- a/pogema/grid.py
+++ b/pogema/grid.py
@@ -215,8 +215,27 @@ def get_square_target(self, agent_id):
         result[c.obs_radius - dx, c.obs_radius - dy] = 1
         return result.astype(np.float32)
 
-    def render(self, mode='human'):
-        render_grid(self.obstacles, self.positions_xy, self.finishes_xy, self.is_active, mode=mode)
+    def render(self, mode='human', border='thin'):
+        gc = self.config
+        r = gc.obs_radius
+
+        if border == 'none':
+            trim = r
+        elif border == 'full':
+            trim = 0
+        else:
+            trim = max(r - 1, 0)
+
+        if trim == 0:
+            obs = self.obstacles.copy()
+            agents = deepcopy(self.positions_xy)
+            targets = deepcopy(self.finishes_xy)
+        else:
+            obs = self.obstacles[trim:-trim, trim:-trim].copy()
+            agents = [[x - trim, y - trim] for x, y in self.positions_xy]
+            targets = [[x - trim, y - trim] for x, y in self.finishes_xy]
+
+        render_grid(obs, agents, targets, self.is_active, mode=mode)
 
     def move_agent_to_cell(self, agent_id, x, y):
         if self.positions[self.positions_xy[agent_id]] == self.config.FREE:
diff --git a/pogema/grid_config.py b/pogema/grid_config.py
index c3c055b..f537d7b 100644
--- a/pogema/grid_config.py
+++ b/pogema/grid_config.py
@@ -18,12 +18,12 @@ class GridConfig(CommonSettings):
     num_agents: Optional[int] = None
     possible_agents_xy: Optional[list] = None
     possible_targets_xy: Optional[list] = None
-    collision_system: Literal['block_both', 'priority', 'soft'] = 'priority'
+    collision_system: Literal['block_both', 'priority', 'soft'] = 'soft'
     persistent: bool = False
     observation_type: Literal['POMAPF', 'MAPF', 'default'] = 'default'
     map: Optional[Union[list, str]] = None
     map_name: Optional[str] = None
-    integration: Optional[Literal['SampleFactory', 'PyMARL', 'rllib', 'gymnasium', 'PettingZoo']] = None
+    integration: Optional[Literal['SampleFactory', 'gymnasium', 'PettingZoo']] = None
     max_episode_steps: int = 64
     auto_reset: Optional[bool] = None
 
diff --git a/pogema/integrations/make_pogema.py b/pogema/integrations/make_pogema.py
index 9e64901..9bc37b4 100644
--- a/pogema/integrations/make_pogema.py
+++ b/pogema/integrations/make_pogema.py
@@ -1,11 +1,9 @@
 from typing import Union, Optional
 
-from gymnasium import Wrapper
-
 from pogema import GridConfig
+from pogema.wrappers.base import PogemaWrapper
 from pogema.envs import _make_pogema
 from pogema.integrations.pettingzoo import parallel_env
-from pogema.integrations.pymarl import PyMarlPogema
 from pogema.integrations.sample_factory import AutoResetWrapper, IsMultiAgentWrapper, MetricsForwardingWrapper
 
 
@@ -18,11 +16,7 @@ def _make_sample_factory_integration(grid_config):
     return env
 
 
-def _make_py_marl_integration(grid_config, *_, **__):
-    return PyMarlPogema(grid_config)
-
-
-class SingleAgentWrapper(Wrapper):
+class SingleAgentWrapper(PogemaWrapper):
 
     def step(self, action):
         observations, rewards, terminated, truncated, infos = self.env.step(
@@ -44,7 +38,7 @@ def make_single_agent_gym(grid_config: Union[GridConfig, dict] = GridConfig()):
     return env
 
 
-def make_pogema(grid_config: Union[GridConfig, dict] = GridConfig(), *args, **kwargs):
+def make_pogema(grid_config: Union[GridConfig, dict] = GridConfig(), *args, **kwargs) -> PogemaWrapper:
     if isinstance(grid_config, dict):
         grid_config = GridConfig(**grid_config)
 
@@ -55,10 +49,6 @@ def make_pogema(grid_config: Union[GridConfig, dict] = GridConfig(), *args, **kw
         return _make_pogema(grid_config)
     elif grid_config.integration == 'SampleFactory':
         return _make_sample_factory_integration(grid_config)
-    elif grid_config.integration == 'PyMARL':
-        return _make_py_marl_integration(grid_config, *args, **kwargs)
-    elif grid_config.integration == 'rllib':
-        raise NotImplementedError('Please use PettingZoo integration for rllib')
     elif grid_config.integration == 'PettingZoo':
         return parallel_env(grid_config)
     elif grid_config.integration == 'gymnasium':
diff --git a/pogema/integrations/pymarl.py b/pogema/integrations/pymarl.py
deleted file mode 100644
index f28d6e2..0000000
--- a/pogema/integrations/pymarl.py
+++ /dev/null
@@ -1,94 +0,0 @@
-import numpy as np
-
-from pogema import GridConfig
-from pogema.envs import _make_pogema
-
-
-class PyMarlPogema:
-
-    def __init__(self, grid_config, mh_distance=False):
-        gc = grid_config
-        self._grid_config: GridConfig = gc
-
-        self.env = _make_pogema(grid_config)
-        self._mh_distance = mh_distance
-        self._observations, _ = self.env.reset()
-        self.max_episode_steps = gc.max_episode_steps
-        self.episode_limit = gc.max_episode_steps
-        self.n_agents = self.env.unwrapped.get_num_agents()
-
-        self.spec = None
-
-    @property
-    def unwrapped(self):
-        return self
-
-    def step(self, actions):
-        self._observations, rewards, terminated, truncated, infos = self.env.step(actions)
-        info = {}
-        done = all(terminated) or all(truncated)
-        if done:
-            for key, value in infos[0]['metrics'].items():
-                info[key] = value
-            
-        return sum(rewards), done, info
-
-    def get_obs(self):
-        return np.array([self.get_obs_agent(agent_id) for agent_id in range(self.n_agents)])
-
-    def get_obs_agent(self, agent_id):
-        return np.array(self._observations[agent_id]).flatten()
-
-    def get_obs_size(self):
-        return len(np.array(self._observations[0]).flatten())
-
-    def get_state(self):
-        return self.env.unwrapped.get_state()
-
-    def get_state_size(self):
-        return len(self.get_state())
-
-    def get_avail_actions(self):
-        actions = []
-        for i in range(self.env.unwrapped.get_num_agents()):
-            actions.append(self.get_avail_agent_actions(i))
-        return actions
-
-    # noinspection PyUnusedLocal
-    @staticmethod
-    def get_avail_agent_actions(agent_id):
-        return list(range(5))
-
-    @staticmethod
-    def get_total_actions():
-        return 5
-
-    def reset(self):
-        self._grid_config = self.env.unwrapped.grid_config
-        self._observations, _ = self.env.reset()
-        return np.array(self._observations).flatten()
-
-    def save_replay(self):
-        return
-
-    def render(self, *args, **kwargs):
-        return self.env.render(*args, **kwargs)
-
-    def get_env_info(self):
-        env_info = {"state_shape": self.get_state_size(),
-                    "obs_shape": self.get_obs_size(),
-                    "n_actions": self.get_total_actions(),
-                    "n_agents": self.n_agents,
-                    "episode_limit": self.episode_limit,
-                    }
-        return env_info
-
-    @staticmethod
-    def get_stats():
-        return {}
-
-    def close(self):
-        return
-
-    def sample_actions(self):
-        return self.env.unwrapped.sample_actions()
diff --git a/pogema/integrations/sample_factory.py b/pogema/integrations/sample_factory.py
index 94b6de9..44564c0 100644
--- a/pogema/integrations/sample_factory.py
+++ b/pogema/integrations/sample_factory.py
@@ -1,9 +1,9 @@
 from copy import deepcopy
 
-from gymnasium import Wrapper
+from pogema.wrappers.base import PogemaWrapper
 
 
-class IsMultiAgentWrapper(Wrapper):
+class IsMultiAgentWrapper(PogemaWrapper):
     def __init__(self, env):
         super().__init__(env)
 
@@ -14,7 +14,7 @@ def num_agents(self):
         return self.unwrapped.get_num_agents()
 
 
-class MetricsForwardingWrapper(Wrapper):
+class MetricsForwardingWrapper(PogemaWrapper):
     def step(self, action):
 
         observations, rewards, terminated, truncated, infos = self.env.step(action)
@@ -24,7 +24,7 @@ def step(self, action):
         return observations, rewards, terminated, truncated, infos
 
 
-class AutoResetWrapper(Wrapper):
+class AutoResetWrapper(PogemaWrapper):
     def step(self, action):
         observations, rewards, terminated, truncated, infos = self.env.step(action)
         if all(terminated) or all(truncated):
diff --git a/pogema/svg_animation/animation_wrapper.py b/pogema/svg_animation/animation_wrapper.py
index ed7aa33..338d49b 100644
--- a/pogema/svg_animation/animation_wrapper.py
+++ b/pogema/svg_animation/animation_wrapper.py
@@ -1,36 +1,44 @@
 import os
-from itertools import cycle
-from gymnasium import Wrapper
+import warnings
 
 from pogema import GridConfig
-from pogema.svg_animation.animation_drawer import AnimationConfig, SvgSettings, GridHolder, AnimationDrawer
-from pogema.wrappers.persistence import PersistentWrapper, AgentState
+from pogema.svg_animation.animation_drawer import AnimationConfig
+from pogema.wrappers.base import PogemaWrapper
+from pogema.wrappers.animation import AnimationWrapper
 
 
-class AnimationMonitor(Wrapper):
+def _find_animation_wrapper(env):
+    wrapper = env
+    while wrapper is not None:
+        if isinstance(wrapper, AnimationWrapper):
+            return wrapper
+        wrapper = getattr(wrapper, 'env', None)
+    return None
+
+
+class AnimationMonitor(PogemaWrapper):
     """
-    Defines the animation, which saves the episode as SVG.
+    Deprecated: Use env.enable_animation() instead.
     """
 
     def __init__(self, env, animation_config=AnimationConfig()):
-        self._working_radius = env.unwrapped.grid_config.obs_radius - 1
-        env = PersistentWrapper(env, xy_offset=-self._working_radius)
-
+        warnings.warn(
+            "AnimationMonitor is deprecated. Use env.enable_animation(animation_config) "
+            "and env.save_animation(name) instead.",
+            DeprecationWarning,
+            stacklevel=2,
+        )
         super().__init__(env)
-
-        self.history = env.get_history()
-
-        self.svg_settings: SvgSettings = SvgSettings()
         self.animation_config: AnimationConfig = animation_config
-
         self._episode_idx = 0
 
+        aw = _find_animation_wrapper(self.env)
+        if aw is not None:
+            aw.enable_animation(animation_config)
+        else:
+            raise RuntimeError("No AnimationWrapper found in the wrapper chain.")
+
     def step(self, action):
-        """
-        Saves information about the episode.
-        :param action: current actions
-        :return: obs, reward, done, info
-        """
         obs, reward, terminated, truncated, info = self.env.step(action)
 
         multi_agent_terminated = isinstance(terminated, (list, tuple)) and all(terminated)
@@ -53,13 +61,6 @@ def step(self, action):
 
     @staticmethod
     def pick_name(grid_config: GridConfig, episode_idx=None, zfill_ep=5):
-        """
-        Picks a name for the SVG file.
-        :param grid_config: configuration of the grid
-        :param episode_idx: idx of the episode
-        :param zfill_ep: zfill for the episode number
-        :return:
-        """
         gc = grid_config
         name = 'pogema'
         if episode_idx is not None:
@@ -74,65 +75,19 @@ def pick_name(grid_config: GridConfig, episode_idx=None, zfill_ep=5):
         return name + '.svg'
 
     def reset(self, **kwargs):
-        """
-        Resets the environment and resets the current positions of agents and targets
-        :param kwargs:
-        :return: obs: observation
-        """
         obs = self.env.reset(**kwargs)
-
         self._episode_idx += 1
-        self.history = self.env.get_history()
-
         return obs
 
-    def save_animation(self, name='render.svg', animation_config: AnimationConfig = AnimationConfig()):
-        """
-        Saves the animation.
-        :param name: name of the file
-        :param animation_config: animation configuration
-        :return: None
-        """
-        wr = self._working_radius
-        if wr > 0:
-            obstacles = self.unwrapped.get_obstacles(ignore_borders=False)[wr:-wr, wr:-wr]
-        else:
-            obstacles = self.unwrapped.get_obstacles(ignore_borders=False)
-        history: list[list[AgentState]] = self.env.decompress_history(self.history)
-
-        svg_settings = SvgSettings()
-        colors_cycle = cycle(svg_settings.colors)
-        agents_colors = {index: next(colors_cycle) for index in range(self.unwrapped.grid_config.num_agents)}
-
-        for agent_idx in range(self.unwrapped.grid_config.num_agents):
-            history[agent_idx].append(history[agent_idx][-1])
-
-        episode_length = len(history[0])
-        # Change episode length for egocentric environment
-        if animation_config.egocentric_idx is not None and self.unwrapped.grid_config.on_target == 'finish':
-            episode_length = history[animation_config.egocentric_idx][-1].step + 1
-            for agent_idx in range(self.unwrapped.grid_config.num_agents):
-                history[agent_idx] = history[agent_idx][:episode_length]
-
-        grid_holder = GridHolder(
-            width=len(obstacles), height=len(obstacles[0]),
-            obstacles=obstacles,
-            episode_length=episode_length,
-            history=history,
-            obs_radius=self.unwrapped.grid_config.obs_radius,
-            on_target=self.unwrapped.grid_config.on_target,
-            colors=agents_colors,
-            config=animation_config,
-            svg_settings=svg_settings
-        )
-
-        animation = AnimationDrawer().create_animation(grid_holder)
-        with open(name, "w") as f:
-            f.write(animation.render())
+    def save_animation(self, name='render.svg', animation_config=None):
+        if animation_config is None:
+            animation_config = self.animation_config
+        aw = _find_animation_wrapper(self.env)
+        aw.save_animation(name, animation_config=animation_config)
 
 
 def main():
-    from pogema import GridConfig, pogema_v0, AnimationMonitor, BatchAStarAgent, AnimationConfig
+    from pogema import GridConfig, pogema_v0, BatchAStarAgent
 
     for egocentric_idx in [0, 1]:
         for on_target in ['nothing', 'restart', 'finish']:
@@ -148,7 +103,7 @@ def main():
                                      max_episode_steps=16,
                                      density=0.1, map=grid, observation_type="POMAPF")
             env = pogema_v0(grid_config=grid_config)
-            env = AnimationMonitor(env, AnimationConfig(save_every_idx_episode=None))
+            env.enable_animation()
 
             obs, _ = env.reset()
             truncated = terminated = [False]
@@ -164,10 +119,12 @@ def main():
             env.save_animation(f'{anim_folder}/anim-{on_target}.svg')
             env.save_animation(f'{anim_folder}/anim-{on_target}-ego-{egocentric_idx}.svg',
                                AnimationConfig(egocentric_idx=egocentric_idx))
-            env.save_animation(f'{anim_folder}/anim-static.svg', AnimationConfig(static=True))
-            env.save_animation(f'{anim_folder}/anim-static-ego.svg', AnimationConfig(egocentric_idx=0, static=True))
+            env.save_animation(f'{anim_folder}/anim-static.svg', AnimationConfig(static_frame_idx=0))
+            env.save_animation(f'{anim_folder}/anim-static-ego.svg',
+                               AnimationConfig(egocentric_idx=0, static_frame_idx=0))
             env.save_animation(f'{anim_folder}/anim-static-no-agents.svg',
-                               AnimationConfig(show_agents=False, static=True))
+                               AnimationConfig(show_agents=False, static_frame_idx=0))
+            env.disable_animation()
 
 
 if __name__ == '__main__':
diff --git a/pogema/wrappers/base.py b/pogema/wrappers/base.py
new file mode 100644
index 0000000..65a4045
--- /dev/null
+++ b/pogema/wrappers/base.py
@@ -0,0 +1,92 @@
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import numpy as np
+from gymnasium import Wrapper
+
+if TYPE_CHECKING:
+    from pogema.grid import Grid
+    from pogema.grid_config import GridConfig
+
+_POGEMA_FORWARDED = frozenset({
+    # PogemaBase methods
+    'get_num_agents', 'get_obstacles', 'get_agents_xy', 'get_targets_xy',
+    'get_state', 'get_agents_xy_relative', 'get_targets_xy_relative',
+    'sample_actions',
+    # PogemaBase attributes
+    'grid_config', 'grid', 'was_on_goal',
+    # PogemaLifeLong
+    'get_lifelong_targets_xy',
+    # AnimationWrapper
+    'enable_animation', 'disable_animation', 'save_animation', 'animation_is_active',
+})
+
+
+class PogemaWrapper(Wrapper):
+    env: PogemaWrapper
+
+    # -- Gymnasium overrides with multi-agent types --
+
+    def step(self, action) -> tuple[list, list[float], list[bool], list[bool], list[dict]]:
+        return self.env.step(action)
+
+    def reset(self, **kwargs) -> tuple[list, list[dict]]:
+        return self.env.reset(**kwargs)
+
+    # -- PogemaBase methods --
+
+    def get_num_agents(self) -> int:
+        return self.env.get_num_agents()
+
+    def get_obstacles(self, ignore_borders: bool = False) -> np.ndarray:
+        return self.env.get_obstacles(ignore_borders=ignore_borders)
+
+    def get_agents_xy(self, only_active: bool = False, ignore_borders: bool = False) -> list:
+        return self.env.get_agents_xy(only_active=only_active, ignore_borders=ignore_borders)
+
+    def get_targets_xy(self, only_active: bool = False, ignore_borders: bool = False) -> list:
+        return self.env.get_targets_xy(only_active=only_active, ignore_borders=ignore_borders)
+
+    def get_state(self, ignore_borders: bool = False, as_dict: bool = False):
+        return self.env.get_state(ignore_borders=ignore_borders, as_dict=as_dict)
+
+    def get_agents_xy_relative(self) -> list:
+        return self.env.get_agents_xy_relative()
+
+    def get_targets_xy_relative(self) -> list:
+        return self.env.get_targets_xy_relative()
+
+    def sample_actions(self) -> np.ndarray:
+        return self.env.sample_actions()
+
+    # -- PogemaBase attributes --
+
+    @property
+    def grid_config(self) -> GridConfig:
+        return self.unwrapped.grid_config
+
+    @property
+    def grid(self) -> Grid:
+        return self.unwrapped.grid
+
+    @property
+    def was_on_goal(self) -> list:
+        return self.unwrapped.was_on_goal
+
+    # -- PogemaLifeLong --
+
+    def get_lifelong_targets_xy(self, ignore_borders: bool = False) -> list:
+        return self.env.get_lifelong_targets_xy(ignore_borders=ignore_borders)
+
+    # -- MultiTimeLimit --
+
+    def set_elapsed_steps(self, elapsed_steps: int) -> None:
+        return self.env.set_elapsed_steps(elapsed_steps)
+
+    # -- Fallback for any remaining forwarded names --
+
+    def __getattr__(self, name):
+        if name in _POGEMA_FORWARDED:
+            return getattr(self.env, name)
+        raise AttributeError(f"'{type(self).__name__}' object has no attribute '{name}'")
diff --git a/pogema/wrappers/metrics.py b/pogema/wrappers/metrics.py
index 6d09c19..bb095ab 100644
--- a/pogema/wrappers/metrics.py
+++ b/pogema/wrappers/metrics.py
@@ -1,10 +1,11 @@
 import time
 
 import numpy as np
-from gymnasium import Wrapper
 
+from pogema.wrappers.base import PogemaWrapper
 
-class AbstractMetric(Wrapper):
+
+class AbstractMetric(PogemaWrapper):
     def _compute_stats(self, step, is_on_goal, finished):
         raise NotImplementedError
 
@@ -127,7 +128,7 @@ def _compute_stats(self, step, is_on_goal, finished):
             return result
 
 
-class AgentsDensityWrapper(Wrapper):
+class AgentsDensityWrapper(PogemaWrapper):
     def __init__(self, env):
         super().__init__(env)
         self._avg_agents_density = None
@@ -155,7 +156,7 @@ def reset(self, **kwargs):
         return observations, info
 
 
-class RuntimeMetricWrapper(Wrapper):
+class RuntimeMetricWrapper(PogemaWrapper):
     def __init__(self, env):
         super().__init__(env)
         self._start_time = None
diff --git a/pogema/wrappers/multi_time_limit.py b/pogema/wrappers/multi_time_limit.py
index 13c9cc9..2e2e2a1 100644
--- a/pogema/wrappers/multi_time_limit.py
+++ b/pogema/wrappers/multi_time_limit.py
@@ -1,16 +1,23 @@
-from gymnasium.wrappers import TimeLimit
+from pogema.wrappers.base import PogemaWrapper
 
 
-class MultiTimeLimit(TimeLimit):
+class MultiTimeLimit(PogemaWrapper):
+    def __init__(self, env, max_episode_steps: int):
+        super().__init__(env)
+        self._max_episode_steps = max_episode_steps
+        self._elapsed_steps = None
+
     def step(self, action):
         observation, reward, terminated, truncated, info = self.env.step(action)
         self._elapsed_steps += 1
         if self._elapsed_steps >= self._max_episode_steps:
-            truncated = [True] * self.unwrapped.get_num_agents()
+            truncated = [True] * self.get_num_agents()
         return observation, reward, terminated, truncated, info
 
-    def set_elapsed_steps(self, elapsed_steps):
-        if not self.unwrapped.grid_config.persistent:
-            raise ValueError("Cannot set elapsed steps for non-persistent environment!")
+    def reset(self, **kwargs):
+        self._elapsed_steps = 0
+        return self.env.reset(**kwargs)
+
+    def set_elapsed_steps(self, elapsed_steps: int) -> None:
         assert elapsed_steps >= 0
         self._elapsed_steps = elapsed_steps
diff --git a/pogema/wrappers/persistence.py b/pogema/wrappers/persistence.py
index 6658eef..f38d453 100644
--- a/pogema/wrappers/persistence.py
+++ b/pogema/wrappers/persistence.py
@@ -1,4 +1,4 @@
-from gymnasium import Wrapper
+from pogema.wrappers.base import PogemaWrapper
 
 
 class AgentState:
@@ -30,7 +30,24 @@ def __str__(self):
         return str([self.x, self.y, self.tx, self.ty, self.step, self.active])
 
 
-class PersistentWrapper(Wrapper):
+def agent_state_to_full_list(agent_states, num_steps):
+    result = []
+    current_state_id = 0
+    # going over num_steps + 1, to handle last step
+    for episode_step in range(num_steps + 1):
+        if current_state_id < len(agent_states) - 1 and agent_states[current_state_id + 1].step == episode_step:
+            current_state_id += 1
+        result.append(agent_states[current_state_id])
+    return result
+
+
+def decompress_history(history):
+    max_steps = max([agent_states[-1].step for agent_states in history])
+    result = [agent_state_to_full_list(agent_states, max_steps) for agent_states in history]
+    return result
+
+
+class PersistentWrapper(PogemaWrapper):
     def __init__(self, env, xy_offset=None):
         super().__init__(env)
         self._step = None
@@ -89,25 +106,8 @@ def reset(self, **kwargs):
 
         return result
 
-    @staticmethod
-    def agent_state_to_full_list(agent_states, num_steps):
-        result = []
-        current_state_id = 0
-        # going over num_steps + 1, to handle last step
-        for episode_step in range(num_steps + 1):
-            if current_state_id < len(agent_states) - 1 and agent_states[current_state_id + 1].step == episode_step:
-                current_state_id += 1
-            result.append(agent_states[current_state_id])
-        return result
-
-    @classmethod
-    def decompress_history(cls, history):
-        max_steps = max([agent_states[-1].step for agent_states in history])
-        result = [cls.agent_state_to_full_list(agent_states, max_steps) for agent_states in history]
-        return result
-
     def get_full_history(self):
-        return [self.agent_state_to_full_list(agent_states, self._step) for agent_states in self._agent_states]
+        return [agent_state_to_full_list(agent_states, self._step) for agent_states in self._agent_states]
 
     def get_history(self):
         return self._agent_states
diff --git a/tests/test_integrations.py b/tests/test_integrations.py
index 5719751..5f4b021 100644
--- a/tests/test_integrations.py
+++ b/tests/test_integrations.py
@@ -1,5 +1,3 @@
-from functools import reduce
-
 import numpy as np
 
 from pogema import GridConfig
@@ -14,7 +12,7 @@ def test_gym_creation():
 
 
 def test_integrations():
-    for integration in ['SampleFactory', 'PyMARL', 'gymnasium', "PettingZoo", None]:
+    for integration in ['SampleFactory', 'gymnasium', "PettingZoo", None]:
         env = pogema_v0(grid_config=GridConfig(integration=integration))
         env.reset()
 
@@ -38,45 +36,6 @@ def test_sample_factory_integration():
         assert np.isclose(infos[0]['episode_extra_stats']['CSR'], 0.0)
 
 
-def test_pymarl_integration():
-    gc = GridConfig(seed=7, num_agents=4, obs_radius=3, max_episode_steps=16, integration='PyMARL')
-    env = pogema_v0(gc)
-
-    _state = [0.14285714285714285, 1.0, 1.0, 0.5714285714285714, 0.42857142857142855, 0.7142857142857143,
-              0.8571428571428571, 0.2857142857142857, 0.8571428571428571, 0.42857142857142855, 0.42857142857142855, 1.0,
-              0.5714285714285714, 0.7142857142857143, 0.14285714285714285, 0.42857142857142855, 0.0, 0.0, 0.0, 0.0, 0.0,
-              0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0,
-              0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0,
-              1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0,
-              0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0,
-              0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0,
-              0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0,
-              0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0,
-              0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0,
-              0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0,
-              0.0, 0.0]
-    assert np.isclose(_state, env.get_state()).all()
-
-    assert env.episode_limit == 16
-    assert env.get_env_info()['state_shape'] == 212
-    assert env.get_env_info()['obs_shape'] == 147
-    assert env.get_env_info()['n_agents'] == 4
-    assert env.get_env_info()['episode_limit'] == 16
-
-    num_agents, dimension = env.get_obs().shape
-    assert num_agents == gc.num_agents
-    assert dimension == reduce(lambda a, b: a * b, env.env.observation_space.shape)
-    assert dimension == env.get_obs_size()
-    assert env.get_state_size() == env.get_state().shape[0]
-
-    done = False
-    cnt = 0
-    while not done:
-        assert cnt < gc.max_episode_steps
-        _, done, _ = env.step(env.sample_actions())
-        cnt += 1
-
-
 def test_single_agent_gym_integration():
     gc = GridConfig(seed=7, num_agents=1, integration='gymnasium')
     env = pogema_v0(gc)
diff --git a/tests/test_pogema_env.py b/tests/test_pogema_env.py
index 78b9231..4e432a6 100644
--- a/tests/test_pogema_env.py
+++ b/tests/test_pogema_env.py
@@ -1,12 +1,16 @@
+import os
 import time
+import warnings
 
 import numpy as np
+import pytest
 from tabulate import tabulate
 
-from pogema import pogema_v0, AnimationMonitor
+from pogema import pogema_v0, AnimationMonitor, AnimationConfig
 
 from pogema.envs import ActionsSampler
 from pogema.grid import GridConfig
+from pogema.wrappers.persistence import PersistentWrapper
 
 
 class ActionMapping:
@@ -203,8 +207,8 @@ def test_persistent_env(num_steps=100):
     seed = 42
 
     env = pogema_v0(
-        grid_config=GridConfig(on_target='finish', seed=seed, num_agents=8, density=0.132, size=8, obs_radius=2,
-                               persistent=True))
+        grid_config=GridConfig(on_target='finish', seed=seed, num_agents=8, density=0.132, size=8, obs_radius=2))
+    env = PersistentWrapper(env)
 
     env.reset()
     action_sampler = ActionsSampler(env.action_space.n, seed=seed)
@@ -240,12 +244,51 @@ def state_repr(observations, rewards, terminates, truncates, infos):
     assert np.isclose(first_run_observations, second_run_observations).all()
 
 
+def test_wrapper_attribute_forwarding():
+    import pytest
+    for on_target in ['finish', 'nothing', 'restart']:
+        gc = GridConfig(num_agents=2, size=6, seed=42, on_target=on_target)
+        env = pogema_v0(gc)
+        env.reset()
+
+        assert env.get_num_agents() == 2
+        assert env.grid_config is not None
+        assert env.sample_actions() is not None
+        assert env.get_obstacles() is not None
+        assert env.get_agents_xy() is not None
+        assert env.get_targets_xy() is not None
+
+        with pytest.raises(AttributeError):
+            env.nonexistent_attribute_xyz
+
+
+def test_wrapper_forwarding_persistent():
+    gc = GridConfig(num_agents=2, size=6, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env = PersistentWrapper(env)
+    env.reset()
+
+    assert env.get_num_agents() == 2
+    assert env.get_history() is not None
+    assert env.grid_config is not None
+
+
+def test_wrapper_forwarding_animation():
+    gc = GridConfig(num_agents=2, size=6, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env = AnimationMonitor(env)
+    env.reset()
+
+    assert env.get_num_agents() == 2
+    assert env.grid_config is not None
+
+
 def test_steps_per_second_throughput():
     table = []
     for on_target in ['finish', 'nothing', 'restart']:
         for num_agents in [1, 32, 64]:
             for size in [32, 64]:
-                gc = GridConfig(obs_radius=5, seed=42, max_episode_steps=1024, 
+                gc = GridConfig(obs_radius=5, seed=42, max_episode_steps=1024,
                               size=size, num_agents=num_agents, on_target=on_target)
 
                 start_time = time.monotonic()
@@ -254,3 +297,79 @@ def test_steps_per_second_throughput():
                 steps_per_second = gc.max_episode_steps / (end_time - start_time)
                 table.append([on_target, num_agents, size, steps_per_second * gc.num_agents])
     print('\n' + tabulate(table, headers=['on_target', 'num_agents', 'size', 'SPS (individual)'], tablefmt='grid'))
+
+
+def test_enable_animation_and_save(tmp_path):
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.enable_animation()
+    env.reset()
+    run_episode(env=env)
+
+    svg_path = str(tmp_path / 'test_anim.svg')
+    env.save_animation(svg_path)
+    assert os.path.exists(svg_path)
+    with open(svg_path) as f:
+        content = f.read()
+    assert '<svg' in content
+
+
+def test_no_overhead_without_animation():
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    assert not env.animation_is_active
+    env.reset()
+    run_episode(env=env)
+
+
+def test_disable_animation():
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.enable_animation()
+    assert env.animation_is_active
+    env.disable_animation()
+    assert not env.animation_is_active
+
+
+def test_save_animation_without_enable_raises():
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.reset()
+    with pytest.raises(RuntimeError, match="Animation is not active"):
+        env.save_animation('test.svg')
+
+
+def test_animation_monitor_backward_compat():
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    with warnings.catch_warnings(record=True) as w:
+        warnings.simplefilter("always")
+        env = AnimationMonitor(env, AnimationConfig(save_every_idx_episode=None))
+        assert len(w) == 1
+        assert issubclass(w[0].category, DeprecationWarning)
+        assert "deprecated" in str(w[0].message).lower()
+    env.reset()
+    run_episode(env=env)
+
+
+def test_metrics_with_animation():
+    for on_target in ['finish', 'nothing', 'restart']:
+        gc = GridConfig(num_agents=2, seed=5, size=5, max_episode_steps=64, on_target=on_target)
+        env = pogema_v0(gc)
+        env.enable_animation()
+        env.reset()
+        *_, infos = run_episode(env=env)[-1]
+        assert 'metrics' in infos[0]
+
+
+def test_enable_animation_for_all_on_target_modes(tmp_path):
+    for on_target in ['finish', 'nothing', 'restart']:
+        gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42,
+                        on_target=on_target, max_episode_steps=16)
+        env = pogema_v0(gc)
+        env.enable_animation()
+        env.reset()
+        run_episode(env=env)
+        svg_path = str(tmp_path / f'test_{on_target}.svg')
+        env.save_animation(svg_path)
+        assert os.path.exists(svg_path)
diff --git a/version_history.MD b/version_history.MD
index e1d23ba..8e10994 100644
--- a/version_history.MD
+++ b/version_history.MD
@@ -1,6 +1,6 @@
 The development history of POGEMA, starting from version 1.0.0.
 
-Version 1.5.0 (August, 2025)
+Version 1.4.X (August, 2025)
 	•	Added support of custom targets_xy for lifelong MAPF.
 	•	Improved work with rectangular grids. Added width and height attributes to GridConfig.
 	•	Added method update_config to properly update all attributes of GridConfig.

From d3ad40bea177892a089b73f1a5163d57909883dc Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sat, 28 Feb 2026 13:55:54 +0300
Subject: [PATCH 04/15] hotfix: export AnimationMonitor and AnimationConfig in __all__

---
 pogema/__init__.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/pogema/__init__.py b/pogema/__init__.py
index 1b77cb9..5538f1e 100644
--- a/pogema/__init__.py
+++ b/pogema/__init__.py
@@ -13,6 +13,8 @@
 __all__ = [
     'GridConfig',
     'pogema_v0',
+    'AnimationMonitor',
+    'AnimationConfig',
     'AStarAgent', 'BatchAStarAgent',
     "PogemaWrapper",
     "AnimationWrapper",

From 3a23ea605e3320194655caeb56375dd74e969f53 Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sat, 28 Feb 2026 13:55:54 +0300
Subject: [PATCH 05/15] hotfix: change default collision_system to 'priority'

---
 pogema/grid_config.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pogema/grid_config.py b/pogema/grid_config.py
index f537d7b..46f6458 100644
--- a/pogema/grid_config.py
+++ b/pogema/grid_config.py
@@ -18,7 +18,7 @@ class GridConfig(CommonSettings):
     num_agents: Optional[int] = None
     possible_agents_xy: Optional[list] = None
     possible_targets_xy: Optional[list] = None
-    collision_system: Literal['block_both', 'priority', 'soft'] = 'soft'
+    collision_system: Literal['block_both', 'priority', 'soft'] = 'priority'
     persistent: bool = False
     observation_type: Literal['POMAPF', 'MAPF', 'default'] = 'default'
     map: Optional[Union[list, str]] = None

From 8df84b9dd63f3ba7d3d467cac093f98fb00df67d Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sat, 28 Feb 2026 14:32:41 +0300
Subject: [PATCH 06/15] fix for animation.py and tests

---
 pogema/__init__.py                 |   2 +
 pogema/wrappers/animation.py       | 124 +++++++++++++++++++++++++++++
 pogema/wrappers/base.py            |  15 ++++
 tests/test_deterministic_policy.py |  18 ++---
 tests/test_grid.py                 |   4 +-
 tests/test_pogema_env.py           |  10 +--
 6 files changed, 155 insertions(+), 18 deletions(-)
 create mode 100644 pogema/wrappers/animation.py

diff --git a/pogema/__init__.py b/pogema/__init__.py
index 5538f1e..08f1436 100644
--- a/pogema/__init__.py
+++ b/pogema/__init__.py
@@ -24,4 +24,6 @@
 register(
     id="Pogema-v0",
     entry_point="pogema.integrations.make_pogema:make_single_agent_gym",
+    order_enforce=False,
+    disable_env_checker=True,
 )
diff --git a/pogema/wrappers/animation.py b/pogema/wrappers/animation.py
new file mode 100644
index 0000000..3de14ff
--- /dev/null
+++ b/pogema/wrappers/animation.py
@@ -0,0 +1,124 @@
+from itertools import cycle
+
+from pogema.wrappers.base import PogemaWrapper
+from pogema.wrappers.persistence import AgentState, decompress_history
+
+
+class AnimationWrapper(PogemaWrapper):
+    def __init__(self, env):
+        super().__init__(env)
+        self._active = False
+        self._animation_config = None
+        self._step = None
+        self._agent_states = None
+
+    def step(self, action):
+        result = self.env.step(action)
+        if not self._active:
+            return result
+        self._step += 1
+        for agent_idx in range(self.unwrapped.get_num_agents()):
+            agent_state = self._get_agent_state(self.unwrapped.grid, agent_idx)
+            if agent_state != self._agent_states[agent_idx][-1]:
+                self._agent_states[agent_idx].append(agent_state)
+
+        return result
+
+    def reset(self, **kwargs):
+        result = self.env.reset(**kwargs)
+        if not self._active:
+            return result
+
+        self._step = 0
+
+        self._agent_states = []
+        for agent_idx in range(self.unwrapped.get_num_agents()):
+            self._agent_states.append([self._get_agent_state(self.unwrapped.grid, agent_idx)])
+
+        return result
+
+    def _get_agent_state(self, grid, agent_idx):
+        x, y = grid.positions_xy[agent_idx]
+        tx, ty = grid.finishes_xy[agent_idx]
+        active = grid.is_active[agent_idx]
+        return AgentState(x, y, tx, ty, self._step, active)
+
+    def enable_animation(self, animation_config=None):
+        self._active = True
+        if animation_config is not None:
+            self._animation_config = animation_config
+
+    def disable_animation(self):
+        self._active = False
+
+    @property
+    def animation_is_active(self):
+        return self._active
+
+    def save_animation(self, name='render.svg', animation_config=None):
+        if not self._active:
+            raise RuntimeError(
+                "Animation is not active. Call env.enable_animation() and then env.reset() before saving."
+            )
+        if self._agent_states is None:
+            raise RuntimeError(
+                "No history recorded. Call env.reset() after enable_animation() before saving."
+            )
+
+        from pogema.svg_animation.animation_drawer import AnimationConfig, SvgSettings, GridHolder, AnimationDrawer
+
+        if animation_config is None:
+            animation_config = self._animation_config
+        if animation_config is None:
+            animation_config = AnimationConfig()
+
+        working_radius = self.unwrapped.grid_config.obs_radius - 1
+        if working_radius > 0:
+            obstacles = self.unwrapped.get_obstacles(ignore_borders=False)[working_radius:-working_radius,
+                        working_radius:-working_radius]
+        else:
+            obstacles = self.unwrapped.get_obstacles(ignore_borders=False)
+
+        # Apply offset at render time to shift positions into trimmed coordinate space
+        offset = -working_radius
+        raw_history = self._agent_states
+        shifted_history = []
+        for agent_states in raw_history:
+            shifted = []
+            for s in agent_states:
+                if offset != 0:
+                    shifted.append(AgentState(s.x + offset, s.y + offset, s.tx + offset, s.ty + offset, s.step, s.active))
+                else:
+                    shifted.append(s)
+            shifted_history.append(shifted)
+
+        history = decompress_history(shifted_history)
+
+        svg_settings = SvgSettings()
+        colors_cycle = cycle(svg_settings.colors)
+        agents_colors = {index: next(colors_cycle) for index in range(self.unwrapped.grid_config.num_agents)}
+
+        for agent_idx in range(self.unwrapped.grid_config.num_agents):
+            history[agent_idx].append(history[agent_idx][-1])
+
+        episode_length = len(history[0])
+        if animation_config.egocentric_idx is not None and self.unwrapped.grid_config.on_target == 'finish':
+            episode_length = history[animation_config.egocentric_idx][-1].step + 1
+            for agent_idx in range(self.unwrapped.grid_config.num_agents):
+                history[agent_idx] = history[agent_idx][:episode_length]
+
+        grid_holder = GridHolder(
+            width=len(obstacles), height=len(obstacles[0]),
+            obstacles=obstacles,
+            episode_length=episode_length,
+            history=history,
+            obs_radius=self.unwrapped.grid_config.obs_radius,
+            on_target=self.unwrapped.grid_config.on_target,
+            colors=agents_colors,
+            config=animation_config,
+            svg_settings=svg_settings,
+        )
+
+        animation = AnimationDrawer().create_animation(grid_holder)
+        with open(name, "w") as f:
+            f.write(animation.render())
diff --git a/pogema/wrappers/base.py b/pogema/wrappers/base.py
index 65a4045..98c9141 100644
--- a/pogema/wrappers/base.py
+++ b/pogema/wrappers/base.py
@@ -84,6 +84,21 @@ def get_lifelong_targets_xy(self, ignore_borders: bool = False) -> list:
     def set_elapsed_steps(self, elapsed_steps: int) -> None:
         return self.env.set_elapsed_steps(elapsed_steps)
 
+    # -- AnimationWrapper --
+
+    def enable_animation(self, animation_config=None):
+        return self.env.enable_animation(animation_config)
+
+    def disable_animation(self):
+        return self.env.disable_animation()
+
+    def save_animation(self, name='render.svg', animation_config=None):
+        return self.env.save_animation(name, animation_config=animation_config)
+
+    @property
+    def animation_is_active(self):
+        return self.env.animation_is_active
+
     # -- Fallback for any remaining forwarded names --
 
     def __getattr__(self, name):
diff --git a/tests/test_deterministic_policy.py b/tests/test_deterministic_policy.py
index b1b7e31..639fcc1 100644
--- a/tests/test_deterministic_policy.py
+++ b/tests/test_deterministic_policy.py
@@ -1,8 +1,6 @@
 import numpy as np
 from heapq import heappop, heappush
-from pogema import GridConfig, pogema_v0, AnimationMonitor
-
-# from pogema.animation import AnimationMonitor
+from pogema import GridConfig, pogema_v0
 
 INF = 1000000007
 
@@ -124,11 +122,9 @@ def act(self, obs) -> list:
         return actions
 
 
-def run_policy(gc: GridConfig, save_animation=False):
+def run_policy(gc: GridConfig):
     policy = DeterministicPolicy()
     env = pogema_v0(grid_config=gc)
-    if save_animation:
-        env = AnimationMonitor(env)
 
     while True:
         obs, info = env.reset()
@@ -142,7 +138,7 @@ def run_policy(gc: GridConfig, save_animation=False):
 
 def test_life_long():
     gc = GridConfig(num_agents=20, size=8, obs_radius=4, seed=42, max_episode_steps=64, on_target='restart')
-    results_generator = run_policy(gc, save_animation=False)
+    results_generator = run_policy(gc)
 
     metrics = results_generator.__next__()
     assert np.isclose(metrics['avg_throughput'], 1.671875)
@@ -150,7 +146,7 @@ def test_life_long():
     assert np.isclose(metrics['avg_throughput'], 1.609375)
     
     gc = GridConfig(num_agents=24, size=8, obs_radius=4, seed=43, max_episode_steps=64, on_target='restart')
-    results_generator = run_policy(gc, save_animation=False)
+    results_generator = run_policy(gc)
 
     metrics = results_generator.__next__()
     assert np.isclose(metrics['avg_throughput'], 0.4375)
@@ -158,7 +154,7 @@ def test_life_long():
 
 def test_disappearing():
     gc = GridConfig(num_agents=20, size=8, obs_radius=2, seed=42, density=0.2, max_episode_steps=32, on_target='finish')
-    results_generator = run_policy(gc, save_animation=False)
+    results_generator = run_policy(gc)
 
     metrics = results_generator.__next__()
     assert np.isclose(metrics['ep_length'], 22.95)
@@ -173,7 +169,7 @@ def test_disappearing():
 
 def test_non_disappearing():
     gc = GridConfig(num_agents=4, size=5, obs_radius=2, seed=3, density=0.2, max_episode_steps=32, on_target='nothing')
-    results_generator = run_policy(gc, save_animation=False)
+    results_generator = run_policy(gc)
 
     metrics = results_generator.__next__()
     assert np.isclose(metrics['ep_length'], 21)
@@ -186,7 +182,7 @@ def test_non_disappearing():
     assert np.isclose(metrics['ISR'], 1.0)
 
     gc = GridConfig(num_agents=7, size=5, obs_radius=2, seed=3, density=0.2, max_episode_steps=32, on_target='nothing')
-    results_generator = run_policy(gc, save_animation=False)
+    results_generator = run_policy(gc)
 
     metrics = results_generator.__next__()
     assert np.isclose(metrics['ep_length'], 32)
diff --git a/tests/test_grid.py b/tests/test_grid.py
index 23d7220..6b214cd 100644
--- a/tests/test_grid.py
+++ b/tests/test_grid.py
@@ -400,9 +400,9 @@ def test_grid_with_goal_sequences():
 def test_pogema_lifelong_with_sequences():
     from pogema.envs import PogemaLifeLong
     import warnings
-    
+
     config = GridConfig(
-        width=8, height=8,
+        width=8, height=8, density=0,
         agents_xy=[[1, 1], [1, 2]],
         targets_xy=[
             [[2, 2], [3, 3], [4, 4]],
diff --git a/tests/test_pogema_env.py b/tests/test_pogema_env.py
index 4e432a6..6edad88 100644
--- a/tests/test_pogema_env.py
+++ b/tests/test_pogema_env.py
@@ -112,7 +112,7 @@ def test_mapf_observation():
 
 def test_standard_pogema_animation():
     env = pogema_v0(GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish'))
-    env = AnimationMonitor(env)
+    env.enable_animation()
     env.reset()
     run_episode(env=env)
 
@@ -122,7 +122,7 @@ def test_gym_pogema_animation():
     env = gymnasium.make('Pogema-v0',
                          grid_config=GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42,
                                                 on_target='finish'))
-    env = AnimationMonitor(env)
+    env.enable_animation()
     env.reset()
 
     while True:
@@ -145,7 +145,7 @@ def test_non_disappearing_pogema_no_seed():
 
 def test_non_disappearing_pogema_animation():
     env = pogema_v0(GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='nothing'))
-    env = AnimationMonitor(env)
+    env.enable_animation()
     env.reset()
     run_episode(env=env)
 
@@ -164,7 +164,7 @@ def test_life_long_pogema_empty_seed():
 
 def test_life_long_pogema_animation():
     env = pogema_v0(GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='restart'))
-    env = AnimationMonitor(env)
+    env.enable_animation()
     env.reset()
     run_episode(env=env)
 
@@ -276,7 +276,7 @@ def test_wrapper_forwarding_persistent():
 def test_wrapper_forwarding_animation():
     gc = GridConfig(num_agents=2, size=6, seed=42, on_target='finish')
     env = pogema_v0(gc)
-    env = AnimationMonitor(env)
+    env.enable_animation()
     env.reset()
 
     assert env.get_num_agents() == 2

From c147e11d994f16f0446801a7b6fc6dee78e705d1 Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sun, 1 Mar 2026 00:16:09 +0300
Subject: [PATCH 07/15] Removing CodeFactor

---
 README.md | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/README.md b/README.md
index 0fd0fb2..f3ecc05 100644
--- a/README.md
+++ b/README.md
@@ -5,7 +5,7 @@
 
 **Partially-Observable Grid Environment for Multiple Agents**
 
-[![CodeFactor](https://www.codefactor.io/repository/github/tviskaron/pogema/badge)](https://www.codefactor.io/repository/github/tviskaron/pogema)
+
 [![Downloads](https://static.pepy.tech/badge/pogema)](https://pepy.tech/project/pogema)
 [![CI](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/CI.yml/badge.svg?branch=main)](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/CI.yml)
 [![CodeQL](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/codeql-analysis.yml/badge.svg)](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/codeql-analysis.yml) 
@@ -108,7 +108,6 @@ grid_config = GridConfig(num_agents=4,  # number of agents
 env = pogema_v0(grid_config=grid_config)
 env.reset()
 env.render()
-
 ```
 
 ### Custom maps

From b6bd459d1144c58aef0ce6193d2b771c3893f3cb Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sun, 1 Mar 2026 11:45:44 +0300
Subject: [PATCH 08/15] update codeql

---
 .github/workflows/codeql-analysis.yml | 40 +++------------------------
 1 file changed, 4 insertions(+), 36 deletions(-)

diff --git a/.github/workflows/codeql-analysis.yml b/.github/workflows/codeql-analysis.yml
index 1080356..b1b9f86 100644
--- a/.github/workflows/codeql-analysis.yml
+++ b/.github/workflows/codeql-analysis.yml
@@ -1,21 +1,9 @@
-# For most projects, this workflow file will not need changing; you simply need
-# to commit it to your repository.
-#
-# You may wish to alter this file to override the set of languages analyzed,
-# or to provide custom queries or build logic.
-#
-# ******** NOTE ********
-# We have attempted to detect the languages in your repository. Please check
-# the `language` matrix defined below to confirm you have the correct set of
-# supported CodeQL languages.
-#
 name: "CodeQL"
 
 on:
   push:
     branches: [ main ]
   pull_request:
-    # The branches below must be a subset of the branches above
     branches: [ main ]
   schedule:
     - cron: '21 4 * * 1'
@@ -33,38 +21,18 @@ jobs:
       fail-fast: false
       matrix:
         language: [ 'python' ]
-        # CodeQL supports [ 'cpp', 'csharp', 'go', 'java', 'javascript', 'python', 'ruby' ]
-        # Learn more about CodeQL language support at https://git.io/codeql-language-support
 
     steps:
     - name: Checkout repository
-      uses: actions/checkout@v2
+      uses: actions/checkout@v4
 
-    # Initializes the CodeQL tools for scanning.
     - name: Initialize CodeQL
-      uses: github/codeql-action/init@v1
+      uses: github/codeql-action/init@v3
       with:
         languages: ${{ matrix.language }}
-        # If you wish to specify custom queries, you can do so here or in a config file.
-        # By default, queries listed here will override any specified in a config file.
-        # Prefix the list here with "+" to use these queries and those in the config file.
-        # queries: ./path/to/local/query, your-org/your-repo/queries@main
 
-    # Autobuild attempts to build any compiled languages  (C/C++, C#, or Java).
-    # If this step fails, then you should remove it and run the build manually (see below)
     - name: Autobuild
-      uses: github/codeql-action/autobuild@v1
-
-    # ℹ️ Command-line programs to run using the OS shell.
-    # 📚 https://git.io/JvXDl
-
-    # ✏️ If the Autobuild fails above, remove it and uncomment the following three lines
-    #    and modify them (or add more) to build your code if your project
-    #    uses a compiled language
-
-    #- run: |
-    #   make bootstrap
-    #   make release
+      uses: github/codeql-action/autobuild@v3
 
     - name: Perform CodeQL Analysis
-      uses: github/codeql-action/analyze@v1
+      uses: github/codeql-action/analyze@v3

From 08d88354339a83267176097a6208916a83c9c8bd Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sun, 1 Mar 2026 11:51:56 +0300
Subject: [PATCH 09/15] ruff "W", "I", "UP", "B" flags, and corresponding
 fixes, plus fixed seeding in reset

---
 pogema/__init__.py                        |   8 +-
 pogema/a_star_policy.py                   |   5 +-
 pogema/envs.py                            |  63 +++++++------
 pogema/generator.py                       |   2 +-
 pogema/grid.py                            |  20 +++--
 pogema/grid_config.py                     |  29 +++---
 pogema/integrations/make_pogema.py        |   9 +-
 pogema/integrations/pettingzoo.py         |   5 +-
 pogema/svg_animation/animation_drawer.py  |  26 +++---
 pogema/svg_animation/animation_wrapper.py |   4 +-
 pogema/utils.py                           |  12 +--
 pogema/wrappers/animation.py              |  35 +++++++-
 pogema/wrappers/base.py                   |   5 +-
 pogema/wrappers/metrics.py                |   2 +-
 pyproject.toml                            |  17 ++--
 tests/test_deterministic_policy.py        |   8 +-
 tests/test_grid.py                        |  72 +++++++--------
 tests/test_pogema_env.py                  | 102 +++++++++++++++++-----
 18 files changed, 268 insertions(+), 156 deletions(-)

diff --git a/pogema/__init__.py b/pogema/__init__.py
index 08f1436..4d02a63 100644
--- a/pogema/__init__.py
+++ b/pogema/__init__.py
@@ -1,11 +1,12 @@
 from gymnasium import register
+
 from pogema.grid_config import GridConfig
+from pogema.a_star_policy import AStarAgent, BatchAStarAgent
 from pogema.integrations.make_pogema import pogema_v0
-from pogema.svg_animation.animation_wrapper import AnimationMonitor
 from pogema.svg_animation.animation_drawer import AnimationConfig
-from pogema.a_star_policy import AStarAgent, BatchAStarAgent
+from pogema.svg_animation.animation_wrapper import AnimationMonitor
+from pogema.wrappers.animation import AnimationWrapper, SvgAnimation
 from pogema.wrappers.base import PogemaWrapper
-from pogema.wrappers.animation import AnimationWrapper
 from pogema.wrappers.persistence import PersistentWrapper
 
 __version__ = '1.4.0'
@@ -18,6 +19,7 @@
     'AStarAgent', 'BatchAStarAgent',
     "PogemaWrapper",
     "AnimationWrapper",
+    "SvgAnimation",
     "PersistentWrapper",
 ]
 
diff --git a/pogema/a_star_policy.py b/pogema/a_star_policy.py
index 0b41a96..294c8b8 100644
--- a/pogema/a_star_policy.py
+++ b/pogema/a_star_policy.py
@@ -1,7 +1,8 @@
+from heapq import heappop, heappush
+
 import numpy as np
-from pogema import GridConfig
 
-from heapq import heappop, heappush
+from pogema import GridConfig
 
 INF = 1e7
 
diff --git a/pogema/envs.py b/pogema/envs.py
index 0f03883..e4fa9d9 100644
--- a/pogema/envs.py
+++ b/pogema/envs.py
@@ -1,16 +1,24 @@
-from typing import Optional
 import warnings
-import numpy as np
+
 import gymnasium
+import numpy as np
 from gymnasium.error import ResetNeeded
 
+from pogema.generator import generate_from_possible_targets, generate_new_target
 from pogema.grid import Grid, GridLifeLong
 from pogema.grid_config import GridConfig
-from pogema.wrappers.metrics import LifeLongAverageThroughputMetric, NonDisappearEpLengthMetric, \
-    NonDisappearCSRMetric, NonDisappearISRMetric, EpLengthMetric, ISRMetric, CSRMetric, SumOfCostsAndMakespanMetric
-from pogema.wrappers.multi_time_limit import MultiTimeLimit
-from pogema.generator import generate_new_target, generate_from_possible_targets
 from pogema.wrappers.animation import AnimationWrapper
+from pogema.wrappers.metrics import (
+    CSRMetric,
+    EpLengthMetric,
+    ISRMetric,
+    LifeLongAverageThroughputMetric,
+    NonDisappearCSRMetric,
+    NonDisappearEpLengthMetric,
+    NonDisappearISRMetric,
+    SumOfCostsAndMakespanMetric,
+)
+from pogema.wrappers.multi_time_limit import MultiTimeLimit
 
 
 class ActionsSampler:
@@ -39,7 +47,7 @@ class PogemaBase(gymnasium.Env):
     def step(self, action):
         raise NotImplementedError
 
-    def reset(self, seed: Optional[int] = None, return_info: bool = False, options: Optional[dict] = None, ):
+    def reset(self, seed: int | None = None, return_info: bool = False, options: dict | None = None, ):
         raise NotImplementedError
 
     def __init__(self, grid_config: GridConfig = GridConfig()):
@@ -157,13 +165,12 @@ def update_was_on_goal(self):
         self.was_on_goal = [self.grid.on_goal(agent_idx) and self.grid.is_active[agent_idx]
                             for agent_idx in range(self.grid_config.num_agents)]
 
-    def reset(self, seed: Optional[int] = None, return_info: bool = True, options: Optional[dict] = None, ):
+    def reset(self, seed: int | None = None, return_info: bool = True, options: dict | None = None, ):
+        if seed is not None:
+            self.grid_config.seed = seed
         self._initialize_grid()
         self.update_was_on_goal()
 
-        if seed is not None:
-            self.grid.seed = seed
-
         if return_info:
             return self._obs(), self._get_infos()
         return self._obs()
@@ -268,7 +275,7 @@ def move_agents(self, actions):
                 if self.grid.is_active[agent_idx]:
                     self.grid.move_without_checks(agent_idx, actions[agent_idx])
         else:
-            raise ValueError('Unknown collision system: {}'.format(self.grid.config.collision_system))
+            raise ValueError(f'Unknown collision system: {self.grid.config.collision_system}')
 
     def get_agents_xy_relative(self):
         return self.grid.get_agents_xy_relative()
@@ -301,15 +308,15 @@ def _initialize_grid(self):
         main_rng = np.random.default_rng(self.grid_config.seed)
         seeds = main_rng.integers(np.iinfo(np.int32).max, size=self.grid_config.num_agents)
         self.random_generators = [np.random.default_rng(seed) for seed in seeds]
-        
+
     def get_lifelong_targets_xy(self, ignore_borders=False):
         if self.has_custom_sequences:
             if ignore_borders:
                 return self.grid_config.targets_xy
             else:
-                return [[[x + self.grid_config.obs_radius, y + self.grid_config.obs_radius] for x, y in sequence] 
+                return [[[x + self.grid_config.obs_radius, y + self.grid_config.obs_radius] for x, y in sequence]
                         for sequence in self.grid_config.targets_xy]
-        
+
         sequences = []
 
         main_rng = np.random.default_rng(self.grid_config.seed)
@@ -323,24 +330,24 @@ def get_lifelong_targets_xy(self, ignore_borders=False):
             agent_sequence.append(initial_target)
             current_pos = initial_target
             total_distance = abs(start_pos[0] - initial_target[0]) + abs(start_pos[1] - initial_target[1])
-            
+
             while total_distance < self.grid_config.max_episode_steps:
                 if ignore_borders:
-                    generator_pos = (current_pos[0] + self.grid_config.obs_radius, 
+                    generator_pos = (current_pos[0] + self.grid_config.obs_radius,
                                    current_pos[1] + self.grid_config.obs_radius)
                 else:
                     generator_pos = tuple(current_pos)
 
                 if self.grid_config.possible_targets_xy is not None:
                     new_goal = generate_from_possible_targets(
-                        temp_generators[agent_idx], 
-                        self.grid_config.possible_targets_xy, 
+                        temp_generators[agent_idx],
+                        self.grid_config.possible_targets_xy,
                         generator_pos
                     )
                     if ignore_borders:
                         goal_coords = list(new_goal)
                     else:
-                        goal_coords = [new_goal[0] + self.grid_config.obs_radius, 
+                        goal_coords = [new_goal[0] + self.grid_config.obs_radius,
                                        new_goal[1] + self.grid_config.obs_radius]
                 else:
                     new_goal = generate_new_target(
@@ -350,7 +357,7 @@ def get_lifelong_targets_xy(self, ignore_borders=False):
                         generator_pos
                     )
                     if ignore_borders:
-                        goal_coords = [new_goal[0] - self.grid_config.obs_radius, 
+                        goal_coords = [new_goal[0] - self.grid_config.obs_radius,
                                        new_goal[1] - self.grid_config.obs_radius]
                     else:
                         goal_coords = list(new_goal)
@@ -361,7 +368,7 @@ def get_lifelong_targets_xy(self, ignore_borders=False):
             sequences.append(agent_sequence)
         return sequences
 
-    def reset(self, seed: Optional[int] = None, return_info: bool = True, options: Optional[dict] = None):
+    def reset(self, seed: int | None = None, return_info: bool = True, options: dict | None = None):
         self.current_goal_indices = [0] * self.grid_config.num_agents
         return super().reset(seed=seed, return_info=return_info, options=options)
 
@@ -370,9 +377,9 @@ def _generate_new_target(self, agent_idx):
             agent_targets = self.grid_config.targets_xy[agent_idx]
             current_idx = self.current_goal_indices[agent_idx]
             next_target = agent_targets[(current_idx + 1) % len(agent_targets)]
-            
+
             self.current_goal_indices[agent_idx] = (current_idx + 1) % len(agent_targets)
-            
+
             if self.current_goal_indices[agent_idx] == 0 and current_idx == len(agent_targets) - 1:
                 warnings.warn(
                     f"Agent {agent_idx} has completed all {len(agent_targets)} provided targets and "
@@ -381,12 +388,12 @@ def _generate_new_target(self, agent_idx):
                     UserWarning,
                     stacklevel=2
                 )
-            
-            return (next_target[0] + self.grid_config.obs_radius, 
+
+            return (next_target[0] + self.grid_config.obs_radius,
                    next_target[1] + self.grid_config.obs_radius)
         elif self.grid_config.possible_targets_xy is not None:
-            new_goal = generate_from_possible_targets(self.random_generators[agent_idx], 
-                                                     self.grid_config.possible_targets_xy, 
+            new_goal = generate_from_possible_targets(self.random_generators[agent_idx],
+                                                     self.grid_config.possible_targets_xy,
                                                      self.grid.positions_xy[agent_idx])
             return (new_goal[0] + self.grid_config.obs_radius, new_goal[1] + self.grid_config.obs_radius)
         else:
diff --git a/pogema/generator.py b/pogema/generator.py
index c45b21d..25d4c52 100644
--- a/pogema/generator.py
+++ b/pogema/generator.py
@@ -111,7 +111,7 @@ def generate_from_possible_positions(grid_config: GridConfig):
     rng.shuffle(grid_config.possible_agents_xy)
     rng.shuffle(grid_config.possible_targets_xy)
     return grid_config.possible_agents_xy[:grid_config.num_agents], grid_config.possible_targets_xy[:grid_config.num_agents]
-    
+
 
 def generate_positions_and_targets_fast(obstacles, grid_config):
     c = grid_config
diff --git a/pogema/grid.py b/pogema/grid.py
index 63aef77..ed344bf 100644
--- a/pogema/grid.py
+++ b/pogema/grid.py
@@ -1,12 +1,17 @@
-from copy import deepcopy
 import warnings
+from copy import deepcopy
 
 import numpy as np
 
-from pogema.generator import generate_obstacles, generate_positions_and_targets_fast, \
-    get_components, generate_from_possible_positions
+from pogema.generator import (
+    generate_from_possible_positions,
+    generate_obstacles,
+    generate_positions_and_targets_fast,
+    get_components,
+)
+
 from .grid_config import GridConfig
-from .grid_registry import in_registry, get_grid
+from .grid_registry import get_grid, in_registry
 from .utils import render_grid
 
 
@@ -31,7 +36,7 @@ def __init__(self, grid_config: GridConfig, add_artificial_border: bool = True,
                 self.finishes_xy = [sequence[0] for sequence in grid_config.targets_xy]
             else:
                 self.finishes_xy = grid_config.targets_xy
-                
+
             if len(self.starts_xy) != len(self.finishes_xy):
                 raise IndexError("Can't create task. Please provide agents_xy and targets_xy of the same size.")
             if grid_config.num_agents > len(self.starts_xy):
@@ -239,7 +244,7 @@ def render(self, mode='human', border='thin'):
 
     def move_agent_to_cell(self, agent_id, x, y):
         if self.positions[self.positions_xy[agent_id]] == self.config.FREE:
-            raise KeyError("Agent {} is not in the map".format(agent_id))
+            raise KeyError(f"Agent {agent_id} is not in the map")
         self.positions[self.positions_xy[agent_id]] = self.config.FREE
         if self.obstacles[x, y] != self.config.FREE or self.positions[x, y] != self.config.FREE:
             raise ValueError(f"Can't force agent to blocked position {x} {y}")
@@ -270,9 +275,6 @@ def move(self, agent_id, action):
     def on_goal(self, agent_id):
         return self.positions_xy[agent_id] == self.finishes_xy[agent_id]
 
-    def is_active(self, agent_id):
-        return self.is_active[agent_id]
-
     def hide_agent(self, agent_id):
         if not self.is_active[agent_id]:
             return False
diff --git a/pogema/grid_config.py b/pogema/grid_config.py
index 46f6458..78193af 100644
--- a/pogema/grid_config.py
+++ b/pogema/grid_config.py
@@ -1,31 +1,32 @@
 import sys
-from typing import Optional, Union
+from typing import Literal
+
 from pydantic import field_validator, model_validator
+
 from pogema.utils import CommonSettings
-from typing_extensions import Literal
 
 
 class GridConfig(CommonSettings):
     on_target: Literal['finish', 'nothing', 'restart'] = 'finish'
-    seed: Optional[int] = None
-    width: Optional[int] = None
-    height: Optional[int] = None
+    seed: int | None = None
+    width: int | None = None
+    height: int | None = None
     size: int = 8
     density: float = 0.3
     obs_radius: int = 5
-    agents_xy: Optional[list] = None
-    targets_xy: Optional[list] = None
-    num_agents: Optional[int] = None
-    possible_agents_xy: Optional[list] = None
-    possible_targets_xy: Optional[list] = None
+    agents_xy: list | None = None
+    targets_xy: list | None = None
+    num_agents: int | None = None
+    possible_agents_xy: list | None = None
+    possible_targets_xy: list | None = None
     collision_system: Literal['block_both', 'priority', 'soft'] = 'priority'
     persistent: bool = False
     observation_type: Literal['POMAPF', 'MAPF', 'default'] = 'default'
-    map: Optional[Union[list, str]] = None
-    map_name: Optional[str] = None
-    integration: Optional[Literal['SampleFactory', 'gymnasium', 'PettingZoo']] = None
+    map: list | str | None = None
+    map_name: str | None = None
+    integration: Literal['SampleFactory', 'gymnasium', 'PettingZoo'] | None = None
     max_episode_steps: int = 64
-    auto_reset: Optional[bool] = None
+    auto_reset: bool | None = None
 
     @model_validator(mode='before')
     @classmethod
diff --git a/pogema/integrations/make_pogema.py b/pogema/integrations/make_pogema.py
index 9bc37b4..a7d5fda 100644
--- a/pogema/integrations/make_pogema.py
+++ b/pogema/integrations/make_pogema.py
@@ -1,10 +1,9 @@
-from typing import Union, Optional
 
 from pogema import GridConfig
-from pogema.wrappers.base import PogemaWrapper
 from pogema.envs import _make_pogema
 from pogema.integrations.pettingzoo import parallel_env
 from pogema.integrations.sample_factory import AutoResetWrapper, IsMultiAgentWrapper, MetricsForwardingWrapper
+from pogema.wrappers.base import PogemaWrapper
 
 
 def _make_sample_factory_integration(grid_config):
@@ -23,7 +22,7 @@ def step(self, action):
             [action] + [self.env.action_space.sample() for _ in range(self.unwrapped.get_num_agents() - 1)])
         return observations[0], rewards[0], terminated[0], truncated[0], infos[0]
 
-    def reset(self, seed: Optional[int] = None, return_info: bool = True, options: Optional[dict] = None, ):
+    def reset(self, seed: int | None = None, return_info: bool = True, options: dict | None = None, ):
         observations, infos = self.env.reset()
         if return_info:
             return observations[0], infos[0]
@@ -31,14 +30,14 @@ def reset(self, seed: Optional[int] = None, return_info: bool = True, options: O
             return observations[0]
 
 
-def make_single_agent_gym(grid_config: Union[GridConfig, dict] = GridConfig()):
+def make_single_agent_gym(grid_config: GridConfig | dict = GridConfig()):
     env = _make_pogema(grid_config)
     env = SingleAgentWrapper(env)
 
     return env
 
 
-def make_pogema(grid_config: Union[GridConfig, dict] = GridConfig(), *args, **kwargs) -> PogemaWrapper:
+def make_pogema(grid_config: GridConfig | dict = GridConfig(), *args, **kwargs) -> PogemaWrapper:
     if isinstance(grid_config, dict):
         grid_config = GridConfig(**grid_config)
 
diff --git a/pogema/integrations/pettingzoo.py b/pogema/integrations/pettingzoo.py
index b2166bd..677469b 100644
--- a/pogema/integrations/pettingzoo.py
+++ b/pogema/integrations/pettingzoo.py
@@ -1,6 +1,7 @@
 import functools
 
 import numpy as np
+
 from pogema import GridConfig
 from pogema.envs import _make_pogema
 
@@ -23,12 +24,12 @@ def __init__(self, grid_config: GridConfig, render_mode='ansi'):
         self.agents = None
         self.num_moves = None
 
-    @functools.lru_cache(maxsize=None)
+    @functools.cache
     def observation_space(self, agent):
         assert agent in self.possible_agents
         return self.pogema.observation_space
 
-    @functools.lru_cache(maxsize=None)
+    @functools.cache
     def action_space(self, agent):
         assert agent in self.possible_agents
         return self.pogema.action_space
diff --git a/pogema/svg_animation/animation_drawer.py b/pogema/svg_animation/animation_drawer.py
index ff19ae1..150506a 100644
--- a/pogema/svg_animation/animation_drawer.py
+++ b/pogema/svg_animation/animation_drawer.py
@@ -3,17 +3,17 @@
 from dataclasses import dataclass
 
 from pogema import GridConfig
-from pogema.svg_animation.svg_objects import Line, RectangleHref, Animation, Circle, Rectangle
+from pogema.svg_animation.svg_objects import Animation, Circle, Line, Rectangle, RectangleHref
 
 
 @dataclass
 class AnimationConfig:
     directory: str = 'renders/'
     show_agents: bool = True
-    egocentric_idx: typing.Optional[int] = None
-    static_frame_idx: typing.Optional[int] = None
-    uid: typing.Optional[str] = None
-    save_every_idx_episode: typing.Optional[int] = 1
+    egocentric_idx: int | None = None
+    static_frame_idx: int | None = None
+    uid: str | None = None
+    save_every_idx_episode: int | None = 1
     show_grid_lines: bool = True
 
 
@@ -84,7 +84,7 @@ def render(self):
              width="{scaled_width}" height="{scaled_height}" viewBox="{" ".join(map(str, view_box))}">'''
 
         definitions = f'''
-        <rect id="obstacle" width="{self.svg_settings.r * 2}" height="{self.svg_settings.r * 2}" 
+        <rect id="obstacle" width="{self.svg_settings.r * 2}" height="{self.svg_settings.r * 2}"
             fill="{self.svg_settings.obstacle_color}" rx="{self.svg_settings.rx}"/>
         <style>
         .line {{stroke: {self.svg_settings.obstacle_color}; stroke-width: {self.svg_settings.stroke_width};}}
@@ -149,7 +149,7 @@ def fix_point(x, y, length):
     @staticmethod
     def check_in_radius(x1, y1, x2, y2, r) -> bool:
         return x2 - r <= x1 <= x2 + r and y2 - r <= y1 <= y2 + r
-    
+
     @staticmethod
     def create_grid_lines(grid_holder: GridHolder, render_width, render_height):
         gh = grid_holder
@@ -183,7 +183,7 @@ def create_field_of_view(grid_holder):
         )
 
         return result
-        
+
     def create_frame_view(self, grid_holder):
         gh: GridHolder = grid_holder
         frame_idx = gh.config.static_frame_idx
@@ -289,7 +289,7 @@ def animate_targets(self, targets, grid_holder):
             x_path = []
             y_path = []
 
-            for step_idx, state in enumerate(gh.history[target_idx]):
+            for _step_idx, state in enumerate(gh.history[target_idx]):
                 x, y = state.get_target_xy()
                 x_path.append(str(gh.svg_settings.draw_start + y * gh.svg_settings.scale_size))
                 y_path.append(str(-gh.svg_settings.draw_start + -(gh.width - x - 1) * gh.svg_settings.scale_size))
@@ -333,7 +333,7 @@ def create_static_obstacles(self, obstacles, grid_holder):
         result = []
         seen = set()
 
-        for step_idx, agent_state in enumerate(gh.history[gh.config.egocentric_idx][:frame_idx + 1]):
+        for _step_idx, agent_state in enumerate(gh.history[gh.config.egocentric_idx][:frame_idx + 1]):
             ego_x, ego_y = agent_state.get_xy()
             for i in range(gh.height):
                 for j in range(gh.width):
@@ -359,7 +359,7 @@ def create_static_obstacles(self, obstacles, grid_holder):
                     result.append(RectangleHref(**obs_settings))
 
         return result
-                        
+
     def animate_obstacles(self, obstacles, grid_holder):
         gh: GridHolder = grid_holder
         obstacle_idx = 0
@@ -371,7 +371,7 @@ def animate_obstacles(self, obstacles, grid_holder):
                     continue
                 opacity = []
                 seen = set()
-                for step_idx, agent_state in enumerate(gh.history[gh.config.egocentric_idx]):
+                for _step_idx, agent_state in enumerate(gh.history[gh.config.egocentric_idx]):
                     ego_x, ego_y = agent_state.get_xy()
                     if self.check_in_radius(x, y, ego_x, ego_y, grid_holder.obs_radius):
                         seen.add((x, y))
@@ -416,7 +416,7 @@ def create_static_agents(self, grid_holder):
         gh: GridHolder = grid_holder
         ego_idx = grid_holder.config.egocentric_idx
         frame_idx = grid_holder.config.static_frame_idx
-        
+
         static_positions = [state[frame_idx].get_xy() for state in grid_holder.history]
         for idx, (x, y) in enumerate(static_positions):
             circle_settings = {
diff --git a/pogema/svg_animation/animation_wrapper.py b/pogema/svg_animation/animation_wrapper.py
index 338d49b..857268b 100644
--- a/pogema/svg_animation/animation_wrapper.py
+++ b/pogema/svg_animation/animation_wrapper.py
@@ -3,8 +3,8 @@
 
 from pogema import GridConfig
 from pogema.svg_animation.animation_drawer import AnimationConfig
-from pogema.wrappers.base import PogemaWrapper
 from pogema.wrappers.animation import AnimationWrapper
+from pogema.wrappers.base import PogemaWrapper
 
 
 def _find_animation_wrapper(env):
@@ -87,7 +87,7 @@ def save_animation(self, name='render.svg', animation_config=None):
 
 
 def main():
-    from pogema import GridConfig, pogema_v0, BatchAStarAgent
+    from pogema import BatchAStarAgent, GridConfig, pogema_v0
 
     for egocentric_idx in [0, 1]:
         for on_target in ['nothing', 'restart', 'finish']:
diff --git a/pogema/utils.py b/pogema/utils.py
index 1b127cc..3a5d8fd 100644
--- a/pogema/utils.py
+++ b/pogema/utils.py
@@ -1,9 +1,8 @@
 import sys
+from typing import Literal
 
 from pydantic import BaseModel
 
-from typing_extensions import Literal
-
 
 class AgentsTargetsSizeError(Exception):
     pass
@@ -50,10 +49,11 @@ def render_grid(obstacles, positions_xy=None, targets_xy=None, is_active=None, m
             is_active = [True] * len(positions_xy)
         else:
             is_active = []
-    from io import StringIO
     import string
-    from gymnasium import utils as gym_utils
     from contextlib import closing
+    from io import StringIO
+
+    from gymnasium import utils as gym_utils
 
     outfile = StringIO() if mode == 'ansi' else sys.stdout
     chars = string.digits + string.ascii_letters + string.punctuation
@@ -73,9 +73,9 @@ def render_grid(obstacles, positions_xy=None, targets_xy=None, is_active=None, m
                     out += str(
                         gym_utils.colorize('|' + chars[finish_id % len(chars)] + '|', 'white', highlight=False))
                 else:
-                    out += str(gym_utils.colorize(str(' . '), 'white', highlight=False))
+                    out += str(gym_utils.colorize(' . ', 'white', highlight=False))
             else:
-                out += str(gym_utils.colorize(str('   '), 'cyan', bold=False, highlight=True))
+                out += str(gym_utils.colorize('   ', 'cyan', bold=False, highlight=True))
         out += '\n'
         outfile.write(out)
 
diff --git a/pogema/wrappers/animation.py b/pogema/wrappers/animation.py
index 3de14ff..01c49ec 100644
--- a/pogema/wrappers/animation.py
+++ b/pogema/wrappers/animation.py
@@ -1,9 +1,31 @@
+import os
 from itertools import cycle
 
 from pogema.wrappers.base import PogemaWrapper
 from pogema.wrappers.persistence import AgentState, decompress_history
 
 
+class SvgAnimation:
+    def __init__(self, svg_str):
+        self._svg_str = svg_str
+
+    def _repr_html_(self):
+        return self._svg_str
+
+    def save(self, path='render.svg'):
+        parent = os.path.dirname(path)
+        if parent:
+            os.makedirs(parent, exist_ok=True)
+        with open(path, "w") as f:
+            f.write(self._svg_str)
+
+    def __str__(self):
+        return self._svg_str
+
+    def __repr__(self):
+        return f"SvgAnimation({len(self._svg_str)} chars)"
+
+
 class AnimationWrapper(PogemaWrapper):
     def __init__(self, env):
         super().__init__(env)
@@ -55,7 +77,7 @@ def disable_animation(self):
     def animation_is_active(self):
         return self._active
 
-    def save_animation(self, name='render.svg', animation_config=None):
+    def _build_svg_string(self, animation_config=None):
         if not self._active:
             raise RuntimeError(
                 "Animation is not active. Call env.enable_animation() and then env.reset() before saving."
@@ -65,7 +87,7 @@ def save_animation(self, name='render.svg', animation_config=None):
                 "No history recorded. Call env.reset() after enable_animation() before saving."
             )
 
-        from pogema.svg_animation.animation_drawer import AnimationConfig, SvgSettings, GridHolder, AnimationDrawer
+        from pogema.svg_animation.animation_drawer import AnimationConfig, AnimationDrawer, GridHolder, SvgSettings
 
         if animation_config is None:
             animation_config = self._animation_config
@@ -120,5 +142,10 @@ def save_animation(self, name='render.svg', animation_config=None):
         )
 
         animation = AnimationDrawer().create_animation(grid_holder)
-        with open(name, "w") as f:
-            f.write(animation.render())
+        return animation.render()
+
+    def render_animation(self, animation_config=None):
+        return SvgAnimation(self._build_svg_string(animation_config=animation_config))
+
+    def save_animation(self, name='render.svg', animation_config=None):
+        self.render_animation(animation_config=animation_config).save(name)
diff --git a/pogema/wrappers/base.py b/pogema/wrappers/base.py
index 98c9141..517f684 100644
--- a/pogema/wrappers/base.py
+++ b/pogema/wrappers/base.py
@@ -19,7 +19,7 @@
     # PogemaLifeLong
     'get_lifelong_targets_xy',
     # AnimationWrapper
-    'enable_animation', 'disable_animation', 'save_animation', 'animation_is_active',
+    'enable_animation', 'disable_animation', 'save_animation', 'render_animation', 'animation_is_active',
 })
 
 
@@ -95,6 +95,9 @@ def disable_animation(self):
     def save_animation(self, name='render.svg', animation_config=None):
         return self.env.save_animation(name, animation_config=animation_config)
 
+    def render_animation(self, animation_config=None):
+        return self.env.render_animation(animation_config=animation_config)
+
     @property
     def animation_is_active(self):
         return self.env.animation_is_active
diff --git a/pogema/wrappers/metrics.py b/pogema/wrappers/metrics.py
index bb095ab..453106d 100644
--- a/pogema/wrappers/metrics.py
+++ b/pogema/wrappers/metrics.py
@@ -37,7 +37,7 @@ def __init__(self, env):
         self._solved_instances = 0
 
     def _compute_stats(self, step, is_on_goal, finished):
-        for agent_idx, on_goal in enumerate(is_on_goal):
+        for _agent_idx, on_goal in enumerate(is_on_goal):
             if on_goal:
                 self._solved_instances += 1
         if finished:
diff --git a/pyproject.toml b/pyproject.toml
index bc282a6..7612d16 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -25,13 +25,13 @@ dependencies = [
     "gymnasium>=1.2.3",
     "numpy>=2.0",
     "pydantic>=2.12.5",
-    "pettingzoo>=1.24.0,<1.25.0"
+    "pettingzoo>=1.24.0,<2.0.0",
 ]
 urls = { "Homepage" = "https://github.com/Cognitive-AI-Systems/pogema" }
 
 [project.optional-dependencies]
-test = ["pytest", "pytest-cov", "tabulate"]
-dev = ["ruff", "pytest", "pytest-cov", "tabulate"]
+test = ["pytest", "pytest-cov", "tabulate", "pytest-codeblocks[test]>=0.17.0"]
+dev = ["pogema[test]", "ruff"]
 
 [tool.hatch.version]
 path = "pogema/__init__.py"
@@ -49,5 +49,12 @@ testpaths = ["tests"]
 line-length = 127
 
 [tool.ruff.lint]
-select = ["E", "F"]
-ignore = []
+select = ["E", "F", "W", "I", "UP", "B"]
+ignore = [
+    "B008",  # function calls in argument defaults (e.g. GridConfig()) — intentional for Pydantic/dataclass defaults
+    "B905",  # zip() without strict= — not needed for same-length iterables
+    "B019",  # functools.cache on methods — required by PettingZoo API
+]
+
+[tool.ruff.lint.per-file-ignores]
+"pogema/__init__.py" = ["I001"]  # import order constrained by circular import
diff --git a/tests/test_deterministic_policy.py b/tests/test_deterministic_policy.py
index 639fcc1..7d5650b 100644
--- a/tests/test_deterministic_policy.py
+++ b/tests/test_deterministic_policy.py
@@ -1,5 +1,7 @@
-import numpy as np
 from heapq import heappop, heappush
+
+import numpy as np
+
 from pogema import GridConfig, pogema_v0
 
 INF = 1000000007
@@ -116,7 +118,7 @@ def act(self, obs) -> list:
             self.agents[k].update_path(start, goal)
             next_node = self.agents[k].get_next_node()
             actions.append(self.actions[(next_node[0] - start[0], next_node[1] - start[1])])
-        for idx, action in enumerate(actions):
+        for idx, _action in enumerate(actions):
             if self._rnd.random() < self._random_rate:
                 actions[idx] = self._rnd.randint(1, 4)
         return actions
@@ -144,7 +146,7 @@ def test_life_long():
     assert np.isclose(metrics['avg_throughput'], 1.671875)
     metrics = results_generator.__next__()
     assert np.isclose(metrics['avg_throughput'], 1.609375)
-    
+
     gc = GridConfig(num_agents=24, size=8, obs_radius=4, seed=43, max_episode_steps=64, on_target='restart')
     results_generator = run_policy(gc)
 
diff --git a/tests/test_grid.py b/tests/test_grid.py
index 6b214cd..cab93ac 100644
--- a/tests/test_grid.py
+++ b/tests/test_grid.py
@@ -1,10 +1,9 @@
 import numpy as np
+import pytest
 from pydantic import ValidationError
 
 from pogema import GridConfig
 from pogema.grid import Grid
-import pytest
-
 from pogema.integrations.make_pogema import pogema_v0
 
 
@@ -291,10 +290,10 @@ def test_rectangular_grid_mixed_config():
 def test_rectangular_grid_validation():
     with pytest.raises(ValueError):
         GridConfig(width=12)
-    
+
     with pytest.raises(ValueError):
         GridConfig(height=8)
-    
+
     GridConfig(width=12, height=8)
     GridConfig(size=10)
     GridConfig(size=10, width=12, height=8)
@@ -304,10 +303,10 @@ def test_rectangular_grid_position_validation():
     config = GridConfig(width=12, height=8, agents_xy=[[0, 11], [7, 0]], targets_xy=[[7, 11], [0, 0]])
     assert len(config.agents_xy) == 2
     assert len(config.targets_xy) == 2
-    
+
     with pytest.raises(IndexError):
         GridConfig(width=12, height=8, agents_xy=[[8, 0]], targets_xy=[[0, 0]])
-    
+
     with pytest.raises(IndexError):
         GridConfig(width=12, height=8, agents_xy=[[0, 12]], targets_xy=[[0, 0]])
 
@@ -315,7 +314,7 @@ def test_rectangular_grid_position_validation():
 def test_rectangular_grid_creation():
     config = GridConfig(width=12, height=8, seed=1, num_agents=2)
     grid = Grid(config)
-    
+
     assert np.isclose(grid.config.width, 12)
     assert np.isclose(grid.config.height, 8)
     assert np.isclose(grid.config.size, 12)
@@ -333,42 +332,42 @@ def test_goal_sequences_validation():
     assert np.isclose(len(config.targets_xy), 2)
     assert np.isclose(len(config.targets_xy[0]), 3)
     assert np.isclose(len(config.targets_xy[1]), 2)
-    
+
     config = GridConfig(
         width=8, height=8,
         agents_xy=[[0, 0], [1, 1]],
         targets_xy=[[7, 7], [6, 6]]
     )
     assert np.isclose(len(config.targets_xy), 2)
-    
+
     with pytest.raises(ValueError):
         GridConfig(
             width=8, height=8,
             agents_xy=[[0, 0], [1, 1]],
             targets_xy=[[[2, 2], [3, 3]], [4, 4]]
         )
-    
+
     with pytest.raises(ValueError):
         GridConfig(
             width=8, height=8,
             agents_xy=[[0, 0]],
             targets_xy=[[[2, 2]]]
         )
-    
+
     with pytest.raises(ValueError):
         GridConfig(
             width=8, height=8,
             agents_xy=[[0, 0]],
             targets_xy=[[[2.5, 2], [3, 3]]]
         )
-    
+
     with pytest.raises(IndexError):
         GridConfig(
             width=8, height=8,
             agents_xy=[[0, 0]],
             targets_xy=[[[2, 2], [10, 10]]]
         )
-    
+
     with pytest.raises(ValueError, match="on_target='restart' requires goal sequences"):
         GridConfig(
             width=8, height=8,
@@ -387,20 +386,21 @@ def test_grid_with_goal_sequences():
             [[2, 4], [3, 5]]
         ]
     )
-    
+
     grid = Grid(config)
-    
+
     expected_initial_targets = [[2, 2], [2, 4]]
     r = config.obs_radius
     expected_with_offset = [(x + r, y + r) for x, y in expected_initial_targets]
-    
+
     assert np.isclose(grid.finishes_xy, expected_with_offset).all()
 
 
 def test_pogema_lifelong_with_sequences():
-    from pogema.envs import PogemaLifeLong
     import warnings
 
+    from pogema.envs import PogemaLifeLong
+
     config = GridConfig(
         width=8, height=8, density=0,
         agents_xy=[[1, 1], [1, 2]],
@@ -410,34 +410,34 @@ def test_pogema_lifelong_with_sequences():
         ],
         on_target='restart'
     )
-    
+
     env = PogemaLifeLong(grid_config=config)
     env.reset()
-    
+
     assert env.has_custom_sequences is True
     assert np.isclose(env.current_goal_indices, [0, 0]).all()
-    
+
     with warnings.catch_warnings(record=True) as w:
         warnings.simplefilter("always")
-        
+
         env._generate_new_target(0)
         assert np.isclose(env.current_goal_indices[0], 1)
-        
+
         env._generate_new_target(0)
         assert np.isclose(env.current_goal_indices[0], 2)
-        
+
         env._generate_new_target(0)
         assert np.isclose(env.current_goal_indices[0], 0)
-        
+
         cycling_warnings = [warning for warning in w if "completed all 3 provided targets" in str(warning.message)]
         assert np.isclose(len(cycling_warnings), 1)
-    
+
     with warnings.catch_warnings(record=True) as w:
         warnings.simplefilter("always")
-        
+
         env._generate_new_target(1)
         env._generate_new_target(1)
-        
+
         assert np.isclose(len(w), 1)
         assert "completed all 2 provided targets" in str(w[0].message)
         assert "cycling back to the beginning" in str(w[0].message)
@@ -445,7 +445,7 @@ def test_pogema_lifelong_with_sequences():
 
 def test_pogema_lifelong_reset():
     from pogema.envs import PogemaLifeLong
-    
+
     config = GridConfig(
         width=8, height=8,
         agents_xy=[[1, 1], [1, 2]],
@@ -455,32 +455,32 @@ def test_pogema_lifelong_reset():
         ],
         on_target='restart'
     )
-    
+
     env = PogemaLifeLong(grid_config=config)
     env.reset()
-    
+
     env._generate_new_target(0)
     env._generate_new_target(1)
     assert np.isclose(env.current_goal_indices, [1, 1]).all()
-    
+
     env.reset()
     assert np.isclose(env.current_goal_indices, [0, 0]).all()
 
 
 def test_pogema_lifelong_without_sequences():
     from pogema.envs import PogemaLifeLong
-    
+
     config = GridConfig(
         width=8, height=8,
         num_agents=2,
         on_target='restart'
     )
-    
+
     env = PogemaLifeLong(grid_config=config)
     env.reset()
-    
+
     assert env.has_custom_sequences is False
-    
+
     target = env._generate_new_target(0)
     assert isinstance(target, tuple)
     assert np.isclose(len(target), 2)
@@ -493,7 +493,7 @@ def test_goal_sequences_position_format():
             agents_xy=[[0, 0]],
             targets_xy=[[[2, 2, 3], [4, 4]]]
         )
-    
+
     with pytest.raises(ValueError, match="Position coordinates must be integers"):
         GridConfig(
             width=8, height=8,
diff --git a/tests/test_pogema_env.py b/tests/test_pogema_env.py
index 6edad88..b940d08 100644
--- a/tests/test_pogema_env.py
+++ b/tests/test_pogema_env.py
@@ -6,8 +6,7 @@
 import pytest
 from tabulate import tabulate
 
-from pogema import pogema_v0, AnimationMonitor, AnimationConfig
-
+from pogema import AnimationConfig, AnimationMonitor, SvgAnimation, pogema_v0
 from pogema.envs import ActionsSampler
 from pogema.grid import GridConfig
 from pogema.wrappers.persistence import PersistentWrapper
@@ -218,7 +217,7 @@ def test_persistent_env(num_steps=100):
     def state_repr(observations, rewards, terminates, truncates, infos):
         return np.concatenate([np.array(observations).flatten(), terminates, truncates, np.array(rewards), ])
 
-    for current_step in range(num_steps):
+    for _current_step in range(num_steps):
         actions = action_sampler.sample_actions(dim=env.unwrapped.get_num_agents())
         obs, reward, terminated, truncated, info = env.step(actions)
 
@@ -227,7 +226,7 @@ def state_repr(observations, rewards, terminates, truncates, infos):
             break
 
     # resetting the environment to the initial state using backward steps
-    for current_step in range(num_steps):
+    for _current_step in range(num_steps):
         if not env.step_back():
             break
 
@@ -259,7 +258,7 @@ def test_wrapper_attribute_forwarding():
         assert env.get_targets_xy() is not None
 
         with pytest.raises(AttributeError):
-            env.nonexistent_attribute_xyz
+            _ = env.nonexistent_attribute_xyz
 
 
 def test_wrapper_forwarding_persistent():
@@ -283,22 +282,6 @@ def test_wrapper_forwarding_animation():
     assert env.grid_config is not None
 
 
-def test_steps_per_second_throughput():
-    table = []
-    for on_target in ['finish', 'nothing', 'restart']:
-        for num_agents in [1, 32, 64]:
-            for size in [32, 64]:
-                gc = GridConfig(obs_radius=5, seed=42, max_episode_steps=1024,
-                              size=size, num_agents=num_agents, on_target=on_target)
-
-                start_time = time.monotonic()
-                run_episode(grid_config=gc)
-                end_time = time.monotonic()
-                steps_per_second = gc.max_episode_steps / (end_time - start_time)
-                table.append([on_target, num_agents, size, steps_per_second * gc.num_agents])
-    print('\n' + tabulate(table, headers=['on_target', 'num_agents', 'size', 'SPS (individual)'], tablefmt='grid'))
-
-
 def test_enable_animation_and_save(tmp_path):
     gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
     env = pogema_v0(gc)
@@ -373,3 +356,80 @@ def test_enable_animation_for_all_on_target_modes(tmp_path):
         svg_path = str(tmp_path / f'test_{on_target}.svg')
         env.save_animation(svg_path)
         assert os.path.exists(svg_path)
+
+
+def test_render_animation_returns_svg_animation():
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.enable_animation()
+    env.reset()
+    run_episode(env=env)
+
+    anim = env.render_animation()
+    assert isinstance(anim, SvgAnimation)
+    assert '<svg' in str(anim)
+    assert '<svg' in anim._repr_html_()
+    assert 'SvgAnimation(' in repr(anim)
+
+
+def test_render_animation_save(tmp_path):
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.enable_animation()
+    env.reset()
+    run_episode(env=env)
+
+    anim = env.render_animation()
+    nested_path = str(tmp_path / 'nested' / 'dirs' / 'out.svg')
+    anim.save(nested_path)
+    assert os.path.exists(nested_path)
+    with open(nested_path) as f:
+        assert '<svg' in f.read()
+
+
+def test_render_animation_without_enable_raises():
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.reset()
+    with pytest.raises(RuntimeError, match="Animation is not active"):
+        env.render_animation()
+
+
+def test_save_animation_creates_parent_dirs(tmp_path):
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.enable_animation()
+    env.reset()
+    run_episode(env=env)
+
+    svg_path = str(tmp_path / 'auto' / 'created' / 'render.svg')
+    env.save_animation(svg_path)
+    assert os.path.exists(svg_path)
+
+
+def test_render_animation_with_config():
+    gc = GridConfig(num_agents=2, size=6, obs_radius=2, density=0.3, seed=42, on_target='finish')
+    env = pogema_v0(gc)
+    env.enable_animation()
+    env.reset()
+    run_episode(env=env)
+
+    anim = env.render_animation(animation_config=AnimationConfig(egocentric_idx=0))
+    assert isinstance(anim, SvgAnimation)
+    assert '<svg' in str(anim)
+
+
+def test_steps_per_second_throughput():
+    table = []
+    for on_target in ['finish', 'nothing', 'restart']:
+        for num_agents in [1, 32, 64]:
+            for size in [32, 64]:
+                gc = GridConfig(obs_radius=5, seed=42, max_episode_steps=1024,
+                              size=size, num_agents=num_agents, on_target=on_target)
+
+                start_time = time.monotonic()
+                run_episode(grid_config=gc)
+                end_time = time.monotonic()
+                steps_per_second = gc.max_episode_steps / (end_time - start_time)
+                table.append([on_target, num_agents, size, steps_per_second * gc.num_agents])
+    print('\n' + tabulate(table, headers=['on_target', 'num_agents', 'size', 'SPS (individual)'], tablefmt='grid'))

From 3551c1a68360ae098c9f0dc8fcaf58a7aaff73c9 Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Mon, 2 Mar 2026 00:50:55 +0300
Subject: [PATCH 10/15] minor fix for version history

---
 version_history.MD | 92 +++++++++++++++++++++++-----------------------
 1 file changed, 46 insertions(+), 46 deletions(-)

diff --git a/version_history.MD b/version_history.MD
index 8e10994..7ed43b5 100644
--- a/version_history.MD
+++ b/version_history.MD
@@ -1,105 +1,105 @@
 The development history of POGEMA, starting from version 1.0.0.
 
 Version 1.4.X (August, 2025)
-	•	Added support of custom targets_xy for lifelong MAPF.
-	•	Improved work with rectangular grids. Added width and height attributes to GridConfig.
-	•	Added method update_config to properly update all attributes of GridConfig.
-	•	Added more tests for new features - custom targets_xy and width/height attributes.
+- Added support for custom targets_xy in lifelong MAPF.
+- Improved handling of rectangular grids. Added width and height attributes to GridConfig.
+- Added the update_config method to properly update all attributes of GridConfig.
+- Added more tests for the new features: custom targets_xy and width/height attributes.
 
 Version 1.4.0 (April 5, 2025)
-	•	Extended limits for size of maps and number of agents.
-	•	Fixed ep_length value.
-	•	Updated some tests.
+- Extended limits for size of maps and number of agents.
+- Fixed ep_length value.
+- Updated some tests.
 
 Version 1.3.0 (June 13, 2024)
 
-	•	Updates for integration with newer version of gymnasium.
-	•	Refactored AgentsDensityWrapper for modularity and clarity.
-	•	Introduced RuntimeMetricWrapper for runtime monitoring.
-	•	Enhanced map generation methods and added new metrics like SOC_Makespan.
-	•	Animation improvements for better visualization.
+- Updated the integration for a newer version of gymnasium.
+- Refactored AgentsDensityWrapper for modularity and clarity.
+- Introduced RuntimeMetricWrapper for runtime monitoring.
+- Enhanced map generation methods and added new metrics like SOC_Makespan.
+- Animation improvements for better visualization.
 
 Version 1.2.2 (September 22, 2023)
 
-	•	Implemented soft collision handling for agent interactions.
-	•	Improved lifelong scenario seeding for consistent agent behavior.
-	•	Enhanced metric logging for better integration with PyMARL.
+- Implemented soft collision handling for agent interactions.
+- Improved lifelong scenario seeding for consistent agent behavior.
+- Enhanced metric logging for better integration with PyMARL.
 
 Version 1.2.0 (August 30, 2023)
 
-	•	Fixed import issues with Literal and animation issues.
-	•	Improved visualizations, including grid lines and border toggles.
+- Fixed import issues with Literal and animation issues.
+- Improved visualizations, including grid lines and border toggles.
 
 Version 1.1.0 (March 30, 2023)
 
-	•	Updated dependencies for gymnasium and PettingZoo.
-	•	Added an option to remove animation borders for cleaner outputs.
-	•	Fixed animation bugs for stuck agents.
+- Updated dependencies for gymnasium and PettingZoo.
+- Added an option to remove animation borders for cleaner outputs.
+- Fixed animation bugs for stuck agents.
 
 Version 1.0.0 (February 2023)
 
-	•	Launched core features, including A* policy implementations* and CI/CD support.
-	•	Introduced basic visualization and fixed animation bugs.
+- Launched core features, including A* policy implementations and CI/CD support.
+- Introduced basic visualization and fixed animation bugs.
 
 Post-Version Updates
 
-	•	Adjusted the number of agents in setups.
-	•	Updated package metadata for better compatibility.
-	•	Addressed legacy issues and improved benchmark generation.
+- Adjusted the number of agents in setups.
+- Updated package metadata for better compatibility.
+- Addressed legacy issues and improved benchmark generation.
 
 Version 1.1.6 (February 21, 2023)
 
-	•	Fixed static animation issues and added grid object rendering.
+- Fixed static animation issues and added grid object rendering.
 
 Version 1.1.5 (December 28, 2022)
 
-	•	Fixed Python 3.7 compatibility issues and added map registries for better management.
-	•	Introduced an attrition metric.
+- Fixed Python 3.7 compatibility issues and added map registries for better management.
+- Introduced an attrition metric.
 
 Version 1.1.4 (November 18, 2022)
 
-	•	Fixed flake8 warnings for improved code quality.
+- Fixed flake8 warnings for improved code quality.
 
 Version 1.1.3 (October 28, 2022)
 
-	•	Corrected random seed initialization for PogemaLifeLong.
-	•	Optimized animation behavior.
+- Corrected random seed initialization for PogemaLifeLong.
+- Optimized animation behavior.
 
 Version 1.1.2 (October 5, 2022)
 
-	•	Upgraded SVG animations for better compression.
+- Upgraded SVG animations for better compression.
 
 Version 1.1.1 (August 30, 2022)
 
-	•	Added map_name attributes for clearer references.
-	•	Implemented new observation types (MAPF, POMAPF) and enhanced metrics aggregation.
+- Added map_name attributes for clearer references.
+- Implemented new observation types (MAPF, POMAPF) and enhanced metrics aggregation.
 
 Version 1.0.x and Earlier
 
-	•	Introduced cooperative reward wrappers and lifelong environment versions.
-	•	Dropped Python 3.6 support and refined animation handling.
+- Introduced cooperative reward wrappers and lifelong environment versions.
+- Dropped Python 3.6 support and refined animation handling.
 
 Version 1.0.3 (June 29, 2022)
 
-	•	Fixed rendering issues for inactive agents.
+- Fixed rendering issues for inactive agents.
 
 Version 1.0.2 (June 27, 2022)
 
-	•	Enhanced customization for agent and target positions.
+- Enhanced customization for agent and target positions.
 
 Pre-1.0.2 Development (June 2022)
 
-	•	Improved tests, refactored code, and removed unnecessary dependencies.
+- Improved tests, refactored code, and removed unnecessary dependencies.
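-    •	Introduced the PogemaLifeLong class with target generation and metrics tailored for lifelong scenarios.
+- Introduced the PogemaLifeLong class with target generation and metrics tailored for lifelong scenarios.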
-	•	Introduced customizable map rules and agent/target positions.
-	•	Simplified installation by removing unnecessary dependencies.
+- Introduced customizable map rules and agent/target positions.
+- Simplified installation by removing unnecessary dependencies.
 
 
 Version 1.0.0 (March 31, 2022)
 
-	•	Added predefined configurations for grid environments and improved visualization.
-	•	Integrated PettingZoo support and enhanced usability with better examples.
-	•	Introduced grid_config class for environment configuration and improved state management.
-	•	Added methods for relative position observations and fixed PettingZoo compatibility.
-	•	Documentation improvements for better user guidance.
+- Added predefined configurations for grid environments and improved visualization.
+- Integrated PettingZoo support and enhanced usability with better examples.
+- Introduced grid_config class for environment configuration and improved state management.
+- Added methods for relative position observations and fixed PettingZoo compatibility.
+- Documentation improvements for better user guidance.
 

From da35a26cfd4c494401c897e2a8706bceb747d69d Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Mon, 2 Mar 2026 01:11:16 +0300
Subject: [PATCH 11/15] refactoring: proper exceptions, seed handling, metric resets, typed GridConfig
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Replace assert with raise ValueError in all validators (safe under python -O)
- Fix SingleAgentWrapper.reset() silently dropping seed parameter
- Fix wrong exception types: KeyError/OverflowError → ValueError across codebase
- Add reset() to metric wrappers to clear stale state on mid-episode reset
- Fix ActionsSampler seed not updating on reset(seed=...)
- Improve error messages (typos, unclear bounds notation, missing guidance)
- Add Field(description=...) and parameterized type hints to all GridConfig fields
- Add __repr__ to PogemaWrapper showing config summary
- Export missing public classes in __all__ (metrics, MultiTimeLimit, register_grid, etc.)
- Raise dimension limit from 4096 to 8,388,608 (2^23)
- Fix old-style type hint (int, int) → tuple[int, int] in a_star_policy.py

---
 pogema/__init__.py                 |  31 ++++++--
 pogema/a_star_policy.py            |   7 +-
 pogema/envs.py                     |   5 +-
 pogema/generator.py                |   4 +-
 pogema/grid.py                     |   9 ++-
 pogema/grid_config.py              | 120 +++++++++++++++++++----------
 pogema/integrations/make_pogema.py |   7 +-
 pogema/integrations/pettingzoo.py  |   9 ++-
 pogema/wrappers/base.py            |  10 +++
 pogema/wrappers/metrics.py         |  24 ++++++
 tests/test_grid.py                 |  24 +++---
 11 files changed, 178 insertions(+), 72 deletions(-)

diff --git a/pogema/__init__.py b/pogema/__init__.py
index 4d02a63..177bd3e 100644
--- a/pogema/__init__.py
+++ b/pogema/__init__.py
@@ -2,11 +2,25 @@
 
 from pogema.grid_config import GridConfig
 from pogema.a_star_policy import AStarAgent, BatchAStarAgent
-from pogema.integrations.make_pogema import pogema_v0
+from pogema.integrations.make_pogema import pogema_v0, SingleAgentWrapper
+from pogema.grid_registry import register_grid, get_grid
 from pogema.svg_animation.animation_drawer import AnimationConfig
 from pogema.svg_animation.animation_wrapper import AnimationMonitor
 from pogema.wrappers.animation import AnimationWrapper, SvgAnimation
 from pogema.wrappers.base import PogemaWrapper
+from pogema.wrappers.metrics import (
+    CSRMetric,
+    ISRMetric,
+    EpLengthMetric,
+    NonDisappearCSRMetric,
+    NonDisappearISRMetric,
+    NonDisappearEpLengthMetric,
+    SumOfCostsAndMakespanMetric,
+    LifeLongAverageThroughputMetric,
+    AgentsDensityWrapper,
+    RuntimeMetricWrapper,
+)
+from pogema.wrappers.multi_time_limit import MultiTimeLimit
 from pogema.wrappers.persistence import PersistentWrapper
 
 __version__ = '1.4.0'
@@ -17,10 +31,17 @@
     'AnimationMonitor',
     'AnimationConfig',
     'AStarAgent', 'BatchAStarAgent',
-    "PogemaWrapper",
-    "AnimationWrapper",
-    "SvgAnimation",
-    "PersistentWrapper",
+    'PogemaWrapper',
+    'AnimationWrapper',
+    'SvgAnimation',
+    'PersistentWrapper',
+    'SingleAgentWrapper',
+    'MultiTimeLimit',
+    'register_grid', 'get_grid',
+    'CSRMetric', 'ISRMetric', 'EpLengthMetric',
+    'NonDisappearCSRMetric', 'NonDisappearISRMetric', 'NonDisappearEpLengthMetric',
+    'SumOfCostsAndMakespanMetric', 'LifeLongAverageThroughputMetric',
+    'AgentsDensityWrapper', 'RuntimeMetricWrapper',
 ]
 
 register(
diff --git a/pogema/a_star_policy.py b/pogema/a_star_policy.py
index 294c8b8..31ecb64 100644
--- a/pogema/a_star_policy.py
+++ b/pogema/a_star_policy.py
@@ -42,7 +42,7 @@ def is_obstacle(self, x, y):
 
 
 class Node:
-    def __init__(self, coord: (int, int) = (INF, INF), g: int = 0, h: int = 0):
+    def __init__(self, coord: tuple[int, int] = (INF, INF), g: int = 0, h: int = 0):
         self.i, self.j = coord
         self.g = g
         self.h = h
@@ -104,7 +104,10 @@ def act(self, obs):
 
 
         if self._saved_xy is not None and h(self._saved_xy, xy) > 1:
-            raise IndexError("Agent moved more than 1 step. Please, call clear_state method before new episode.")
+            raise IndexError(
+                "Agent moved more than 1 step between calls to act(). "
+                "This usually means a new episode started. Call agent.clear_state() before each new episode."
+            )
         if self._saved_xy is not None and h(self._saved_xy, xy) == 0 and xy != target_xy:
             return self._rnd.integers(len(self._moves))
         self._gm.update(*xy, obstacles)
diff --git a/pogema/envs.py b/pogema/envs.py
index e4fa9d9..cd11847 100644
--- a/pogema/envs.py
+++ b/pogema/envs.py
@@ -168,6 +168,7 @@ def update_was_on_goal(self):
     def reset(self, seed: int | None = None, return_info: bool = True, options: dict | None = None, ):
         if seed is not None:
             self.grid_config.seed = seed
+            self._multi_action_sampler.update_seed(seed)
         self._initialize_grid()
         self.update_was_on_goal()
 
@@ -468,7 +469,7 @@ def _make_pogema(grid_config):
     elif grid_config.on_target == 'finish':
         env = Pogema(grid_config=grid_config)
     else:
-        raise KeyError(f'Unknown on_target option: {grid_config.on_target}')
+        raise ValueError(f"Unknown on_target option: '{grid_config.on_target}'. Must be 'finish', 'nothing', or 'restart'.")
 
     env = MultiTimeLimit(env, grid_config.max_episode_steps)
     env = AnimationWrapper(env)
@@ -494,6 +495,6 @@ def _make_pogema(grid_config):
         env = CSRMetric(env)
         env = EpLengthMetric(env)
     else:
-        raise KeyError(f'Unknown on_target option: {grid_config.on_target}')
+        raise ValueError(f"Unknown on_target option: '{grid_config.on_target}'. Must be 'finish', 'nothing', or 'restart'.")
 
     return env
diff --git a/pogema/generator.py b/pogema/generator.py
index 25d4c52..c8278d7 100644
--- a/pogema/generator.py
+++ b/pogema/generator.py
@@ -106,7 +106,9 @@ def placing(order, components, grid, start_id, num_agents):
 def generate_from_possible_positions(grid_config: GridConfig):
     if (len(grid_config.possible_agents_xy) < grid_config.num_agents or
             len(grid_config.possible_targets_xy) < grid_config.num_agents):
-        raise OverflowError(f"Can't create task. Not enough possible positions for {grid_config.num_agents} agents.")
+        raise ValueError(f"Can't create task. Not enough possible positions for {grid_config.num_agents} agents. "
+                         f"Available: {len(grid_config.possible_agents_xy)} agent positions, "
+                         f"{len(grid_config.possible_targets_xy)} target positions.")
     rng = np.random.default_rng(grid_config.seed)
     rng.shuffle(grid_config.possible_agents_xy)
     rng.shuffle(grid_config.possible_targets_xy)
diff --git a/pogema/grid.py b/pogema/grid.py
index ed344bf..d600a14 100644
--- a/pogema/grid.py
+++ b/pogema/grid.py
@@ -69,8 +69,9 @@ def __init__(self, grid_config: GridConfig, add_artificial_border: bool = True,
                 self.starts_xy, self.finishes_xy = generate_positions_and_targets_fast(self.obstacles, self.config)
 
         if not self.starts_xy or not self.finishes_xy or len(self.starts_xy) != len(self.finishes_xy):
-            raise OverflowError(
-                "Can't create task. Please check grid grid_config, especially density, num_agent and map.")
+            raise ValueError(
+                "Can't create task. Not enough free cells to place all agents and targets. "
+                "Try reducing density, num_agents, or using a larger map.")
 
         if add_artificial_border:
             self.add_artificial_border()
@@ -244,7 +245,7 @@ def render(self, mode='human', border='thin'):
 
     def move_agent_to_cell(self, agent_id, x, y):
         if self.positions[self.positions_xy[agent_id]] == self.config.FREE:
-            raise KeyError(f"Agent {agent_id} is not in the map")
+            raise ValueError(f"Agent {agent_id} is not in the map")
         self.positions[self.positions_xy[agent_id]] = self.config.FREE
         if self.obstacles[x, y] != self.config.FREE or self.positions[x, y] != self.config.FREE:
             raise ValueError(f"Can't force agent to blocked position {x} {y}")
@@ -290,7 +291,7 @@ def show_agent(self, agent_id):
 
         self.is_active[agent_id] = True
         if self.positions[self.positions_xy[agent_id]] == self.config.OBSTACLE:
-            raise KeyError("The cell is already occupied")
+            raise ValueError("The cell is already occupied")
         self.positions[self.positions_xy[agent_id]] = self.config.OBSTACLE
         return True
 
diff --git a/pogema/grid_config.py b/pogema/grid_config.py
index 78193af..cb39503 100644
--- a/pogema/grid_config.py
+++ b/pogema/grid_config.py
@@ -1,32 +1,64 @@
 import sys
 from typing import Literal
 
-from pydantic import field_validator, model_validator
+from pydantic import Field, field_validator, model_validator
 
 from pogema.utils import CommonSettings
 
 
 class GridConfig(CommonSettings):
-    on_target: Literal['finish', 'nothing', 'restart'] = 'finish'
-    seed: int | None = None
-    width: int | None = None
-    height: int | None = None
-    size: int = 8
-    density: float = 0.3
-    obs_radius: int = 5
-    agents_xy: list | None = None
-    targets_xy: list | None = None
-    num_agents: int | None = None
-    possible_agents_xy: list | None = None
-    possible_targets_xy: list | None = None
-    collision_system: Literal['block_both', 'priority', 'soft'] = 'priority'
-    persistent: bool = False
-    observation_type: Literal['POMAPF', 'MAPF', 'default'] = 'default'
-    map: list | str | None = None
-    map_name: str | None = None
-    integration: Literal['SampleFactory', 'gymnasium', 'PettingZoo'] | None = None
-    max_episode_steps: int = 64
-    auto_reset: bool | None = None
+    on_target: Literal['finish', 'nothing', 'restart'] = Field(
+        'finish',
+        description="Behavior when agent reaches target: "
+                    "'finish' (agent disappears), 'nothing' (agent stays, all must reach simultaneously), "
+                    "'restart' (agent gets new target, lifelong MAPF).",
+    )
+    seed: int | None = Field(None, description="Random seed for reproducibility.")
+    width: int | None = Field(None, description="Grid width. Must be paired with height.")
+    height: int | None = Field(None, description="Grid height. Must be paired with width.")
+    size: int = Field(8, description="Grid size (used as both width and height when they are not set).")
+    density: float = Field(0.3, description="Obstacle density in [0, 1] for random map generation.")
+    obs_radius: int = Field(
+        5, description="Observation radius. Each agent sees a (2*obs_radius+1) x (2*obs_radius+1) window.",
+    )
+    agents_xy: list[list[int]] | None = Field(
+        None, description="Fixed agent start positions as [[row, col], ...].",
+    )
+    targets_xy: list[list[int]] | list[list[list[int]]] | None = Field(
+        None,
+        description="Target positions: [[row, col], ...] for single targets, "
+                    "or [[[r1,c1],[r2,c2],...], ...] for goal sequences (lifelong MAPF).",
+    )
+    num_agents: int | None = Field(None, description="Number of agents. Auto-inferred from agents_xy or map if not set.")
+    possible_agents_xy: list[list[int]] | None = Field(
+        None, description="Pool of positions to randomly sample agent starts from.",
+    )
+    possible_targets_xy: list[list[int]] | None = Field(
+        None, description="Pool of positions to randomly sample targets from.",
+    )
+    collision_system: Literal['block_both', 'priority', 'soft'] = Field(
+        'priority',
+        description="Collision resolution: 'priority' (higher index wins), "
+                    "'block_both' (both agents stay), 'soft' (vertex and edge collision avoidance).",
+    )
+    persistent: bool = Field(False, description="Deprecated. Use env.enable_animation() instead.")
+    observation_type: Literal['POMAPF', 'MAPF', 'default'] = Field(
+        'default',
+        description="Observation format: 'default' (3-channel array), "
+                    "'POMAPF' (dict with obstacles/agents/xy/target_xy), "
+                    "'MAPF' (POMAPF + global state).",
+    )
+    map: list[list[int]] | str | None = Field(
+        None,
+        description="Custom map as a 2D list of 0/1 (free/obstacle) or a string with special characters "
+                    "(. # @ $ ! a-z A-Z).",
+    )
+    map_name: str | None = Field(None, description="Name of a registered map from the grid registry.")
+    integration: Literal['SampleFactory', 'gymnasium', 'PettingZoo'] | None = Field(
+        None, description="Framework integration: None (raw multi-agent), 'gymnasium', 'PettingZoo', or 'SampleFactory'.",
+    )
+    max_episode_steps: int = Field(64, description="Maximum number of steps per episode before truncation.")
+    auto_reset: bool | None = Field(None, description="Auto-reset on episode end (SampleFactory only).")
 
     @model_validator(mode='before')
     @classmethod
@@ -42,10 +74,10 @@ def process_map_and_defaults(cls, data):
                 )
                 if agents_xy and targets_xy and data.get('agents_xy') is not None and data.get(
                         'targets_xy') is not None:
-                    raise KeyError("""Can't create task. Please provide agents_xy and targets_xy only once.
-                Either with parameters or with a map.""")
+                    raise ValueError("Can't create task. Please provide agents_xy and targets_xy only once: "
+                                     "either with parameters or with a map.")
                 if (agents_xy or targets_xy) and (possible_agents_xy or possible_targets_xy):
-                    raise KeyError("""Can't create task. Mark either possible locations or precise ones.""")
+                    raise ValueError("Can't create task. Mark either possible locations or precise ones.")
                 elif agents_xy and targets_xy:
                     data['agents_xy'] = agents_xy
                     data['targets_xy'] = targets_xy
@@ -109,12 +141,12 @@ def validate_dimensions_and_positions(self):
         self.height = height
         self.size = size
 
-        if not (1 <= width <= 4096):
-            raise ValueError(f"width must be in [1, 4096], got {width}")
-        if not (1 <= height <= 4096):
-            raise ValueError(f"height must be in [1, 4096], got {height}")
-        if not (2 <= size <= 4096):
-            raise ValueError(f"size must be in [2, 4096], got {size}")
+        if not (1 <= width <= 8_388_608):
+            raise ValueError(f"width must be in [1, 8_388_608], got {width}")
+        if not (1 <= height <= 8_388_608):
+            raise ValueError(f"height must be in [1, 8_388_608], got {height}")
+        if not (2 <= size <= 8_388_608):
+            raise ValueError(f"size must be in [2, 8_388_608], got {size}")
 
         # Validate positions
         agents_xy = self.agents_xy
@@ -136,16 +168,19 @@ def validate_dimensions_and_positions(self):
     @field_validator('seed')
     @classmethod
     def seed_initialization(cls, v):
-        assert v is None or (0 <= v < sys.maxsize), f"seed must be in [0, {sys.maxsize}]"
+        if v is not None and not (0 <= v < sys.maxsize):
+            raise ValueError(f"seed must be in [0, {sys.maxsize})")
         return v
 
     @staticmethod
     def _validate_dimension(v, field_name):
         if v is not None:
             if field_name == 'size':
-                assert 2 <= v <= 4096, f"{field_name} must be in [2, 4096]"
+                if not (2 <= v <= 8_388_608):
+                    raise ValueError(f"{field_name} must be in [2, 8_388_608]")
             else:
-                assert 1 <= v <= 4096, f"{field_name} must be in [1, 4096]"
+                if not (1 <= v <= 8_388_608):
+                    raise ValueError(f"{field_name} must be in [1, 8_388_608]")
         return v
 
     @field_validator('size')
@@ -166,7 +201,8 @@ def height_restrictions(cls, v):
     @field_validator('density')
     @classmethod
     def density_restrictions(cls, v):
-        assert 0.0 <= v <= 1, "density must be in [0, 1]"
+        if not (0.0 <= v <= 1):
+            raise ValueError("density must be in [0, 1]")
         return v
 
     @field_validator('agents_xy')
@@ -225,18 +261,20 @@ def check_positions(v, width, height):
             if not isinstance(x, int) or not isinstance(y, int):
                 raise ValueError("Position coordinates must be integers")
             if not (0 <= x < height and 0 <= y < width):
-                raise IndexError(f"Position is out of bounds! {position} is not in [{0}, {height}] x [{0}, {width}]")
+                raise IndexError(f"Position {position} is out of bounds: row must be in [0, {height}), col in [0, {width})")
 
     @field_validator('num_agents')
     @classmethod
     def num_agents_must_be_positive(cls, v):
-        assert 1 <= v <= 10000000, "num_agents must be in [1, 10000000]"
+        if not (1 <= v <= 10_000_000):
+            raise ValueError("num_agents must be in [1, 10_000_000]")
         return v
 
     @field_validator('obs_radius')
     @classmethod
     def obs_radius_must_be_positive(cls, v):
-        assert 1 <= v <= 128, "obs_radius must be in [1, 128]"
+        if not (1 <= v <= 128):
+            raise ValueError("obs_radius must be in [1, 128]")
         return v
 
     @field_validator('map')
@@ -285,16 +323,18 @@ def str_map_to_list(str_map, free, obstacle):
                     possible_agents_xy.append(position)
                     possible_targets_xy.append(position)
                 else:
-                    raise KeyError(f"Unsupported symbol '{char}' at line {row_idx}")
+                    raise ValueError(f"Unsupported symbol '{char}' at line {row_idx}")
 
             if row:
-                assert len(obstacles[-1]) == len(row) if obstacles else True, f"Wrong string size for row {row_idx};"
+                if obstacles and len(obstacles[-1]) != len(row):
+                    raise ValueError(f"Inconsistent row width at row {row_idx}: expected {len(obstacles[-1])}, got {len(row)}")
                 obstacles.append(row)
 
         agents_xy = [[x, y] for _, (x, y) in sorted(agents.items())]
         targets_xy = [[x, y] for _, (x, y) in sorted(targets.items())]
 
-        assert len(targets_xy) == len(agents_xy), "Mismatch in number of agents and targets."
+        if len(targets_xy) != len(agents_xy):
+            raise ValueError(f"Mismatch in number of agents ({len(agents_xy)}) and targets ({len(targets_xy)}) in map.")
 
         if not any(char in special_chars for char in str_map):
             possible_agents_xy, possible_targets_xy = None, None
diff --git a/pogema/integrations/make_pogema.py b/pogema/integrations/make_pogema.py
index a7d5fda..130cb72 100644
--- a/pogema/integrations/make_pogema.py
+++ b/pogema/integrations/make_pogema.py
@@ -23,7 +23,7 @@ def step(self, action):
         return observations[0], rewards[0], terminated[0], truncated[0], infos[0]
 
     def reset(self, seed: int | None = None, return_info: bool = True, options: dict | None = None, ):
-        observations, infos = self.env.reset()
+        observations, infos = self.env.reset(seed=seed, options=options)
         if return_info:
             return observations[0], infos[0]
         else:
@@ -42,7 +42,7 @@ def make_pogema(grid_config: GridConfig | dict = GridConfig(), *args, **kwargs)
         grid_config = GridConfig(**grid_config)
 
     if grid_config.integration != 'SampleFactory' and grid_config.auto_reset:
-        raise KeyError(f"{grid_config.integration} does not support auto_reset")
+        raise ValueError(f"auto_reset is only supported with integration='SampleFactory', got '{grid_config.integration}'")
 
     if grid_config.integration is None:
         return _make_pogema(grid_config)
@@ -53,7 +53,8 @@ def make_pogema(grid_config: GridConfig | dict = GridConfig(), *args, **kwargs)
     elif grid_config.integration == 'gymnasium':
         return make_single_agent_gym(grid_config)
 
-    raise KeyError(grid_config.integration)
+    raise ValueError(f"Unknown integration: '{grid_config.integration}'. "
+                     f"Must be 'SampleFactory', 'gymnasium', 'PettingZoo', or None.")
 
 
 pogema_v0 = make_pogema
diff --git a/pogema/integrations/pettingzoo.py b/pogema/integrations/pettingzoo.py
index 677469b..18532be 100644
--- a/pogema/integrations/pettingzoo.py
+++ b/pogema/integrations/pettingzoo.py
@@ -26,16 +26,19 @@ def __init__(self, grid_config: GridConfig, render_mode='ansi'):
 
     @functools.cache
     def observation_space(self, agent):
-        assert agent in self.possible_agents
+        if agent not in self.possible_agents:
+            raise ValueError(f"Unknown agent '{agent}'. Possible agents: {self.possible_agents}")
         return self.pogema.observation_space
 
     @functools.cache
     def action_space(self, agent):
-        assert agent in self.possible_agents
+        if agent not in self.possible_agents:
+            raise ValueError(f"Unknown agent '{agent}'. Possible agents: {self.possible_agents}")
         return self.pogema.action_space
 
     def render(self, mode="human"):
-        assert mode == 'human'
+        if mode != 'human':
+            raise ValueError(f"Unsupported render mode '{mode}'. Only 'human' is supported.")
         return self.pogema.render()
 
     def reset(self, seed=None, options=None):
diff --git a/pogema/wrappers/base.py b/pogema/wrappers/base.py
index 517f684..052c3f0 100644
--- a/pogema/wrappers/base.py
+++ b/pogema/wrappers/base.py
@@ -102,6 +102,16 @@ def render_animation(self, animation_config=None):
     def animation_is_active(self):
         return self.env.animation_is_active
 
+    def __repr__(self):
+        gc = self.grid_config
+        return (
+            f"{type(self.unwrapped).__name__}("
+            f"num_agents={gc.num_agents}, "
+            f"size={gc.width}x{gc.height}, "
+            f"on_target='{gc.on_target}', "
+            f"collision='{gc.collision_system}')"
+        )
+
     # -- Fallback for any remaining forwarded names --
 
     def __getattr__(self, name):
diff --git a/pogema/wrappers/metrics.py b/pogema/wrappers/metrics.py
index 453106d..b4b0e22 100644
--- a/pogema/wrappers/metrics.py
+++ b/pogema/wrappers/metrics.py
@@ -9,10 +9,19 @@ class AbstractMetric(PogemaWrapper):
     def _compute_stats(self, step, is_on_goal, finished):
         raise NotImplementedError
 
+    def _reset_stats(self):
+        pass
+
     def __init__(self, env):
         super().__init__(env)
         self._current_step = 0
 
+    def reset(self, **kwargs):
+        result = self.env.reset(**kwargs)
+        self._current_step = 0
+        self._reset_stats()
+        return result
+
     def step(self, action):
         obs, reward, terminated, truncated, infos = self.env.step(action)
         finished = all(truncated) or all(terminated)
@@ -36,6 +45,9 @@ def __init__(self, env):
         super().__init__(env)
         self._solved_instances = 0
 
+    def _reset_stats(self):
+        self._solved_instances = 0
+
     def _compute_stats(self, step, is_on_goal, finished):
         for _agent_idx, on_goal in enumerate(is_on_goal):
             if on_goal:
@@ -72,6 +84,9 @@ def __init__(self, env):
         super().__init__(env)
         self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
 
+    def _reset_stats(self):
+        self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
+
     def _compute_stats(self, step, is_on_goal, finished):
         for idx, on_goal in enumerate(is_on_goal):
             if self._solve_time[idx] is None:
@@ -89,6 +104,9 @@ def __init__(self, env):
         super().__init__(env)
         self._solved_instances = 0
 
+    def _reset_stats(self):
+        self._solved_instances = 0
+
     def _compute_stats(self, step, is_on_goal, finished):
         self._solved_instances += sum(is_on_goal)
         if finished:
@@ -102,6 +120,9 @@ def __init__(self, env):
         super().__init__(env)
         self._solved_instances = 0
 
+    def _reset_stats(self):
+        self._solved_instances = 0
+
     def _compute_stats(self, step, is_on_goal, finished):
         self._solved_instances += sum(is_on_goal)
         if finished:
@@ -115,6 +136,9 @@ def __init__(self, env):
         super().__init__(env)
         self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
 
+    def _reset_stats(self):
+        self._solve_time = [None for _ in range(self.unwrapped.get_num_agents())]
+
     def _compute_stats(self, step, is_on_goal, finished):
         for idx, on_goal in enumerate(is_on_goal):
             if self._solve_time[idx] is None and (on_goal or finished):
diff --git a/tests/test_grid.py b/tests/test_grid.py
index cab93ac..56390d7 100644
--- a/tests/test_grid.py
+++ b/tests/test_grid.py
@@ -51,10 +51,10 @@ def test_goals():
 
 
 def test_overflow():
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(seed=1, obs_radius=2, size=4, num_agents=100, density=0.0))
 
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(seed=1, obs_radius=2, size=4, num_agents=1, density=1.0))
 
 
@@ -71,7 +71,7 @@ def test_edge_cases():
     with pytest.raises(ValidationError):
         GridConfig(seed=1, obs_radius=2, size=4, num_agents=0, density=0.4)
 
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(seed=1, obs_radius=2, size=4, num_agents=1, density=1.0))
 
     with pytest.raises(ValidationError):
@@ -80,9 +80,9 @@ def test_edge_cases():
 
 def test_edge_cases_for_custom_map():
     test_map = [[0, 0, 0]]
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(seed=1, obs_radius=2, size=4, num_agents=2, map=test_map))
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(seed=2, obs_radius=2, size=4, num_agents=4, map=test_map))
 
 
@@ -143,7 +143,7 @@ def test_overflow_for_custom_map():
         [0, 1, 0, 1, 0],
         [0, 1, 0, 0, 1],
     ]
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(obs_radius=2, size=4, num_agents=5, density=0.3, map=test_map), num_retries=100)
 
 
@@ -199,7 +199,7 @@ def test_out_of_bounds_for_custom_positions():
 
 def test_duplicated_params():
     grid_map = "Aa"
-    with pytest.raises(KeyError):
+    with pytest.raises(ValueError):
         GridConfig(agents_xy=[[0, 0]], targets_xy=[[0, 0]], map=grid_map)
 
 
@@ -221,7 +221,7 @@ def test_custom_grid_with_specific_positions():
         !!!!!!!!!!!!!!!!!!
     """
     Grid(GridConfig(obs_radius=2, size=4, num_agents=24, map=grid_map))
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(obs_radius=2, size=4, num_agents=25, map=grid_map))
 
     grid_map = """
@@ -236,7 +236,7 @@ def test_custom_grid_with_specific_positions():
         !!!!!!!!!!!
     """
     Grid(GridConfig(obs_radius=2, num_agents=16, map=grid_map))
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(obs_radius=2, num_agents=17, map=grid_map))
 
     grid_map = """
@@ -246,7 +246,7 @@ def test_custom_grid_with_specific_positions():
             !@@!@@!.aB.
 
         """
-    with pytest.raises(KeyError):
+    with pytest.raises(ValueError):
         Grid(GridConfig(obs_radius=2, map=grid_map))
 
 
@@ -261,7 +261,7 @@ def test_restricted_grid():
     env = pogema_v0(grid_config=GridConfig(map=grid, num_agents=24, seed=0, obs_radius=2))
     env.reset()
 
-    with pytest.raises(OverflowError):
+    with pytest.raises(ValueError):
         env = pogema_v0(grid_config=GridConfig(map=grid, num_agents=25, seed=0, obs_radius=2))
         env.reset()
 
@@ -494,7 +494,7 @@ def test_goal_sequences_position_format():
             targets_xy=[[[2, 2, 3], [4, 4]]]
         )
 
-    with pytest.raises(ValueError, match="Position coordinates must be integers"):
+    with pytest.raises((ValueError, ValidationError)):
         GridConfig(
             width=8, height=8,
             agents_xy=[[0, 0]],

From 8e65b23c525dcf95ad26ddc259203e1352fde507 Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Mon, 2 Mar 2026 01:40:26 +0300
Subject: [PATCH 12/15] refactoring: remove remaining asserts, tidy wrappers and integrations

- Replace remaining asserts with proper exceptions
- Convert soft collision _revert_action from recursive to iterative
- Add SingleAgentWrapper multi-agent warning
- Remove AgentsDensityWrapper
- Fix PettingZoo render()/close() API
- Cache get_lifelong_targets_xy() (invalidate on reset)
- Add tests for A* policy, wrappers, and soft collisions
- Remove PyMARL reference from CLAUDE.md
- Document why connectivity check is not implemented

---
 pogema/__init__.py                  |  3 +--
 pogema/a_star_policy.py             |  3 ++-
 pogema/envs.py                      | 38 ++++++++++++++++++++---------
 pogema/grid_registry.py             |  3 ++-
 pogema/integrations/make_pogema.py  |  9 +++++++
 pogema/integrations/pettingzoo.py   |  6 ++---
 pogema/utils.py                     |  8 +++---
 pogema/wrappers/metrics.py          | 30 -----------------------
 pogema/wrappers/multi_time_limit.py |  3 ++-
 9 files changed, 50 insertions(+), 53 deletions(-)

diff --git a/pogema/__init__.py b/pogema/__init__.py
index 177bd3e..9488aaf 100644
--- a/pogema/__init__.py
+++ b/pogema/__init__.py
@@ -17,7 +17,6 @@
     NonDisappearEpLengthMetric,
     SumOfCostsAndMakespanMetric,
     LifeLongAverageThroughputMetric,
-    AgentsDensityWrapper,
     RuntimeMetricWrapper,
 )
 from pogema.wrappers.multi_time_limit import MultiTimeLimit
@@ -41,7 +40,7 @@
     'CSRMetric', 'ISRMetric', 'EpLengthMetric',
     'NonDisappearCSRMetric', 'NonDisappearISRMetric', 'NonDisappearEpLengthMetric',
     'SumOfCostsAndMakespanMetric', 'LifeLongAverageThroughputMetric',
-    'AgentsDensityWrapper', 'RuntimeMetricWrapper',
+    'RuntimeMetricWrapper',
 ]
 
 register(
diff --git a/pogema/a_star_policy.py b/pogema/a_star_policy.py
index 31ecb64..780e13d 100644
--- a/pogema/a_star_policy.py
+++ b/pogema/a_star_policy.py
@@ -24,7 +24,8 @@ def _increase_memory(self):
         m = self._memory
         r = self._memory.shape[0]
         self._memory = np.zeros(shape=(r * 2 + 1, r * 2 + 1))
-        assert self._try_to_insert(r, r, m, self._memory)
+        if not self._try_to_insert(r, r, m, self._memory):
+            raise RuntimeError("GridMemory invariant violation: failed to copy data into expanded memory")
 
     def update(self, x, y, obstacles):
         while True:
diff --git a/pogema/envs.py b/pogema/envs.py
index cd11847..72bf536 100644
--- a/pogema/envs.py
+++ b/pogema/envs.py
@@ -130,7 +130,9 @@ def __init__(self, grid_config=GridConfig(num_agents=2)):
             raise ValueError(f"Unknown observation type: {self.grid.config.observation_type}")
 
     def step(self, action: list):
-        assert len(action) == self.grid_config.num_agents
+        num_agents = self.grid_config.num_agents
+        if len(action) != num_agents:
+            raise ValueError(f"Expected {num_agents} actions, got {len(action)}")
         rewards = []
 
         terminated = []
@@ -219,14 +221,17 @@ def _get_infos(self):
         return infos
 
     def _revert_action(self, agent_idx, used_cells, cell, actions):
-        actions[agent_idx] = 0
-        used_cells[cell].remove(agent_idx)
-        new_cell = self.grid.positions_xy[agent_idx]
-        if new_cell in used_cells and len(used_cells[new_cell]) > 0:
-            used_cells[new_cell].append(agent_idx)
-            return self._revert_action(used_cells[new_cell][0], used_cells, new_cell, actions)
-        else:
-            used_cells.setdefault(new_cell, []).append(agent_idx)
+        while True:
+            actions[agent_idx] = 0
+            used_cells[cell].remove(agent_idx)
+            new_cell = self.grid.positions_xy[agent_idx]
+            if new_cell in used_cells and len(used_cells[new_cell]) > 0:
+                used_cells[new_cell].append(agent_idx)
+                agent_idx = used_cells[new_cell][0]
+                cell = new_cell
+            else:
+                used_cells.setdefault(new_cell, []).append(agent_idx)
+                break
         return actions, used_cells
 
     def move_agents(self, actions):
@@ -302,6 +307,7 @@ def __init__(self, grid_config=GridConfig(num_agents=2)):
         super().__init__(grid_config)
         self.current_goal_indices = [0] * grid_config.num_agents
         self.has_custom_sequences = grid_config.targets_xy is not None
+        self._lifelong_targets_cache: dict[bool, list] = {}
 
     def _initialize_grid(self):
         self.grid: GridLifeLong = GridLifeLong(grid_config=self.grid_config)
@@ -318,6 +324,9 @@ def get_lifelong_targets_xy(self, ignore_borders=False):
                 return [[[x + self.grid_config.obs_radius, y + self.grid_config.obs_radius] for x, y in sequence]
                         for sequence in self.grid_config.targets_xy]
 
+        if ignore_borders in self._lifelong_targets_cache:
+            return self._lifelong_targets_cache[ignore_borders]
+
         sequences = []
 
         main_rng = np.random.default_rng(self.grid_config.seed)
@@ -367,10 +376,13 @@ def get_lifelong_targets_xy(self, ignore_borders=False):
                 total_distance += abs(current_pos[0] - goal_coords[0]) + abs(current_pos[1] - goal_coords[1])
                 current_pos = goal_coords
             sequences.append(agent_sequence)
+
+        self._lifelong_targets_cache[ignore_borders] = sequences
         return sequences
 
     def reset(self, seed: int | None = None, return_info: bool = True, options: dict | None = None):
         self.current_goal_indices = [0] * self.grid_config.num_agents
+        self._lifelong_targets_cache = {}
         return super().reset(seed=seed, return_info=return_info, options=options)
 
     def _generate_new_target(self, agent_idx):
@@ -404,7 +416,9 @@ def _generate_new_target(self, agent_idx):
                                     self.grid.positions_xy[agent_idx])
 
     def step(self, action: list):
-        assert len(action) == self.grid_config.num_agents
+        num_agents = self.grid_config.num_agents
+        if len(action) != num_agents:
+            raise ValueError(f"Expected {num_agents} actions, got {len(action)}")
         rewards = []
 
         infos = [dict() for _ in range(self.grid_config.num_agents)]
@@ -442,7 +456,9 @@ def _initialize_grid(self):
         self.grid: Grid = Grid(grid_config=self.grid_config)
 
     def step(self, action: list):
-        assert len(action) == self.grid_config.num_agents
+        num_agents = self.grid_config.num_agents
+        if len(action) != num_agents:
+            raise ValueError(f"Expected {num_agents} actions, got {len(action)}")
 
         infos = [dict() for _ in range(self.grid_config.num_agents)]
 
diff --git a/pogema/grid_registry.py b/pogema/grid_registry.py
index a70cb82..f6ce9cb 100644
--- a/pogema/grid_registry.py
+++ b/pogema/grid_registry.py
@@ -41,7 +41,8 @@ def str_to_grid(self, grid_str):
                     raise KeyError(f"Unsupported symbol '{char}' at line {idx}")
             if row:
                 if obstacles:
-                    assert len(obstacles[-1]) == len(row), f"Wrong string size for row {idx};"
+                    if len(obstacles[-1]) != len(row):
+                        raise ValueError(f"Row {idx} has {len(row)} columns, expected {len(obstacles[-1])}")
                 obstacles.append(row)
         return obstacles, agents, targets
 
diff --git a/pogema/integrations/make_pogema.py b/pogema/integrations/make_pogema.py
index 130cb72..1e3af2b 100644
--- a/pogema/integrations/make_pogema.py
+++ b/pogema/integrations/make_pogema.py
@@ -1,3 +1,4 @@
+import warnings
 
 from pogema import GridConfig
 from pogema.envs import _make_pogema
@@ -31,6 +32,14 @@ def reset(self, seed: int | None = None, return_info: bool = True, options: dict
 
 
 def make_single_agent_gym(grid_config: GridConfig | dict = GridConfig()):
+    if grid_config.num_agents > 1:
+        warnings.warn(
+            f"SingleAgentWrapper is wrapping an environment with {grid_config.num_agents} agents. "
+            f"Only agent 0 will be controlled; agents 1-{grid_config.num_agents - 1} will take random actions. "
+            f"Use integration=None or integration='PettingZoo' for multi-agent control.",
+            UserWarning,
+            stacklevel=2,
+        )
     env = _make_pogema(grid_config)
     env = SingleAgentWrapper(env)
 
diff --git a/pogema/integrations/pettingzoo.py b/pogema/integrations/pettingzoo.py
index 18532be..5486085 100644
--- a/pogema/integrations/pettingzoo.py
+++ b/pogema/integrations/pettingzoo.py
@@ -36,9 +36,7 @@ def action_space(self, agent):
             raise ValueError(f"Unknown agent '{agent}'. Possible agents: {self.possible_agents}")
         return self.pogema.action_space
 
-    def render(self, mode="human"):
-        if mode != 'human':
-            raise ValueError(f"Unsupported render mode '{mode}'. Only 'human' is supported.")
+    def render(self):
         return self.pogema.render()
 
     def reset(self, seed=None, options=None):
@@ -72,4 +70,4 @@ def unwrapped(self):
         return self
 
     def close(self):
-        pass
+        self.pogema.close()
diff --git a/pogema/utils.py b/pogema/utils.py
index 3a5d8fd..1c41e80 100644
--- a/pogema/utils.py
+++ b/pogema/utils.py
@@ -31,12 +31,14 @@ def check_grid(obstacles, agents_xy, targets_xy):
     for start_xy, finish_xy in zip(agents_xy, targets_xy):
         s_x, s_y = start_xy
         if obstacles[s_x, s_y]:
-            raise KeyError(f'Cell is {s_x, s_y} occupied by obstacle.')
+            raise ValueError(f'Cell ({s_x}, {s_y}) is occupied by an obstacle.')
         f_x, f_y = finish_xy
         if obstacles[f_x, f_y]:
-            raise KeyError(f'Cell is {f_x, f_y} occupied by obstacle.')
+            raise ValueError(f'Cell ({f_x}, {f_y}) is occupied by an obstacle.')
 
-    # todo check connectivity of starts and finishes
+    # Connectivity check not implemented: GridLifeLong already warns on unreachable
+    # targets, and adding a mandatory check to Grid would be a breaking change for
+    # users who intentionally place agents/targets in disconnected components.
 
 
 def render_grid(obstacles, positions_xy=None, targets_xy=None, is_active=None, mode='human'):
diff --git a/pogema/wrappers/metrics.py b/pogema/wrappers/metrics.py
index b4b0e22..aae5e88 100644
--- a/pogema/wrappers/metrics.py
+++ b/pogema/wrappers/metrics.py
@@ -1,7 +1,5 @@
 import time
 
-import numpy as np
-
 from pogema.wrappers.base import PogemaWrapper
 
 
@@ -152,34 +150,6 @@ def _compute_stats(self, step, is_on_goal, finished):
             return result
 
 
-class AgentsDensityWrapper(PogemaWrapper):
-    def __init__(self, env):
-        super().__init__(env)
-        self._avg_agents_density = None
-
-    def count_agents(self, observations):
-        avg_agents_density = []
-        for obs in observations:
-            traversable_cells = np.size(obs['obstacles']) - np.count_nonzero(obs['obstacles'])
-            avg_agents_density.append(np.count_nonzero(obs['agents']) / traversable_cells)
-        self._avg_agents_density.append(np.mean(avg_agents_density))
-
-    def step(self, actions):
-        observations, rewards, terminated, truncated, infos = self.env.step(actions)
-        self.count_agents(observations)
-        if all(terminated) or all(truncated):
-            if 'metrics' not in infos[0]:
-                infos[0]['metrics'] = {}
-            infos[0]['metrics'].update(avg_agents_density=float(np.mean(self._avg_agents_density)))
-        return observations, rewards, terminated, truncated, infos
-
-    def reset(self, **kwargs):
-        self._avg_agents_density = []
-        observations, info = self.env.reset(**kwargs)
-        self.count_agents(observations)
-        return observations, info
-
-
 class RuntimeMetricWrapper(PogemaWrapper):
     def __init__(self, env):
         super().__init__(env)
diff --git a/pogema/wrappers/multi_time_limit.py b/pogema/wrappers/multi_time_limit.py
index 2e2e2a1..f6ccbcb 100644
--- a/pogema/wrappers/multi_time_limit.py
+++ b/pogema/wrappers/multi_time_limit.py
@@ -19,5 +19,6 @@ def reset(self, **kwargs):
         return self.env.reset(**kwargs)
 
     def set_elapsed_steps(self, elapsed_steps: int) -> None:
-        assert elapsed_steps >= 0
+        if elapsed_steps < 0:
+            raise ValueError(f"elapsed_steps must be non-negative, got {elapsed_steps}")
         self._elapsed_steps = elapsed_steps

From eb1c77c590d0c1ead3ec83119cd29ef6faa4c545 Mon Sep 17 00:00:00 2001
From: tviskaron <tviskaron@gmail.com>
Date: Sun, 29 Mar 2026 22:46:53 +0300
Subject: [PATCH 13/15] updated README.md with temporary GitHub installation and
 more tests

---
 README.md                   |   9 +-
 tests/test_a_star_policy.py | 142 ++++++++++++++++++++++++
 tests/test_wrappers.py      | 209 ++++++++++++++++++++++++++++++++++++
 3 files changed, 358 insertions(+), 2 deletions(-)
 create mode 100644 tests/test_a_star_policy.py
 create mode 100644 tests/test_wrappers.py

diff --git a/README.md b/README.md
index f3ecc05..7a97236 100644
--- a/README.md
+++ b/README.md
@@ -7,6 +7,7 @@
 
 
 [![Downloads](https://static.pepy.tech/badge/pogema)](https://pepy.tech/project/pogema)
+[![Paper](https://img.shields.io/badge/Paper-ICLR%202025-1f4b99?logo=openreview&logoColor=white)](https://openreview.net/forum?id=6VgwE2tCRm)
 [![CI](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/CI.yml/badge.svg?branch=main)](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/CI.yml)
 [![CodeQL](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/codeql-analysis.yml/badge.svg)](https://github.com/Cognitive-AI-Systems/pogema/actions/workflows/codeql-analysis.yml) 
     
@@ -18,9 +19,13 @@ POGEMA stands for Partially-Observable Grid Environment for Multiple Agents. It
 
 ## Installation
 
-Just install from PyPI:
+For now, install directly from GitHub:
 
-```pip install pogema```
+```bash
+pip install git+https://github.com/Cognitive-AI-Systems/pogema.git
+```
+
+This is a temporary installation option while we are working on Pogema 2.0. The current PyPI package still contains the older version. Once Pogema 2.0 is fully ready, it will also be published on PyPI with a simpler installation command.
 
 ## Using Example
 
diff --git a/tests/test_a_star_policy.py b/tests/test_a_star_policy.py
new file mode 100644
index 0000000..22c5858
--- /dev/null
+++ b/tests/test_a_star_policy.py
@@ -0,0 +1,142 @@
+import numpy as np
+import pytest
+
+from pogema import AStarAgent, BatchAStarAgent, GridConfig, pogema_v0
+
+
+def test_astar_agent_basic_pathfinding():
+    """AStarAgent should reach the target on a simple open map."""
+    gc = GridConfig(
+        map="....\n....\n....\n....",
+        agents_xy=[[0, 0]],
+        targets_xy=[[3, 3]],
+        observation_type='POMAPF',
+        on_target='finish',
+        max_episode_steps=64,
+    )
+    env = pogema_v0(gc)
+    obs, info = env.reset()
+
+    agent = AStarAgent()
+    for _ in range(64):
+        action = agent.act(obs[0])
+        obs, rewards, terminated, truncated, infos = env.step([action])
+        if all(terminated) or all(truncated):
+            break
+
+    assert rewards[0] == 1.0
+
+
+def test_astar_agent_clear_state():
+    """clear_state() should allow reuse across episodes without error."""
+    gc = GridConfig(
+        map="....\n....\n....\n....",
+        agents_xy=[[0, 0]],
+        targets_xy=[[1, 1]],
+        observation_type='POMAPF',
+        on_target='finish',
+        max_episode_steps=64,
+    )
+    env = pogema_v0(gc)
+
+    agent = AStarAgent()
+
+    for _episode in range(3):
+        obs, info = env.reset()
+        agent.clear_state()
+        for _ in range(64):
+            action = agent.act(obs[0])
+            obs, rewards, terminated, truncated, infos = env.step([action])
+            if all(terminated) or all(truncated):
+                break
+
+
+def test_astar_agent_detects_teleport():
+    """AStarAgent should raise if the agent teleports between calls."""
+    gc = GridConfig(
+        map="......\n......\n......\n......\n......\n......",
+        agents_xy=[[0, 0], [5, 5]],
+        targets_xy=[[5, 5], [0, 0]],
+        observation_type='POMAPF',
+        on_target='finish',
+        max_episode_steps=64,
+    )
+    env = pogema_v0(gc)
+    obs, _ = env.reset()
+
+    agent = AStarAgent()
+    # Move agent 0 a few steps to build up distance from origin
+    for _ in range(3):
+        action = agent.act(obs[0])
+        obs, _, terminated, truncated, _ = env.step([action, 0])
+        if all(terminated) or all(truncated):
+            break
+
+    # Feed agent 1's observation (at relative (0,0)) — agent 0 has moved ~3 steps away
+    with pytest.raises(IndexError, match="moved more than 1 step"):
+        agent.act(obs[1])
+
+
+def test_batch_astar_agent():
+    """BatchAStarAgent should handle multiple agents and reach targets."""
+    gc = GridConfig(
+        map="......\n......\n......\n......\n......\n......",
+        agents_xy=[[0, 0], [0, 5]],
+        targets_xy=[[5, 5], [5, 0]],
+        observation_type='POMAPF',
+        on_target='finish',
+        max_episode_steps=128,
+    )
+    env = pogema_v0(gc)
+    obs, _ = env.reset()
+
+    batch_agent = BatchAStarAgent()
+    solved = False
+    for _ in range(128):
+        actions = batch_agent.act(obs)
+        obs, rewards, terminated, truncated, infos = env.step(actions)
+        if all(terminated) or all(truncated):
+            solved = any(r > 0 for r in rewards)
+            break
+
+    assert solved
+
+
+def test_batch_astar_agent_reset_states():
+    """reset_states() should clear all agent state."""
+    batch_agent = BatchAStarAgent()
+
+    gc = GridConfig(
+        map="....\n....\n....\n....",
+        agents_xy=[[0, 0]],
+        targets_xy=[[1, 1]],
+        observation_type='POMAPF',
+        on_target='finish',
+        max_episode_steps=64,
+    )
+    env = pogema_v0(gc)
+
+    for _episode in range(2):
+        obs, _ = env.reset()
+        batch_agent.reset_states()
+        assert len(batch_agent.astar_agents) == 0
+        for _ in range(64):
+            actions = batch_agent.act(obs)
+            obs, rewards, terminated, truncated, infos = env.step(actions)
+            if all(terminated) or all(truncated):
+                break
+
+
+def test_grid_memory_expansion():
+    """GridMemory should expand when updating with distant coordinates."""
+    from pogema.a_star_policy import GridMemory
+
+    gm = GridMemory(start_r=2)
+    obstacles = np.zeros((5, 5), dtype=bool)
+    # Update at the origin — should fit in initial memory
+    gm.update(0, 0, obstacles)
+    assert not gm.is_obstacle(0, 0)
+
+    # Update far from center — should trigger expansion
+    gm.update(100, 100, obstacles)
+    assert not gm.is_obstacle(100, 100)
diff --git a/tests/test_wrappers.py b/tests/test_wrappers.py
new file mode 100644
index 0000000..1ae76a8
--- /dev/null
+++ b/tests/test_wrappers.py
@@ -0,0 +1,209 @@
+import pytest
+
+from pogema import GridConfig, RuntimeMetricWrapper, pogema_v0
+
+# ---------------------------------------------------------------------------
+# MultiTimeLimit
+# ---------------------------------------------------------------------------
+
+def test_multi_time_limit_truncates_at_exact_step():
+    """Episode should truncate at exactly max_episode_steps."""
+    max_steps = 16
+    gc = GridConfig(num_agents=2, size=8, seed=42, max_episode_steps=max_steps)
+    env = pogema_v0(gc)
+    env.reset()
+
+    for step in range(max_steps):
+        obs, rewards, terminated, truncated, infos = env.step(
+            [0] * gc.num_agents  # noop — agents won't reach goals
+        )
+        if step < max_steps - 1:
+            assert not all(truncated), f"Truncated too early at step {step}"
+    assert all(truncated), "Should be truncated at max_episode_steps"
+
+
+def test_multi_time_limit_set_elapsed_steps():
+    """set_elapsed_steps() should advance the internal counter."""
+    gc = GridConfig(num_agents=1, size=6, seed=42, max_episode_steps=10)
+    env = pogema_v0(gc)
+    env.reset()
+
+    # Jump to step 9
+    env.set_elapsed_steps(9)
+    _, _, _, truncated, _ = env.step([0])
+    assert all(truncated)
+
+
+def test_multi_time_limit_set_negative_raises():
+    gc = GridConfig(num_agents=1, size=6, seed=42, max_episode_steps=10)
+    env = pogema_v0(gc)
+    env.reset()
+    with pytest.raises(ValueError, match="non-negative"):
+        env.set_elapsed_steps(-1)
+
+
+def test_multi_time_limit_reset_clears():
+    """reset() should clear elapsed steps."""
+    gc = GridConfig(num_agents=1, size=6, seed=42, max_episode_steps=10)
+    env = pogema_v0(gc)
+    env.reset()
+
+    for _ in range(5):
+        env.step([0])
+
+    env.reset()
+    # After reset, we should be able to take max_episode_steps again
+    for step in range(10):
+        _, _, _, truncated, _ = env.step([0])
+        if step < 9:
+            assert not all(truncated)
+    assert all(truncated)
+
+
+# ---------------------------------------------------------------------------
+# SumOfCostsAndMakespanMetric
+# ---------------------------------------------------------------------------
+
+def test_sum_of_costs_and_makespan_known_scenario():
+    """With known map and seed, SoC and makespan should have expected values."""
+    gc = GridConfig(
+        map="......\n......\n......\n......\n......\n......",
+        agents_xy=[[0, 0], [0, 1]],
+        targets_xy=[[0, 1], [0, 0]],
+        on_target='nothing',
+        max_episode_steps=64,
+        collision_system='priority',
+    )
+    env = pogema_v0(gc)
+    env.reset()
+
+    # Manually solve: swap positions
+    # Agent 0 moves right (to [0,1]), Agent 1 moves left (to [0,0])
+    # With priority collision, higher-index agent wins — so agent 1 moves first
+    # Both should reach goals
+    for _ in range(64):
+        obs, rewards, terminated, truncated, infos = env.step([4, 3])  # right, left
+        if all(terminated) or all(truncated):
+            break
+
+    assert 'metrics' in infos[0]
+    assert 'SoC' in infos[0]['metrics']
+    assert 'makespan' in infos[0]['metrics']
+    assert infos[0]['metrics']['SoC'] >= 2  # At minimum 2 (one step each)
+    assert infos[0]['metrics']['makespan'] >= 1
+
+
+def test_sum_of_costs_truncated():
+    """When episode truncates, SoC/makespan should still be reported."""
+    gc = GridConfig(
+        num_agents=2, size=8, seed=42, on_target='nothing', max_episode_steps=8
+    )
+    env = pogema_v0(gc)
+    env.reset()
+
+    for _ in range(8):
+        obs, rewards, terminated, truncated, infos = env.step([0, 0])
+        if all(truncated):
+            break
+
+    assert 'metrics' in infos[0]
+    assert 'SoC' in infos[0]['metrics']
+
+
+# ---------------------------------------------------------------------------
+# RuntimeMetricWrapper
+# ---------------------------------------------------------------------------
+
+def test_runtime_metric_wrapper():
+    """RuntimeMetricWrapper should add a positive 'runtime' to metrics."""
+    gc = GridConfig(num_agents=2, size=6, seed=42, max_episode_steps=16)
+    env = pogema_v0(gc)
+    env = RuntimeMetricWrapper(env)
+    env.reset()
+
+    for _ in range(16):
+        obs, rewards, terminated, truncated, infos = env.step(
+            env.unwrapped.sample_actions()
+        )
+        if all(terminated) or all(truncated):
+            break
+
+    assert 'metrics' in infos[0]
+    assert 'runtime' in infos[0]['metrics']
+    assert infos[0]['metrics']['runtime'] >= 0.0
+
+
+def test_runtime_metric_reset_clears():
+    """RuntimeMetricWrapper should reset timing on env.reset()."""
+    gc = GridConfig(num_agents=2, size=6, seed=42, max_episode_steps=8)
+    env = pogema_v0(gc)
+    env = RuntimeMetricWrapper(env)
+
+    for _episode in range(2):
+        env.reset()
+        for _ in range(8):
+            obs, rewards, terminated, truncated, infos = env.step(
+                env.unwrapped.sample_actions()
+            )
+            if all(terminated) or all(truncated):
+                break
+        assert 'metrics' in infos[0]
+        assert 'runtime' in infos[0]['metrics']
+
+
+# ---------------------------------------------------------------------------
+# Soft collision edge cases
+# ---------------------------------------------------------------------------
+
+def test_soft_collision_no_crash():
+    """Soft collision system should not crash with many agents in tight space."""
+    gc = GridConfig(
+        num_agents=32, size=16, density=0.1, seed=42,
+        collision_system='soft', max_episode_steps=100,
+    )
+    env = pogema_v0(gc)
+    env.reset()
+    for _ in range(100):
+        actions = env.unwrapped.sample_actions()
+        env.step(actions.tolist())
+
+
+def test_soft_collision_cascading_revert():
+    """Soft collision cascading reverts should not error or cause inconsistency."""
+    gc = GridConfig(
+        num_agents=8, size=8, density=0.0, seed=7,
+        collision_system='soft', max_episode_steps=50,
+    )
+    env = pogema_v0(gc)
+    env.reset()
+    for _ in range(50):
+        # All agents try to move in same direction → forces collision resolution
+        actions = [1] * gc.num_agents
+        obs, rewards, terminated, truncated, infos = env.step(actions)
+        if all(terminated) or all(truncated):
+            break
+
+
+def test_soft_collision_edge_swap():
+    """Two agents trying to swap positions should both be reverted in soft mode."""
+    gc = GridConfig(
+        map="....\n....\n....\n....",
+        agents_xy=[[1, 1], [1, 2]],
+        targets_xy=[[1, 2], [1, 1]],
+        collision_system='soft',
+        on_target='nothing',
+        max_episode_steps=4,
+    )
+    env = pogema_v0(gc)
+    env.reset()
+
+    agents_before = [tuple(pos) for pos in env.unwrapped.get_agents_xy(ignore_borders=True)]
+
+    # Agent 0 moves right, Agent 1 moves left — edge collision
+    env.step([4, 3])
+
+    agents_after = [tuple(pos) for pos in env.unwrapped.get_agents_xy(ignore_borders=True)]
+    # Both should stay in place due to edge collision
+    assert agents_before == agents_after, (
+        f"Edge swap should be reverted: before={agents_before}, after={agents_after}"
+    )

From ad0d5932108fa1dab4711171dbffd9da3f631b2b Mon Sep 17 00:00:00 2001
From: Alexey Skrynnik <Tviskaron@gmail.com>
Date: Sun, 29 Mar 2026 23:08:13 +0300
Subject: [PATCH 14/15] docs and preparations for Pogema 2.0 (#47)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* Migrate to gymnasium >= 1.0 and modernize build tooling

- Use `env.unwrapped` for pogema-specific attributes (gymnasium >= 1.0 removed Wrapper.__getattr__ forwarding)
- Replace flake8 with ruff, migrate CI to uv
- Remove stale setup.py, requirements.txt, build.sh
- Misc pyproject.toml cleanup (numpy bound, classifiers, requires-python)

* - migrated to newer version of checks in pydantic
- fixed ruff checks

* Improvements:
- Removed PyMARL stuff
- Add PogemaWrapper base class with explicit method forwarding (using base.py)
- AnimationWrapper - enable/disable/save API, zero-overhead when inactive
- Soft collision_system by default
- Trimming for terminal render

* hotfix

* hotfix

* fix for animation.py and tests

* Removing CodeFactor

* update codeql

* ruff "W", "I", "UP", "B" flags, and corresponding fixes, plus fixed seeding in reset

* minor fix for version history

* refactoring:
- Replace assert with raise ValueError in all validators (safe under python -O)
- Fix SingleAgentWrapper.reset() silently dropping seed parameter
- Fix wrong exception types: KeyError/OverflowError → ValueError across codebase
- Add reset() to metric wrappers to clear stale state on mid-episode reset
- Fix ActionsSampler seed not updating on reset(seed=...)
- Improve error messages (typos, unclear bounds notation, missing guidance)
- Add Field(description=...) and parameterized type hints to all GridConfig fields
- Add __repr__ to PogemaWrapper showing config summary
- Export missing public classes in __all__ (metrics, MultiTimeLimit, register_grid, etc.)
- Raise dimension limit from 4096 to 8,388,608 (2^23)
- Fix old-style type hint (int, int) → tuple[int, int] in a_star_policy.py

* refactoring
- Replace remaining asserts with proper exceptions
  - Convert soft collision _revert_action from recursive to iterative
  - Add SingleAgentWrapper multi-agent warning
  - Remove AgentsDensityWrapper
  - Fix PettingZoo render()/close() API
  - Cache get_lifelong_targets_xy() (invalidate on reset)
  - Add tests for A* policy, wrappers, and soft collisions
  - Remove PyMARL reference from CLAUDE.md
  - Document why connectivity check is not implemented

* updated README.md with temporary GitHub installation and more tests

* add docs

* building docs action

* hotfix for Config value 'theme'
---
 docs/editor.html | 1776 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 1776 insertions(+)
 create mode 100644 docs/editor.html

diff --git a/docs/editor.html b/docs/editor.html
new file mode 100644
index 0000000..b021145
--- /dev/null
+++ b/docs/editor.html
@@ -0,0 +1,1776 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<meta name="viewport" content="width=device-width, initial-scale=1.0">
+<title>Pogema Editor</title>
+<script>
+  // Apply theme before first paint: sessionStorage overrides URL param
+  (function() {
+    var saved = sessionStorage.getItem('pogema-editor-theme');
+    var isNight = saved ? saved === 'night' : new URLSearchParams(window.location.search).get('theme') === 'slate';
+    if (isNight) document.documentElement.classList.add('night');
+  })();
+</script>
+<style>
+  :root {
+    --move-dur: 0.12s;
+    --grid-line-color: #84a1ae;
+    --grid-obstacle-color: #84a1ae;
+  }
+  * { margin: 0; padding: 0; box-sizing: border-box; }
+  body {
+    font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif;
+    display: flex;
+    height: 100vh;
+    overflow: hidden;
+    background: var(--bg);
+    color: var(--fg);
+    transition: background 0.4s, color 0.4s;
+  }
+  #grid-container {
+    flex: 1;
+    display: flex;
+    align-items: center;
+    justify-content: center;
+    overflow: auto;
+    padding: 24px;
+    background: var(--bg);
+  }
+  svg { overflow: visible; }
+  svg text { pointer-events: none; user-select: none; }
+  .grid-line {
+    stroke: var(--grid-line-color);
+    stroke-width: 10;
+    pointer-events: none;
+    transition: stroke 0.4s;
+  }
+  .obstacle {
+    fill: var(--grid-obstacle-color);
+    transition: fill 0.4s;
+  }
+  .cell-hit { fill: transparent; }
+  .agent-circle { cursor: grab; transition: cx var(--move-dur) linear, cy var(--move-dur) linear, r 0.15s ease; }
+  .target-circle { fill: none; stroke-width: 10; }
+  .dragging { cursor: grabbing !important; opacity: 0.72; }
+  .agent-circle, .target-circle, .target-hit { transition: cx var(--move-dur) linear, cy var(--move-dur) linear; }
+  .agent-label {
+    font-size: 28px;
+    font-weight: bold;
+    fill: #fff;
+    text-anchor: middle;
+    dominant-baseline: central;
+    transition: x var(--move-dur) linear, y var(--move-dur) linear;
+  }
+  .selected-ring,
+  .target-select-ring {
+    fill: none;
+    stroke: var(--card-selected);
+    stroke-width: 8;
+    stroke-dasharray: 20 8;
+    pointer-events: none;
+    transition: cx var(--move-dur) linear, cy var(--move-dur) linear;
+    animation: dash-spin 1s linear infinite;
+  }
+  .selected-ring.active-focus,
+  .target-select-ring.active-focus {
+    stroke-width: 10;
+    stroke-dasharray: none;
+    animation: none;
+  }
+  @keyframes dash-spin { to { stroke-dashoffset: -56; } }
+
+  #left-panel,
+  #panel {
+    width: 280px;
+    padding: 18px;
+    overflow-y: auto;
+    display: flex;
+    flex-direction: column;
+    gap: 14px;
+    background: var(--panel-bg);
+    border-color: var(--panel-border);
+    color: var(--fg);
+    transition: background 0.4s, border-color 0.4s, color 0.4s;
+  }
+  #left-panel { border-right: 2px solid var(--panel-border); }
+  #panel { border-left: 2px solid var(--panel-border); }
+
+  .panel-section {
+    display: flex;
+    flex-direction: column;
+    gap: 10px;
+    padding-top: 12px;
+    border-top: 1px solid var(--section-border);
+  }
+  .panel-section:first-child { padding-top: 0; border-top: none; }
+  .panel-section.tight { gap: 8px; }
+
+  .section-head {
+    display: flex;
+    align-items: center;
+    justify-content: space-between;
+    gap: 10px;
+  }
+  h2 {
+    font-size: 16px;
+    color: #e94560;
+    margin: 0;
+  }
+  .panel-title {
+    font-size: 14px;
+    font-weight: bold;
+  }
+  .agent-title-group {
+    display: flex;
+    align-items: baseline;
+    gap: 8px;
+  }
+  .agent-count {
+    font-size: 12px;
+    opacity: 0.72;
+  }
+  .panel-note {
+    font-size: 11px;
+    opacity: 0.72;
+    text-align: right;
+  }
+
+  .gen-row input[type=number] {
+    width: 100%;
+    padding: 7px 8px;
+    border-radius: 6px;
+    border: 1px solid var(--input-border);
+    font-size: 12px;
+    text-align: center;
+    background: var(--input-bg);
+    color: var(--fg);
+  }
+
+  .chip-row,
+  .action-row {
+    display: flex;
+    flex-wrap: wrap;
+    gap: 8px;
+  }
+  .size-chip,
+  .panel-btn,
+  .tool-btn,
+  #theme-toggle,
+  #add-agent,
+  .agent-icon-btn {
+    border: 2px solid var(--btn-border);
+    border-radius: 8px;
+    background: none;
+    color: inherit;
+    cursor: pointer;
+    transition: background 0.2s, color 0.2s, border-color 0.2s, opacity 0.2s;
+  }
+  .size-chip,
+  .tool-btn {
+    padding: 7px 10px;
+    font-size: 12px;
+    font-weight: 700;
+  }
+  .size-chip { min-width: 58px; }
+  .tool-btn { flex: 1 1 46%; }
+  .panel-btn {
+    width: 100%;
+    padding: 9px 12px;
+    font-size: 13px;
+    font-weight: bold;
+  }
+  .size-chip:hover:not(:disabled),
+  .panel-btn:hover:not(:disabled),
+  .tool-btn:hover:not(:disabled),
+  #theme-toggle:hover,
+  #add-agent:hover:not(:disabled),
+  .agent-icon-btn:hover:not(:disabled) {
+    border-color: var(--btn-hover);
+    background: var(--btn-hover-bg);
+  }
+  button:disabled { opacity: 0.38; cursor: default; }
+
+  .gen-row {
+    display: flex;
+    align-items: center;
+    gap: 8px;
+    overflow: hidden;
+  }
+  .gen-row label {
+    font-size: 12px;
+    font-weight: bold;
+    min-width: 56px;
+    white-space: nowrap;
+  }
+  .gen-row input[type=range] { flex: 1; min-width: 0; accent-color: var(--accent-range); }
+  .gen-row input[type=number] { width: 66px; }
+
+  .stats-grid {
+    display: grid;
+    grid-template-columns: repeat(2, minmax(0, 1fr));
+    gap: 8px;
+  }
+  .resize-pad {
+    display: grid;
+    grid-template-columns: repeat(3, minmax(0, 1fr));
+    gap: 8px;
+    align-items: stretch;
+    padding: 0;
+    border: none;
+    border-radius: 0;
+  }
+  .resize-pad .tool-btn {
+    min-height: 44px;
+    width: 100%;
+    padding: 7px 8px;
+    font-size: 18px;
+    line-height: 1;
+  }
+  .resize-mode-toggle {
+    font-size: 22px !important;
+    font-weight: 800;
+    transition: none;
+  }
+  .stat-card {
+    border-radius: 8px;
+    padding: 9px 10px;
+    display: flex;
+    flex-direction: column;
+    gap: 3px;
+    background: var(--stat-bg);
+    border: 1px solid var(--stat-border);
+  }
+  .stat-label {
+    font-size: 11px;
+    opacity: 0.72;
+    text-transform: uppercase;
+    letter-spacing: 0.04em;
+  }
+  .stat-value {
+    font-size: 14px;
+    font-weight: 700;
+  }
+  #agent-list {
+    display: flex;
+    flex-direction: column;
+    gap: 8px;
+  }
+  .agent-card {
+    border-radius: 10px;
+    padding: 12px 14px;
+    cursor: pointer;
+    display: flex;
+    align-items: center;
+    gap: 10px;
+    background: var(--card-bg);
+    box-shadow: var(--card-shadow);
+    border: 2px solid transparent;
+    transition: border-color 0.15s, background 0.4s, box-shadow 0.4s;
+  }
+  .agent-card.selected { border-color: var(--card-selected); }
+  .agent-card:hover { border-color: var(--card-hover); }
+  .agent-inspector {
+    flex-direction: column;
+    align-items: stretch;
+    gap: 12px;
+    cursor: default;
+  }
+  .agent-inspector:hover { border-color: transparent; }
+  .agent-inspector-head {
+    display: flex;
+    align-items: center;
+    gap: 10px;
+  }
+  .agent-inspector-info {
+    display: flex;
+    align-items: center;
+    gap: 10px;
+    min-width: 0;
+  }
+  .agent-inspector-title {
+    font-size: 14px;
+    font-weight: 700;
+  }
+  .agent-inspector-meta {
+    font-size: 12px;
+    opacity: 0.72;
+  }
+  .agent-header-actions {
+    display: flex;
+    align-items: center;
+    gap: 6px;
+  }
+  .agent-inspector-grid {
+    display: grid;
+    grid-template-columns: auto 1fr;
+    gap: 6px 10px;
+    align-items: baseline;
+    font-size: 13px;
+  }
+  .agent-inspector-grid strong {
+    font-size: 11px;
+    letter-spacing: 0.04em;
+    opacity: 0.72;
+    text-transform: uppercase;
+  }
+  .agent-dot-wrapper {
+    position: relative;
+    width: 28px;
+    height: 28px;
+    flex-shrink: 0;
+  }
+  .agent-dot {
+    width: 28px;
+    height: 28px;
+    border-radius: 50%;
+    box-shadow: 0 2px 6px rgba(0,0,0,0.2);
+    cursor: pointer;
+  }
+  .agent-color-input {
+    position: absolute;
+    inset: 0;
+    opacity: 0;
+    width: 100%;
+    height: 100%;
+    cursor: pointer;
+    border: none;
+    padding: 0;
+  }
+  .mode-toggle {
+    display: flex;
+    align-items: center;
+    gap: 6px;
+  }
+  .mode-icon {
+    cursor: pointer;
+    transition: opacity 0.15s;
+  }
+  .mode-icon:hover { opacity: 0.8 !important; }
+  .agent-info {
+    font-size: 13px;
+    line-height: 1.45;
+  }
+  .agent-info strong { font-size: 14px; }
+
+  #theme-toggle {
+    padding: 6px 12px;
+    font-size: 14px;
+    font-weight: bold;
+  }
+  #add-agent,
+  .agent-icon-btn {
+    width: 32px;
+    height: 32px;
+    padding: 0;
+    line-height: 1;
+    font-size: 20px;
+    display: inline-flex;
+    align-items: center;
+    justify-content: center;
+  }
+
+  #instructions,
+  #workflow-instructions {
+    font-size: 12px;
+    color: var(--instructions-color);
+    line-height: 1.55;
+  }
+  #instructions kbd {
+    padding: 1px 5px;
+    border-radius: 3px;
+    font-family: monospace;
+    background: var(--kbd-bg);
+    color: var(--fg);
+    transition: background 0.4s;
+  }
+
+  body.day {
+    --bg: #ffffff;
+    --fg: #222;
+    --panel-bg: #f7f8fa;
+    --panel-border: #d8d1c7;
+    --section-border: #d8d1c7;
+    --btn-border: #c7d1d7;
+    --btn-hover: #ffd700;
+    --btn-hover-bg: rgba(255, 215, 0, 0.12);
+    --card-bg: #fff;
+    --card-shadow: 0 1px 4px rgba(0,0,0,0.07);
+    --stat-bg: #f7f8fa;
+    --stat-border: #d8d1c7;
+    --input-border: #c9c1b6;
+    --input-bg: #fff;
+    --kbd-bg: #d8ddd9;
+    --status-bg: #eef1f3;
+    --grid-line-color: #84a1ae;
+    --grid-obstacle-color: #84a1ae;
+    --accent-range: #e94560;
+    --card-selected: #ffd700;
+    --card-hover: #e94560;
+    --instructions-color: #888;
+  }
+  body.day .stat-card .stat-label { opacity: 0.9; }
+
+  html.night body,
+  body.night {
+    --bg: #202028;
+    --fg: #f2f2f2;
+    --panel-bg: #262730;
+    --panel-border: #3c5360;
+    --section-border: #344754;
+    --btn-border: #4a6474;
+    --btn-hover: #FFD700;
+    --btn-hover-bg: rgba(255, 215, 0, 0.1);
+    --card-bg: #2c3340;
+    --card-shadow: 0 1px 5px rgba(0,0,0,0.25);
+    --stat-bg: #2a3038;
+    --stat-border: transparent;
+    --input-border: #4a6474;
+    --input-bg: #232831;
+    --kbd-bg: #2a3038;
+    --status-bg: #262d36;
+    --grid-line-color: #4d839a;
+    --grid-obstacle-color: #4d839a;
+    --accent-range: #d63066;
+    --card-selected: #FFD700;
+    --card-hover: #d63066;
+    --instructions-color: #b8ced9;
+  }
+
+  @media (max-width: 1200px) {
+    #left-panel,
+    #panel { width: 250px; }
+  }
+
+  @media (max-width: 980px) {
+    body {
+      flex-direction: column;
+      height: auto;
+      min-height: 100vh;
+      overflow: auto;
+    }
+    #left-panel,
+    #panel {
+      width: 100%;
+      border: none; /* also resets border-color, so the dividers below restate it */
+    }
+    #left-panel { border-bottom: 2px solid var(--panel-border); }
+    #panel { border-top: 2px solid var(--panel-border); }
+    #grid-container {
+      min-height: 55vh;
+      order: 2;
+    }
+  }
+</style>
+</head>
+<body>
+<div id="left-panel">
+  <div class="panel-section">
+    <div class="section-head">
+      <h2>Map Size</h2>
+    </div>
+    <div class="resize-pad" id="resize-controls">
+      <button class="tool-btn" data-resize-direction="top-left" title="Resize top-left corner">↖</button>
+      <button class="tool-btn" data-resize-direction="top" title="Resize top edge">↑</button>
+      <button class="tool-btn" data-resize-direction="top-right" title="Resize top-right corner">↗</button>
+      <button class="tool-btn" data-resize-direction="left" title="Resize left edge">←</button>
+      <button id="resize-mode-toggle" class="tool-btn resize-mode-toggle" title="Toggle grow or shrink mode">+</button>
+      <button class="tool-btn" data-resize-direction="right" title="Resize right edge">→</button>
+      <button class="tool-btn" data-resize-direction="bottom-left" title="Resize bottom-left corner">↙</button>
+      <button class="tool-btn" data-resize-direction="bottom" title="Resize bottom edge">↓</button>
+      <button class="tool-btn" data-resize-direction="bottom-right" title="Resize bottom-right corner">↘</button>
+    </div>
+  </div>
+
+  <div class="panel-section">
+    <div class="section-head">
+      <h2>Quick Sizes</h2>
+    </div>
+    <div class="chip-row" id="size-presets">
+      <button class="size-chip" data-rows="8" data-cols="8">8×8</button>
+      <button class="size-chip" data-rows="16" data-cols="16">16×16</button>
+      <button class="size-chip" data-rows="32" data-cols="32">32×32</button>
+      <!-- <button class="size-chip" data-rows="64" data-cols="64">64×64</button> -->
+    </div>
+  </div>
+
+  <div class="panel-section">
+    <div class="section-head">
+      <h2>Obstacles</h2>
+    </div>
+    <div class="action-row">
+      <button id="btn-clear-obstacles" class="tool-btn">Clear</button>
+      <button id="btn-randomize" class="tool-btn">Randomize</button>
+    </div>
+    <div class="gen-row">
+      <label>Density</label>
+      <input type="range" id="density-slider" min="0" max="70" value="18">
+      <input type="number" id="density-input" min="0" max="70" value="18">
+    </div>
+    <div class="stats-grid">
+      <div class="stat-card">
+        <span class="stat-label">Size</span>
+        <span class="stat-value" id="stat-size">16×16</span>
+      </div>
+      <div class="stat-card">
+        <span class="stat-label">Obstacles</span>
+        <span class="stat-value" id="stat-obstacles">0</span>
+      </div>
+      <div class="stat-card">
+        <span class="stat-label">Free Cells</span>
+        <span class="stat-value" id="stat-free">256</span>
+      </div>
+      <div class="stat-card">
+        <span class="stat-label">Obstacle %</span>
+        <span class="stat-value" id="stat-density">0.0%</span>
+      </div>
+    </div>
+  </div>
+
+  <div class="panel-section">
+    <div id="workflow-instructions">
+      <strong>Workflow</strong><br>
+      Set map size, randomize or clear obstacles, edit them, generate agents and targets, then copy the Pogema snippet.
+    </div>
+  </div>
+
+</div>
+
+<div id="grid-container"></div>
+
+<div id="panel">
+  <div class="section-head">
+    <h2>Pogema Editor</h2>
+    <button id="theme-toggle" title="Toggle theme">&#9790;</button>
+  </div>
+  <div class="section-head">
+    <div class="agent-title-group">
+      <span class="panel-title">Agents</span>
+      <span id="agent-count" class="agent-count">0</span>
+    </div>
+    <div class="agent-header-actions">
+      <button id="remove-agent" class="agent-icon-btn remove" title="Remove selected agent">&#8722;</button>
+      <button id="add-agent" title="Add agent">+</button>
+      <button id="toggle-numbering" class="agent-icon-btn" title="Toggle agent numbering">#</button>
+      <button id="toggle-selection" class="agent-icon-btn" title="Toggle selection rings">&#9675;</button>
+    </div>
+  </div>
+  <div id="agent-list"></div>
+  <div id="instructions">
+    <strong>Controls</strong><br>
+    <kbd>Tab</kbd> / <kbd>Shift+Tab</kbd> — cycle agents<br>
+    <kbd>Space</kbd> — toggle agent / target<br>
+    <kbd>0</kbd>-<kbd>9</kbd> — select agent by ID<br>
+    <kbd>+</kbd> / <kbd>-</kbd> — add / remove agent<br>
+    <kbd>Arrows</kbd> / <kbd>HJKL</kbd> — move<br>
+    <kbd>Drag</kbd> agents or targets with the mouse
+  </div>
+  <div class="panel-section tight">
+    <h2>Generate agents</h2>
+    <div class="gen-row">
+      <label>Agents</label>
+      <input type="range" id="agent-count-slider" min="1" max="16" value="8">
+      <input type="number" id="agent-count-input" min="1" max="16" value="8">
+    </div>
+    <button id="btn-generate" class="panel-btn primary">Generate Agents &amp; Targets</button>
+  </div>
+
+  <div class="panel-section tight">
+    <button id="copy-pogema" class="panel-btn accent">&#128203; Copy Pogema Snippet</button>
+    <button id="download-svg" class="panel-btn">&#10515; Download SVG</button>
+  </div>
+</div>
+
+<datalist id="agent-colors">
+  <option>#c1433c</option>
+  <option>#2e6f9e</option>
+  <option>#6e81af</option>
+  <option>#00b9c8</option>
+  <option>#72d5c8</option>
+  <option>#0ea08c</option>
+  <option>#8f7b66</option>
+</datalist>
+
+<script>
+(function() {
+  const CELL = 100; // side length of one grid cell, in SVG user units
+  const RADIUS = 35; // radius of the agent and target circles
+  const CORNER = 15; // rx/ry corner rounding of obstacle rectangles
+  const COLORS = ['#c1433c', '#2e6f9e', '#6e81af', '#00b9c8', '#72d5c8', '#0ea08c', '#8f7b66']; // same values as the #agent-colors datalist
+  const DIR = { up: [-1, 0], down: [1, 0], left: [0, -1], right: [0, 1] }; // presumably [row delta, col delta] per direction — consumer not visible here
+  const RESIZE_GLYPHS = { // arrow glyph per resize direction, one table per resize mode
+    add: { // same arrows as the initial text of the #resize-controls buttons
+      'top-left': '↖',
+      top: '↑',
+      'top-right': '↗',
+      left: '←',
+      right: '→',
+      'bottom-left': '↙',
+      bottom: '↓',
+      'bottom-right': '↘'
+    },
+    remove: { // each arrow is the opposite of its add-mode counterpart
+      'top-left': '↘',
+      top: '↓',
+      'top-right': '↙',
+      left: '→',
+      right: '←',
+      'bottom-left': '↗',
+      bottom: '↑',
+      'bottom-right': '↖'
+    }
+  };
+  const RESIZE_ACTIONS = { // keyed '<mode>-<direction>'; rowsDelta/colsDelta are the change in grid size
+    'add-top': { rowsDelta: 1, colsDelta: 0, rowOffset: 1, colOffset: 0 }, // rowOffset/colOffset are non-zero only on the top/left side — presumably the shift applied to existing content; consumer not visible here
+    'remove-top': { rowsDelta: -1, colsDelta: 0, rowOffset: -1, colOffset: 0 },
+    'add-bottom': { rowsDelta: 1, colsDelta: 0, rowOffset: 0, colOffset: 0 },
+    'remove-bottom': { rowsDelta: -1, colsDelta: 0, rowOffset: 0, colOffset: 0 },
+    'add-left': { rowsDelta: 0, colsDelta: 1, rowOffset: 0, colOffset: 1 },
+    'remove-left': { rowsDelta: 0, colsDelta: -1, rowOffset: 0, colOffset: -1 },
+    'add-right': { rowsDelta: 0, colsDelta: 1, rowOffset: 0, colOffset: 0 },
+    'remove-right': { rowsDelta: 0, colsDelta: -1, rowOffset: 0, colOffset: 0 },
+    'add-top-left': { rowsDelta: 1, colsDelta: 1, rowOffset: 1, colOffset: 1 }, // corner actions change both dimensions at once
+    'remove-top-left': { rowsDelta: -1, colsDelta: -1, rowOffset: -1, colOffset: -1 },
+    'add-top-right': { rowsDelta: 1, colsDelta: 1, rowOffset: 1, colOffset: 0 },
+    'remove-top-right': { rowsDelta: -1, colsDelta: -1, rowOffset: -1, colOffset: 0 },
+    'add-bottom-left': { rowsDelta: 1, colsDelta: 1, rowOffset: 0, colOffset: 1 },
+    'remove-bottom-left': { rowsDelta: -1, colsDelta: -1, rowOffset: 0, colOffset: -1 },
+    'add-bottom-right': { rowsDelta: 1, colsDelta: 1, rowOffset: 0, colOffset: 0 },
+    'remove-bottom-right': { rowsDelta: -1, colsDelta: -1, rowOffset: 0, colOffset: 0 }
+  };
+  const PAD = CELL / 2; // margin between the SVG origin and the first grid cell (half a cell)
+  const NS = 'http://www.w3.org/2000/svg'; // SVG namespace passed to createElementNS
+  const MOVE_INTERVAL = 120; // presumably milliseconds, matching --move-dur: 0.12s in the stylesheet — consumer not visible here
+  const MAX_DIMENSION = 64; // presumably the largest allowed ROWS/COLS — enforcement not visible here
+  const MIN_DIMENSION = 2; // presumably the smallest allowed ROWS/COLS — enforcement not visible here
+
+  let ROWS = 16; // current grid height in cells
+  let COLS = 16; // current grid width in cells
+  const obstacles = new Set(); // obstacle cells stored as "row,col" strings (see key())
+  const agents = []; // agent records: id, row/col, targetRow/targetCol, color, plus their SVG element references
+  let selectedAgent = null; // id of the selected agent, compared against agent.id
+  let selectionMode = 'agent'; // presumably 'agent' or 'target', the modes passed to selectAgent — TODO confirm
+  let nextAgentId = 0;
+  let svg; // root <svg>; rebuilt by buildSVG()
+  let obsGroup; // the five <g> layers below are (re)assigned in buildSVG()
+  let targetHitGroup;
+  let targetGroup;
+  let agentGroup;
+  let labelGroup;
+  let resizeMode = 'add'; // presumably 'add' or 'remove', the two RESIZE_GLYPHS keys — TODO confirm
+  let paintSession = null; // NOTE(review): usage not visible in this part of the file
+  const obsElements = {}; // "row,col" key -> obstacle <rect> currently in obsGroup
+
+  const gridContainer = document.getElementById('grid-container'); // host element the <svg> is appended to
+  const densitySlider = document.getElementById('density-slider');
+  const densityInput = document.getElementById('density-input');
+  const sizePresetButtons = [...document.querySelectorAll('#size-presets .size-chip')]; // spread into real arrays
+  const resizeButtons = [...document.querySelectorAll('#resize-controls [data-resize-direction]')]; // excludes the centre mode toggle, which has no data-resize-direction
+  const resizeModeToggle = document.getElementById('resize-mode-toggle');
+
+  const statSize = document.getElementById('stat-size'); // read-outs inside the stat cards
+  const statObstacles = document.getElementById('stat-obstacles');
+  const statFree = document.getElementById('stat-free');
+  const statDensity = document.getElementById('stat-density');
+
+  const agentCountEl = document.getElementById('agent-count');
+  const agentListEl = document.getElementById('agent-list');
+  const agentCountSlider = document.getElementById('agent-count-slider');
+  const agentCountInput = document.getElementById('agent-count-input');
+  const generateBtn = document.getElementById('btn-generate');
+  const addAgentBtn = document.getElementById('add-agent');
+  const removeAgentBtn = document.getElementById('remove-agent');
+  const toggleNumberingBtn = document.getElementById('toggle-numbering');
+  const toggleSelectionBtn = document.getElementById('toggle-selection');
+  let showNumbering = true; // whether agent labels are displayed (read in selectAgent)
+  let showSelection = true; // presumably whether selection rings are displayed — usage not visible here
+  const copyBtn = document.getElementById('copy-pogema');
+  const downloadSvgBtn = document.getElementById('download-svg');
+  const randomizeBtn = document.getElementById('btn-randomize');
+  const clearObstaclesBtn = document.getElementById('btn-clear-obstacles');
+  const toggleBtn = document.getElementById('theme-toggle');
+
+  function key(r, c) { return r + ',' + c; }
+  function cxPos(c) { const cellLeft = PAD + c * CELL; return cellLeft + CELL / 2; } // x of the centre of column c
+  function cyPos(r) { const cellTop = PAD + r * CELL; return cellTop + CELL / 2; } // y of the centre of row r
+  function clamp(value, min, max) { return Math.max(min, Math.min(max, value)); }
+
+  function clampCountInput(input, min, max, fallback) {
+    let value = parseInt(input.value, 10);
+    if (Number.isNaN(value)) value = fallback;
+    value = clamp(value, min, max);
+    input.value = value;
+    return value;
+  }
+
+  function createSeededRandom(seed) {
+    let t = seed >>> 0;
+    return function() {
+      t += 0x6d2b79f5;
+      let v = Math.imul(t ^ (t >>> 15), t | 1);
+      v ^= v + Math.imul(v ^ (v >>> 7), v | 61);
+      return ((v ^ (v >>> 14)) >>> 0) / 4294967296;
+    };
+  }
+
+  function shuffleInPlace(items, rng) {
+    for (let i = items.length - 1; i > 0; i--) {
+      const j = Math.floor(rng() * (i + 1));
+      [items[i], items[j]] = [items[j], items[i]];
+    }
+    return items;
+  }
+
+  function bindRangeNumberInput(range, input, getBounds, fallback) {
+    range.addEventListener('input', () => {
+      input.value = range.value;
+    });
+    input.addEventListener('change', () => {
+      const { min, max } = getBounds();
+      const value = clampCountInput(input, min, max, fallback);
+      range.value = value;
+    });
+  }
+
+  function forEachCell(rows, cols, visit) {
+    for (let r = 0; r < rows; r++) {
+      for (let c = 0; c < cols; c++) visit(r, c);
+    }
+  }
+
+  function getMapArray() {
+    const rows = [];
+    forEachCell(ROWS, COLS, (r, c) => {
+      if (!rows[r]) rows[r] = '';
+      rows[r] += obstacles.has(key(r, c)) ? '#' : '.';
+    });
+    return rows;
+  }
+
+  function getObstacleCoords() {
+    return [...obstacles].map((item) => item.split(',').map(Number));
+  }
+
+  function getFreeCellCount() {
+    return ROWS * COLS - obstacles.size;
+  }
+
+  function cellHasAgent(r, c, excludeId) {
+    return agents.some((agent) => agent.id !== excludeId && agent.row === r && agent.col === c);
+  }
+
+  function cellHasTarget(r, c, excludeId) {
+    return agents.some((agent) => agent.id !== excludeId && agent.targetRow === r && agent.targetCol === c);
+  }
+
+  function randomFreeCell(extraTaken) {
+    const taken = new Set(extraTaken || []);
+    agents.forEach((agent) => taken.add(key(agent.row, agent.col)));
+    const free = [];
+    forEachCell(ROWS, COLS, (r, c) => {
+      const cellKey = key(r, c);
+      if (!obstacles.has(cellKey) && !taken.has(cellKey)) free.push([r, c]);
+    });
+    if (!free.length) return null;
+    return free[Math.floor(Math.random() * free.length)];
+  }
+
+  function buildSVG() { // (re)creates the whole <svg> from ROWS, COLS, obstacles and agents
+    if (svg) svg.remove(); // drop the previous drawing, if any
+
+    const stroke = 10; // same value as the .grid-line stroke-width in the stylesheet
+    const svgW = COLS * CELL + CELL; // grid width plus PAD (= CELL / 2) on both sides
+    const svgH = ROWS * CELL + CELL;
+    const vbX = -stroke / 2; // viewBox grows by half a stroke per side — presumably so edge strokes are not clipped
+    const vbY = -stroke / 2;
+    const vbW = svgW + stroke;
+    const vbH = svgH + stroke;
+
+    svg = document.createElementNS(NS, 'svg');
+    svg.setAttribute('width', vbW);
+    svg.setAttribute('height', vbH);
+    svg.setAttribute('viewBox', `${vbX} ${vbY} ${vbW} ${vbH}`);
+    svg.style.maxWidth = '100%'; // may shrink to fit the container
+    svg.style.maxHeight = '100%';
+    gridContainer.appendChild(svg);
+
+    const bgGroup = document.createElementNS(NS, 'g'); // bottom layer: one transparent .cell-hit rect per cell
+    svg.appendChild(bgGroup);
+    forEachCell(ROWS, COLS, (r, c) => {
+      const rect = document.createElementNS(NS, 'rect');
+      rect.setAttribute('x', PAD + c * CELL);
+      rect.setAttribute('y', PAD + r * CELL);
+      rect.setAttribute('width', CELL);
+      rect.setAttribute('height', CELL);
+      rect.classList.add('cell-hit');
+      bindCellInteractions(rect, r, c);
+      bgGroup.appendChild(rect);
+    });
+
+    const lineGroup = document.createElementNS(NS, 'g');
+    svg.appendChild(lineGroup);
+    for (let r = 0; r <= ROWS; r++) { // ROWS + 1 horizontal lines, spanning the full padded width
+      const line = document.createElementNS(NS, 'line');
+      const y = PAD + r * CELL;
+      line.setAttribute('x1', 0);
+      line.setAttribute('y1', y);
+      line.setAttribute('x2', svgW);
+      line.setAttribute('y2', y);
+      line.classList.add('grid-line');
+      lineGroup.appendChild(line);
+    }
+    for (let c = 0; c <= COLS; c++) { // COLS + 1 vertical lines, spanning the full padded height
+      const line = document.createElementNS(NS, 'line');
+      const x = PAD + c * CELL;
+      line.setAttribute('x1', x);
+      line.setAttribute('y1', 0);
+      line.setAttribute('x2', x);
+      line.setAttribute('y2', svgH);
+      line.classList.add('grid-line');
+      lineGroup.appendChild(line);
+    }
+
+    obsGroup = document.createElementNS(NS, 'g');
+    targetHitGroup = document.createElementNS(NS, 'g');
+    agentGroup = document.createElementNS(NS, 'g');
+    targetGroup = document.createElementNS(NS, 'g');
+    labelGroup = document.createElementNS(NS, 'g');
+    svg.appendChild(obsGroup); // append order is paint order: later groups draw on top
+    svg.appendChild(targetHitGroup);
+    svg.appendChild(agentGroup);
+    svg.appendChild(targetGroup);
+    svg.appendChild(labelGroup);
+
+    Object.keys(obsElements).forEach((entryKey) => delete obsElements[entryKey]); // old rects went away with the old svg
+    obstacles.forEach((entryKey) => {
+      const [r, c] = entryKey.split(',').map(Number);
+      drawObstacle(r, c);
+    });
+
+    agents.forEach((agent) => { // recreate every agent's elements in the new groups and position them
+      createAgentElements(agent);
+      setAgentVisualPosition(agent);
+      setTargetVisualPosition(agent);
+    });
+  }
+
+  function bindCellInteractions(element, r, c) {
+    element.addEventListener('mousedown', (event) => onCellPointerDown(r, c, event));
+    element.addEventListener('mouseenter', () => onCellPointerEnter(r, c));
+    element.addEventListener('dragstart', (event) => event.preventDefault());
+  }
+
+  function moveAgentPart(agent, mode, row, col, dr, dc) { // moves the agent (mode 'agent') or otherwise its target to a cell; returns true when the move happened
+    if (dr !== undefined && dc !== undefined) { // directional move: scan from (row, col) along (dr, dc) for the first usable cell
+      let r = row, c = col;
+      let found = false;
+      while (r >= 0 && r < ROWS && c >= 0 && c < COLS) {
+        if (!obstacles.has(key(r, c)) && !(mode === 'agent' && cellHasAgent(r, c, agent.id))) {
+          row = r; col = c; found = true; break;
+        }
+        r += dr; c += dc; // NOTE(review): dr === 0 && dc === 0 on a blocked cell would never leave this loop — confirm callers
+      }
+      if (!found) return false; // walked off the grid without finding a usable cell
+    }
+    if (row < 0 || row >= ROWS || col < 0 || col >= COLS) return false;
+    if (obstacles.has(key(row, col))) return false;
+    if (mode === 'agent' && cellHasAgent(row, col, agent.id)) return false; // only agents are checked for sharing a cell; targets are not
+
+    if (mode === 'agent') {
+      agent.row = row;
+      agent.col = col;
+      updateAgentPos(agent);
+    } else {
+      agent.targetRow = row;
+      agent.targetCol = col;
+      updateTargetPos(agent);
+    }
+    return true;
+  }
+
+  function drawObstacle(r, c) {
+    const itemKey = key(r, c);
+    if (obsElements[itemKey]) return;
+    const obstacleInset = 15;
+    const obstacleSize = CELL - obstacleInset * 2;
+    const rect = document.createElementNS(NS, 'rect');
+    rect.classList.add('obstacle');
+    rect.setAttribute('x', PAD + c * CELL + obstacleInset);
+    rect.setAttribute('y', PAD + r * CELL + obstacleInset);
+    rect.setAttribute('width', obstacleSize);
+    rect.setAttribute('height', obstacleSize);
+    rect.setAttribute('rx', CORNER);
+    rect.setAttribute('ry', CORNER);
+    bindCellInteractions(rect, r, c);
+    obsGroup.appendChild(rect);
+    obsElements[itemKey] = rect;
+  }
+
+  function removeObsEl(r, c) {
+    const itemKey = key(r, c);
+    if (obsElements[itemKey]) {
+      obsElements[itemKey].remove();
+      delete obsElements[itemKey];
+    }
+  }
+
+  function createAgentElements(agent, targetHitMount = targetHitGroup, targetMount = targetGroup, agentMount = agentGroup, labelMount = labelGroup) { // builds the six SVG elements of one agent and stores them on the agent record
+    const targetSelect = document.createElementNS(NS, 'circle'); // selection ring around the target, hidden until selected
+    targetSelect.setAttribute('r', RADIUS + 10);
+    targetSelect.classList.add('target-select-ring');
+    targetSelect.style.display = 'none';
+    targetHitMount.appendChild(targetSelect);
+    agent.targetSelectEl = targetSelect;
+
+    const targetHit = document.createElementNS(NS, 'circle'); // invisible circle that receives the target's mouse events
+    targetHit.setAttribute('r', RADIUS + 10);
+    targetHit.setAttribute('fill', 'transparent');
+    targetHit.setAttribute('stroke', 'transparent');
+    targetHit.setAttribute('stroke-width', '10');
+    targetHit.style.cursor = 'grab';
+    targetHit.addEventListener('click', (event) => {
+      event.stopPropagation();
+      selectAgent(agent.id, 'target');
+    });
+    targetHit.addEventListener('mousedown', (event) => {
+      event.stopPropagation();
+      startDrag(event, agent, 'target');
+    });
+    targetHitMount.appendChild(targetHit);
+    agent.targetHitEl = targetHit;
+
+    const targetCircle = document.createElementNS(NS, 'circle'); // visible target ring, stroked in the agent's colour
+    targetCircle.setAttribute('r', RADIUS);
+    targetCircle.setAttribute('stroke', agent.color);
+    targetCircle.classList.add('target-circle');
+    targetCircle.style.pointerEvents = 'none'; // mouse events are left to targetHit
+    targetMount.appendChild(targetCircle);
+    agent.targetEl = targetCircle;
+
+    const selectCircle = document.createElementNS(NS, 'circle'); // selection ring around the agent, hidden until selected
+    selectCircle.setAttribute('r', RADIUS + 8);
+    selectCircle.classList.add('selected-ring');
+    selectCircle.style.display = 'none';
+    agentMount.appendChild(selectCircle);
+    agent.selectEl = selectCircle;
+
+    const agentCircle = document.createElementNS(NS, 'circle'); // filled agent body; handles its own click and drag
+    agentCircle.setAttribute('r', RADIUS);
+    agentCircle.setAttribute('fill', agent.color);
+    agentCircle.classList.add('agent-circle');
+    agentCircle.addEventListener('click', (event) => {
+      event.stopPropagation();
+      selectAgent(agent.id, 'agent');
+    });
+    agentCircle.addEventListener('mousedown', (event) => {
+      event.stopPropagation();
+      startDrag(event, agent, 'agent');
+    });
+    agentMount.appendChild(agentCircle);
+    agent.circleEl = agentCircle;
+
+    const label = document.createElementNS(NS, 'text'); // agent id text; the stylesheet disables pointer events on svg text
+    label.classList.add('agent-label');
+    label.textContent = agent.id;
+    labelMount.appendChild(label);
+    agent.labelEl = label;
+  }
+
+  function removeAgentElements(agent) {
+    [agent.circleEl, agent.labelEl, agent.targetEl, agent.targetHitEl, agent.selectEl, agent.targetSelectEl]
+      .forEach((element) => { if (element) element.remove(); });
+  }
+
+  function setAgentVisualPosition(agent) {
+    const x = cxPos(agent.col);
+    const y = cyPos(agent.row);
+    agent.circleEl.setAttribute('cx', x);
+    agent.circleEl.setAttribute('cy', y);
+    agent.labelEl.setAttribute('x', x);
+    agent.labelEl.setAttribute('y', y);
+    agent.selectEl.setAttribute('cx', x);
+    agent.selectEl.setAttribute('cy', y);
+  }
+
+  function updateAgentPos(agent, syncPanel = true) {
+    setAgentVisualPosition(agent);
+    if (syncPanel) updatePanel();
+  }
+
+  function setTargetVisualPosition(agent) {
+    const x = cxPos(agent.targetCol);
+    const y = cyPos(agent.targetRow);
+    agent.targetEl.setAttribute('cx', x);
+    agent.targetEl.setAttribute('cy', y);
+    agent.targetSelectEl.setAttribute('cx', x);
+    agent.targetSelectEl.setAttribute('cy', y);
+    agent.targetHitEl.setAttribute('cx', x);
+    agent.targetHitEl.setAttribute('cy', y);
+  }
+
+  function updateTargetPos(agent, syncPanel = true) {
+    setTargetVisualPosition(agent);
+    if (syncPanel) updatePanel();
+  }
+
+  function startDrag(event, agent, mode) { // starts a mouse drag of the agent (mode 'agent') or otherwise its target; ends on mouseup
+    event.preventDefault();
+    selectAgent(agent.id, mode);
+    const element = mode === 'agent' ? agent.circleEl : agent.targetEl; // element that gets the .dragging class
+    element.classList.add('dragging');
+
+    let lastR = mode === 'agent' ? agent.row : agent.targetRow; // last cell the dragged part was moved to
+    let lastC = mode === 'agent' ? agent.col : agent.targetCol;
+
+    function svgCoords(evt) { // maps a mouse event to the nearest grid cell, clamped to the grid
+      const rect = svg.getBoundingClientRect();
+      const vb = svg.viewBox.baseVal;
+      const svgAspect = vb.width / vb.height;
+      const boxAspect = rect.width / rect.height;
+      let scale, offsetX, offsetY;
+      if (boxAspect > svgAspect) { // box is wider than the viewBox: height sets the scale, content centred horizontally
+        scale = rect.height / vb.height;
+        offsetX = (rect.width - vb.width * scale) / 2;
+        offsetY = 0;
+      } else { // otherwise width sets the scale, content centred vertically
+        scale = rect.width / vb.width;
+        offsetX = 0;
+        offsetY = (rect.height - vb.height * scale) / 2;
+      }
+      const x = (evt.clientX - rect.left - offsetX) / scale + vb.x; // client pixels -> viewBox units
+      const y = (evt.clientY - rect.top - offsetY) / scale + vb.y;
+      const c = Math.round((x - PAD - CELL / 2) / CELL); // inverse of cxPos, rounded to the nearest cell centre
+      const r = Math.round((y - PAD - CELL / 2) / CELL); // inverse of cyPos
+      return { r: clamp(r, 0, ROWS - 1), c: clamp(c, 0, COLS - 1) };
+    }
+
+    function onMove(evt) {
+      const { r, c } = svgCoords(evt);
+      if (r === lastR && c === lastC) return; // still over the same cell
+      if (!moveAgentPart(agent, mode, r, c)) return; // rejected move: keep the last accepted cell
+      lastR = r;
+      lastC = c;
+    }
+
+    function onUp() { // end of drag: restore styling and detach the window listeners
+      element.classList.remove('dragging');
+      window.removeEventListener('mousemove', onMove);
+      window.removeEventListener('mouseup', onUp);
+    }
+
+    window.addEventListener('mousemove', onMove); // listen on window so the drag continues outside the svg
+    window.addEventListener('mouseup', onUp);
+  }
+
+  function selectAgent(id, mode, syncPanel = true) {
+    const previous = agents.find((agent) => agent.id === selectedAgent);
+    if (previous) {
+      previous.selectEl.style.display = 'none';
+      previous.targetSelectEl.style.display = 'none';
+      previous.labelEl.style.display = showNumbering ? '' : 'none';
+      previous.selectEl.classList.remove('active-focus');
+      previous.targetSelectEl.classList.remove('active-focus');
+    }
+
+    selectedAgent = id;
+    if (mode) selectionMode = mode;
+
+    const current = agents.find((agent) => agent.id === id);
+    if (current) {
+      current.selectEl.style.display = showSelection ? '' : 'none';
+      current.targetSelectEl.style.display = showSelection ? '' : 'none';
+      current.labelEl.style.display = 'none';
+      applyFocusRing(current);
+    }
+
+    if (syncPanel) updatePanel();
+  }
+
+  function applyFocusRing(agent) {
+    agent.selectEl.classList.toggle('active-focus', selectionMode === 'agent');
+    agent.targetSelectEl.classList.toggle('active-focus', selectionMode === 'target');
+  }
+
+  function onCellPointerDown(r, c, event) {
+    if (event.button !== 0) return;
+    event.preventDefault();
+    paintSession = { visited: new Set() };
+    applyToolAtCell(r, c, paintSession);
+  }
+
+  function onCellPointerEnter(r, c) {
+    if (!paintSession) return;
+    applyToolAtCell(r, c, paintSession);
+  }
+
+  function applyToolAtCell(r, c, session) {
+    const itemKey = key(r, c);
+    if (session.visited.has(itemKey)) return;
+    session.visited.add(itemKey);
+
+    if (obstacles.has(itemKey)) gridAPI.removeObstacle(r, c);
+    else gridAPI.addObstacle(r, c);
+  }
+
+  window.addEventListener('mouseup', () => {
+    if (!paintSession) return;
+    paintSession = null;
+  });
+
+  function updatePanel() { // Rebuild the side-panel card for the selected agent (or a placeholder when there are none).
+    agentListEl.innerHTML = ''; // drop whatever card was rendered before
+    agentCountEl.textContent = String(agents.length);
+    if (!agents.length) { // no agents: disable removal and show a placeholder card
+      removeAgentBtn.disabled = true;
+      const emptyCard = document.createElement('div');
+      emptyCard.className = 'agent-card';
+      emptyCard.innerHTML = '<div class="agent-info"><strong>No agents yet</strong><br>Use the add button or local generate.</div>';
+      emptyCard.style.cursor = 'default';
+      agentListEl.appendChild(emptyCard);
+      return;
+    }
+
+    let currentIndex = agents.findIndex((agent) => agent.id === selectedAgent);
+    if (currentIndex === -1) currentIndex = 0; // nothing matching is selected: inspect the first agent (selectedAgent is left unchanged)
+    const agent = agents[currentIndex];
+    removeAgentBtn.disabled = false;
+
+    const card = document.createElement('div');
+    card.className = 'agent-card agent-inspector';
+    card.innerHTML = `
+      <div class="agent-inspector-head">
+        <div class="agent-inspector-info">
+          <div class="agent-dot-wrapper">
+            <div class="agent-dot" style="background:${agent.color}"></div>
+            <input type="color" class="agent-color-input" value="${agent.color}" list="agent-colors">
+          </div>
+          <div>
+            <div class="agent-inspector-title">Agent ${agent.id}</div>
+          </div>
+        </div>
+      </div>
+      <div class="agent-inspector-grid">
+        <strong>Pos</strong><span>(${agent.row}, ${agent.col})</span>
+        <strong>Target</strong><span>(${agent.targetRow}, ${agent.targetCol})</span>
+        <!-- <strong>Mode</strong>
+        <span class="mode-toggle">
+          <svg class="mode-icon" data-mode="agent" width="22" height="22" viewBox="0 0 22 22">
+            <circle cx="11" cy="11" r="8" fill="${agent.color}" stroke="none"
+              opacity="${selectionMode === 'agent' ? 1 : 0.3}" />
+          </svg>
+          <svg class="mode-icon" data-mode="target" width="22" height="22" viewBox="0 0 22 22">
+            <circle cx="11" cy="11" r="7" fill="none" stroke="${agent.color}" stroke-width="3"
+              opacity="${selectionMode === 'target' ? 1 : 0.3}" />
+          </svg>
+        </span> -->
+      </div>
+    `;
+    agentListEl.appendChild(card);
+
+    /* card.querySelectorAll('.mode-icon').forEach(icon => {
+      icon.addEventListener('click', () => {
+        selectionMode = icon.dataset.mode;
+        const current = agents.find(a => a.id === selectedAgent);
+        if (current) applyFocusRing(current);
+        updatePanel();
+      });
+    }); */
+
+    const colorInput = card.querySelector('.agent-color-input');
+    if (colorInput) {
+      colorInput.addEventListener('input', (e) => { // live recolour while the picker is being used
+        const newColor = e.target.value;
+        agent.color = newColor;
+        agent.circleEl.setAttribute('fill', newColor);
+        agent.targetEl.setAttribute('stroke', newColor);
+        card.querySelector('.agent-dot').style.background = newColor; // updated in place, so the card is not rebuilt mid-pick
+      });
+      colorInput.addEventListener('change', () => colorInput.blur()); // release focus once a colour is committed (the keydown handler ignores keys while a colour input is the target)
+    }
+  }
+
+  const dirMap = { // keyboard key -> direction name; processHeldKeys looks the name up in DIR
+    ArrowUp: 'up', ArrowDown: 'down', ArrowLeft: 'left', ArrowRight: 'right',
+    h: 'left', j: 'down', k: 'up', l: 'right'
+    // w: 'up', a: 'left', s: 'down', d: 'right'
+  };
+  const heldKeys = new Set(); // direction keys currently held (added on keydown, removed on keyup)
+  let moveTimer = null; // setInterval handle of the repeat-move loop, or null while idle
+
+  function processHeldKeys() {
+    if (selectedAgent === null || heldKeys.size === 0) {
+      clearInterval(moveTimer);
+      moveTimer = null;
+      return;
+    }
+
+    let dr = 0;
+    let dc = 0;
+    for (const held of heldKeys) {
+      const direction = DIR[dirMap[held]];
+      if (direction) {
+        dr += direction[0];
+        dc += direction[1];
+      }
+    }
+    dr = Math.sign(dr);
+    dc = Math.sign(dc);
+    if (dr === 0 && dc === 0) return;
+
+    const agent = agents.find((entry) => entry.id === selectedAgent);
+    if (!agent) return;
+
+    if (selectionMode === 'target') {
+      const nextRow = agent.targetRow + dr;
+      const nextCol = agent.targetCol + dc;
+      moveAgentPart(agent, 'target', nextRow, nextCol, dr, dc);
+    } else {
+      const nextRow = agent.row + dr;
+      const nextCol = agent.col + dc;
+      moveAgentPart(agent, 'agent', nextRow, nextCol, dr, dc);
+    }
+  }
+
+  document.addEventListener('keydown', (event) => {
+    const tag = event.target.tagName;
+    if (tag === 'TEXTAREA' || tag === 'SELECT') return;
+    if (tag === 'INPUT') {
+      const t = event.target.type;
+      if (t === 'range') { event.target.blur(); }
+      else if (t === 'color') return;
+      else if (t === 'number') {
+        if (dirMap[event.key] || event.key === 'Tab' || event.key === ' ') event.target.blur();
+        else return;
+      }
+      else return;
+    }
+
+    if (event.key === 'Tab') {
+      event.preventDefault();
+      if (!agents.length) return;
+      const currentIndex = agents.findIndex((agent) => agent.id === selectedAgent);
+      let nextIndex;
+      if (event.shiftKey) {
+        nextIndex = currentIndex <= 0 ? agents.length - 1 : currentIndex - 1;
+      } else {
+        nextIndex = currentIndex === -1 || currentIndex >= agents.length - 1 ? 0 : currentIndex + 1;
+      }
+      selectAgent(agents[nextIndex].id, selectionMode);
+      return;
+    }
+
+    if (event.key === ' ') {
+      event.preventDefault();
+      if (selectedAgent === null) return;
+      selectionMode = selectionMode === 'agent' ? 'target' : 'agent';
+      const current = agents.find((agent) => agent.id === selectedAgent);
+      if (current) applyFocusRing(current);
+      updatePanel();
+      return;
+    }
+
+    if (event.key >= '0' && event.key <= '9') {
+      const id = parseInt(event.key, 10);
+      const agent = agents.find((agent) => agent.id === id);
+      if (agent) selectAgent(id, selectionMode);
+      return;
+    }
+
+    if ((event.key === '+' || event.key === '=') && !event.ctrlKey && !event.metaKey && !event.altKey) {
+      gridAPI.addAgent();
+      return;
+    }
+
+    if (event.key === '-' && !event.ctrlKey && !event.metaKey && !event.altKey) {
+      if (!agents.length) return;
+      const currentIndex = agents.findIndex((agent) => agent.id === selectedAgent);
+      const agent = agents[currentIndex === -1 ? 0 : currentIndex];
+      if (agent) gridAPI.removeAgent(agent.id);
+      return;
+    }
+
+    if (!dirMap[event.key]) return;
+    event.preventDefault();
+    if (heldKeys.has(event.key)) return;
+    heldKeys.add(event.key);
+    if (!moveTimer) {
+      processHeldKeys();
+      moveTimer = setInterval(processHeldKeys, MOVE_INTERVAL);
+    }
+  });
+
+  document.addEventListener('keyup', (event) => {
+    heldKeys.delete(event.key);
+    if (heldKeys.size === 0 && moveTimer) {
+      clearInterval(moveTimer);
+      moveTimer = null;
+    }
+  });
+
+  function createAgentRecord(row, col, targetRow, targetCol) { // Build a validated agent record (id, position, target, colour), or return null if it cannot be placed. Does not add it to `agents`.
+    if (row == null || col == null) { // position not fully given: take a cell from randomFreeCell()
+      const position = randomFreeCell();
+      if (!position) return null;
+      row = position[0];
+      col = position[1];
+    }
+    if (row < 0 || row >= ROWS || col < 0 || col >= COLS) return null; // start must be on the grid
+    if (obstacles.has(key(row, col)) || cellHasAgent(row, col)) return null; // start must not be an obstacle or already hold an agent
+
+    if (targetRow == null || targetCol == null) { // target not fully given: choose one at random
+      const takenTargets = new Set();
+      agents.forEach((agent) => takenTargets.add(key(agent.targetRow, agent.targetCol)));
+      const availableTargets = []; // obstacle-free, untaken cells other than the start cell
+      const fallbackTargets = []; // the same cells, start cell included
+      forEachCell(ROWS, COLS, (r, c) => {
+        const cellKey = key(r, c);
+        if (obstacles.has(cellKey) || takenTargets.has(cellKey)) return;
+        fallbackTargets.push([r, c]);
+        if (r !== row || c !== col) availableTargets.push([r, c]);
+      });
+      const choices = availableTargets.length ? availableTargets : fallbackTargets; // prefer a target away from the start cell
+      const target = choices[Math.floor(Math.random() * choices.length)];
+      if (!target) return null; // no candidate cell at all
+      targetRow = target[0];
+      targetCol = target[1];
+    }
+
+    if (targetRow < 0 || targetRow >= ROWS || targetCol < 0 || targetCol >= COLS) return null; // target must be on the grid
+    if (obstacles.has(key(targetRow, targetCol))) return null; // only obstacles are rejected here; an explicitly given target is not checked against other agents' targets
+
+    const id = nextAgentId++; // an id is consumed only once validation has passed
+    const color = COLORS[id % COLORS.length]; // cycle through COLORS by id
+    return { id, row, col, targetRow, targetCol, color };
+  }
+
+  function insertAgent(agent, { targetHitMount = targetHitGroup, targetMount = targetGroup, agentMount = agentGroup, labelMount = labelGroup, select = true, syncPanel = true } = {}) {
+    agents.push(agent);
+    createAgentElements(agent, targetHitMount, targetMount, agentMount, labelMount);
+    if (!showNumbering) agent.labelEl.style.display = 'none';
+    setAgentVisualPosition(agent);
+    setTargetVisualPosition(agent);
+
+    if (select) selectAgent(agent.id, 'agent', syncPanel);
+    else if (syncPanel) updatePanel();
+    return agent.id;
+  }
+
+  const gridAPI = {
+    moveAgent(agentId, direction) {
+      const agent = agents.find((entry) => entry.id === agentId);
+      if (!agent) return false;
+      const delta = DIR[direction];
+      if (!delta) return false;
+      return moveAgentPart(agent, 'agent', agent.row + delta[0], agent.col + delta[1]);
+    },
+    moveAgentTo(agentId, row, col) {
+      const agent = agents.find((entry) => entry.id === agentId);
+      if (!agent) return false;
+      return moveAgentPart(agent, 'agent', row, col);
+    },
+    addObstacle(row, col) {
+      if (row < 0 || row >= ROWS || col < 0 || col >= COLS) return false;
+      const itemKey = key(row, col);
+      if (obstacles.has(itemKey)) return false;
+      if (cellHasAgent(row, col) || cellHasTarget(row, col)) return false;
+      obstacles.add(itemKey);
+      drawObstacle(row, col);
+      updateMapStats();
+      updateGenerateControls();
+      return true;
+    },
+    removeObstacle(row, col) {
+      const itemKey = key(row, col);
+      if (!obstacles.has(itemKey)) return false;
+      obstacles.delete(itemKey);
+      removeObsEl(row, col);
+      updateMapStats();
+      updateGenerateControls();
+      return true;
+    },
+    clearObstacles() {
+      [...obstacles].forEach((itemKey) => {
+        const [r, c] = itemKey.split(',').map(Number);
+        obstacles.delete(itemKey);
+        removeObsEl(r, c);
+      });
+      updateMapStats();
+      updateGenerateControls();
+      return true;
+    },
+    addAgent(row, col, targetRow, targetCol) {
+      const agent = createAgentRecord(row, col, targetRow, targetCol);
+      if (!agent) return null;
+      return insertAgent(agent);
+    },
+    removeAgent(agentId) {
+      const index = agents.findIndex((agent) => agent.id === agentId);
+      if (index === -1) return false;
+      const agent = agents[index];
+      const wasSelected = selectedAgent === agentId;
+      const nextSelectedAgent = agents[index + 1] || agents[index - 1] || null;
+      removeAgentElements(agent);
+      agents.splice(index, 1);
+      if (wasSelected) {
+        selectedAgent = null;
+        if (nextSelectedAgent && agents.includes(nextSelectedAgent)) {
+          selectAgent(nextSelectedAgent.id, selectionMode, false);
+        }
+      }
+      if (agents.length === 0) nextAgentId = 0;
+      updatePanel();
+      return true;
+    },
+    getState() {
+      return {
+        rows: ROWS,
+        cols: COLS,
+        obstacles: getObstacleCoords(),
+        agents: agents.map((agent) => ({
+          id: agent.id,
+          row: agent.row,
+          col: agent.col,
+          targetRow: agent.targetRow,
+          targetCol: agent.targetCol,
+          color: agent.color
+        }))
+      };
+    },
+    loadConfig(config) {
+      agents.forEach((agent) => removeAgentElements(agent));
+      agents.length = 0;
+      obstacles.clear();
+      Object.keys(obsElements).forEach((itemKey) => delete obsElements[itemKey]);
+      selectedAgent = null;
+      nextAgentId = 0;
+
+      ROWS = config.rows;
+      COLS = config.cols;
+
+      if (config.obstacles) {
+        config.obstacles.forEach(([r, c]) => obstacles.add(key(r, c)));
+      }
+
+      buildSVG();
+
+      if (config.agents) {
+        const targetHitFragment = document.createDocumentFragment();
+        const targetFragment = document.createDocumentFragment();
+        const agentFragment = document.createDocumentFragment();
+        const labelFragment = document.createDocumentFragment();
+        config.agents.forEach((agent) => {
+          const nextAgent = createAgentRecord(agent.row, agent.col, agent.targetRow, agent.targetCol);
+          if (!nextAgent) return;
+          insertAgent(nextAgent, {
+            targetHitMount: targetHitFragment,
+            targetMount: targetFragment,
+            agentMount: agentFragment,
+            labelMount: labelFragment,
+            select: false,
+            syncPanel: false
+          });
+        });
+        targetHitGroup.appendChild(targetHitFragment);
+        targetGroup.appendChild(targetFragment);
+        agentGroup.appendChild(agentFragment);
+        labelGroup.appendChild(labelFragment);
+      }
+      if (agents.length) selectAgent(agents[0].id, 'agent');
+      else updatePanel();
+      updateMapStats();
+      updateGenerateControls();
+      updateResizeControls();
+    }
+  };
+
+  function copyText(text) {
+    return navigator.clipboard.writeText(text);
+  }
+
+  function generatePogemaSnippet() {
+    const mapText = getMapArray().map((row) => '    ' + row).join('\n');
+    const agentsXY = agents.map((agent) => `[${agent.row}, ${agent.col}]`).join(', ');
+    const targetsXY = agents.map((agent) => `[${agent.targetRow}, ${agent.targetCol}]`).join(', ');
+    return `grid_config = GridConfig(\n    map="""\n${mapText}\n    """,\n    agents_xy=[${agentsXY}],\n    targets_xy=[${targetsXY}],\n)`;
+  }
+
+  function downloadCurrentSvg() { // Export a cleaned-up copy of the editor SVG and trigger a browser download of it.
+    if (!svg) return;
+    const exportedSvg = svg.cloneNode(true); // work on a deep copy so the live editor is untouched
+    exportedSvg.removeAttribute('style');
+    exportedSvg.removeAttribute('width');
+    exportedSvg.removeAttribute('height');
+    exportedSvg.setAttribute('preserveAspectRatio', 'xMidYMid meet');
+    const lineColor = '#84a1ae';
+    const obstacleColor = '#84a1ae';
+    exportedSvg.querySelectorAll('.cell-hit, .target-hit, .selected-ring, .target-select-ring, circle[fill="transparent"][stroke="transparent"]').forEach((element) => element.remove()); // strip hit areas, selection rings and fully transparent circles
+    exportedSvg.querySelectorAll('g').forEach(g => { // drop groups that have no child elements
+      if (!g.children.length) g.remove();
+    });
+    exportedSvg.querySelectorAll('.grid-line').forEach((line) => { // write presentation attributes directly on the exported nodes
+      line.setAttribute('stroke', lineColor);
+      line.setAttribute('stroke-width', '10');
+    });
+    exportedSvg.querySelectorAll('.obstacle').forEach((rect) => {
+      rect.setAttribute('fill', obstacleColor);
+    });
+    exportedSvg.querySelectorAll('.target-circle').forEach((circle) => {
+      circle.setAttribute('fill', 'none');
+      circle.setAttribute('stroke-width', '10');
+    });
+    exportedSvg.querySelectorAll('.agent-label').forEach((label) => {
+      label.setAttribute('fill', '#fff');
+      label.setAttribute('font-size', '28');
+      label.setAttribute('font-weight', 'bold');
+      label.setAttribute('text-anchor', 'middle');
+      label.setAttribute('dominant-baseline', 'central');
+      label.style.removeProperty('display'); // labels hidden in the editor (selected agent, numbering off) are shown in the export
+    });
+    const serialized = new XMLSerializer().serializeToString(exportedSvg);
+    const svgText = serialized.startsWith('<?xml') // prepend an XML declaration unless one is already there
+      ? serialized
+      : `<?xml version="1.0" encoding="UTF-8"?>\n${serialized}`;
+    const blob = new Blob([svgText], { type: 'image/svg+xml;charset=utf-8' });
+    const url = URL.createObjectURL(blob);
+    const link = document.createElement('a'); // temporary link, clicked programmatically to start the download
+    link.href = url;
+    link.download = `pogema-map-${ROWS}x${COLS}.svg`;
+    document.body.appendChild(link);
+    link.click();
+    link.remove();
+    setTimeout(() => URL.revokeObjectURL(url), 0); // release the blob URL on the next tick
+  }
+
+  function updateMapStats() {
+    const freeCells = getFreeCellCount();
+    statSize.textContent = `${ROWS}×${COLS}`;
+    statObstacles.textContent = String(obstacles.size);
+    statFree.textContent = String(freeCells);
+    statDensity.textContent = `${((obstacles.size / (ROWS * COLS)) * 100).toFixed(1)}%`;
+  }
+
+
+  function updateGenerateControls() {
+    const maxAgents = getFreeCellCount();
+    const normalizedMax = Math.max(1, maxAgents);
+    agentCountSlider.min = 1;
+    agentCountSlider.max = normalizedMax;
+    agentCountInput.min = 1;
+    agentCountInput.max = normalizedMax;
+
+    const nextValue = clampCountInput(agentCountInput, 1, normalizedMax, Math.min(8, normalizedMax));
+    agentCountSlider.value = nextValue;
+    generateBtn.disabled = maxAgents < 1;
+    if (maxAgents < 1) {
+      generateBtn.textContent = 'Need More Free Cells';
+    } else {
+      generateBtn.textContent = 'Generate Agents & Targets';
+    }
+  }
+
+  function loadRandomMap(rows, cols, density, seed) {
+    const rng = createSeededRandom(seed);
+    const obstacleCoords = [];
+    forEachCell(rows, cols, (r, c) => {
+      if (rng() < density / 100) obstacleCoords.push([r, c]);
+    });
+    gridAPI.loadConfig({
+      rows,
+      cols,
+      obstacles: obstacleCoords,
+      agents: []
+    });
+  }
+
+
+  function getResizedObstacles(nextRows, nextCols, rowOffset, colOffset) {
+    return getObstacleCoords()
+      .map(([r, c]) => [r + rowOffset, c + colOffset])
+      .filter(([r, c]) => r >= 0 && r < nextRows && c >= 0 && c < nextCols);
+  }
+
+  function resizeMap(nextRows, nextCols, rowOffset, colOffset) {
+    const nextObstacles = getResizedObstacles(nextRows, nextCols, rowOffset, colOffset);
+    gridAPI.loadConfig({
+      rows: nextRows,
+      cols: nextCols,
+      obstacles: nextObstacles,
+      agents: []
+    });
+  }
+
+  function resizeMapCentered(nextRows, nextCols) {
+    const rowOffset = Math.floor((nextRows - ROWS) / 2);
+    const colOffset = Math.floor((nextCols - COLS) / 2);
+    resizeMap(nextRows, nextCols, rowOffset, colOffset);
+  }
+
+  function getResizeState(action) {
+    const config = RESIZE_ACTIONS[action];
+    if (!config) return null;
+    return {
+      nextRows: ROWS + config.rowsDelta,
+      nextCols: COLS + config.colsDelta,
+      rowOffset: config.rowOffset,
+      colOffset: config.colOffset
+    };
+  }
+
+  function canResize(action) {
+    const s = getResizeState(action);
+    return !!s &&
+      s.nextRows >= MIN_DIMENSION && s.nextRows <= MAX_DIMENSION &&
+      s.nextCols >= MIN_DIMENSION && s.nextCols <= MAX_DIMENSION;
+  }
+
+  function applyResizeAction(action) {
+    if (!canResize(action)) return;
+    const s = getResizeState(action);
+    resizeMap(s.nextRows, s.nextCols, s.rowOffset, s.colOffset);
+  }
+
+  function updateResizeControls() {
+    resizeButtons.forEach((button) => {
+      const direction = button.dataset.resizeDirection;
+      const action = `${resizeMode}-${direction}`;
+      button.disabled = !canResize(action);
+      button.textContent = RESIZE_GLYPHS[resizeMode][direction];
+      button.title = (resizeMode === 'add' ? 'Grow ' : 'Shrink ') + direction.replace('-', ' ');
+    });
+    resizeModeToggle.textContent = resizeMode === 'add' ? '+' : '\u2212';
+    resizeModeToggle.dataset.mode = resizeMode;
+    resizeModeToggle.title = resizeMode === 'add' ? 'Switch to shrink mode' : 'Switch to grow mode';
+  }
+
+  function generateLocalAgents() {
+    const requested = clampCountInput(agentCountInput, 1, parseInt(agentCountInput.max, 10), 1);
+    agentCountSlider.value = requested;
+
+    const freeCells = [];
+    forEachCell(ROWS, COLS, (r, c) => {
+      if (!obstacles.has(key(r, c))) freeCells.push([r, c]);
+    });
+
+    const maxAgents = freeCells.length;
+    if (requested > maxAgents) return;
+
+    const rng = createSeededRandom(Math.floor(Math.random() * 0x100000000));
+    shuffleInPlace(freeCells, rng);
+
+    const targetCells = freeCells.slice();
+    shuffleInPlace(targetCells, rng);
+
+    const generatedAgents = [];
+    for (let i = 0; i < requested; i++) {
+      const position = freeCells[i];
+      const target = targetCells[i];
+      generatedAgents.push({
+        row: position[0],
+        col: position[1],
+        targetRow: target[0],
+        targetCol: target[1]
+      });
+    }
+
+    gridAPI.loadConfig({
+      rows: ROWS,
+      cols: COLS,
+      obstacles: getObstacleCoords(),
+      agents: generatedAgents
+    });
+  }
+  randomizeBtn.addEventListener('click', () => {
+    const density = clampCountInput(densityInput, 0, 70, 18);
+    densitySlider.value = density;
+    const seed = Math.floor(Math.random() * 0x100000000);
+    loadRandomMap(ROWS, COLS, density, seed);
+  });
+
+  clearObstaclesBtn.addEventListener('click', () => {
+    gridAPI.clearObstacles();
+  });
+
+  resizeButtons.forEach((button) => {
+    button.addEventListener('click', () => applyResizeAction(`${resizeMode}-${button.dataset.resizeDirection}`));
+  });
+
+  resizeModeToggle.addEventListener('click', () => {
+    resizeMode = resizeMode === 'add' ? 'remove' : 'add';
+    updateResizeControls();
+  });
+
+  sizePresetButtons.forEach((button) => {
+    button.addEventListener('click', () => {
+      resizeMapCentered(parseInt(button.dataset.rows, 10), parseInt(button.dataset.cols, 10));
+    });
+  });
+
+  bindRangeNumberInput(densitySlider, densityInput, () => ({ min: 0, max: 70 }), 18);
+  bindRangeNumberInput(agentCountSlider, agentCountInput, () => ({ min: 1, max: parseInt(agentCountInput.max, 10) }), 1);
+
+  generateBtn.addEventListener('click', generateLocalAgents);
+  addAgentBtn.addEventListener('click', () => gridAPI.addAgent());
+  removeAgentBtn.addEventListener('click', () => {
+    if (!agents.length) return;
+    const currentIndex = agents.findIndex((agent) => agent.id === selectedAgent);
+    const agent = agents[currentIndex === -1 ? 0 : currentIndex];
+    if (agent) gridAPI.removeAgent(agent.id);
+  });
+
+  toggleNumberingBtn.addEventListener('click', () => {
+    showNumbering = !showNumbering;
+    toggleNumberingBtn.style.opacity = showNumbering ? '' : '0.5';
+    agents.forEach((agent) => {
+      agent.labelEl.style.display = (!showNumbering || agent.id === selectedAgent) ? 'none' : '';
+    });
+  });
+
+  toggleSelectionBtn.addEventListener('click', () => {
+    showSelection = !showSelection;
+    toggleSelectionBtn.style.opacity = showSelection ? '' : '0.5';
+    agents.forEach((agent) => {
+      if (agent.id === selectedAgent) {
+        agent.selectEl.style.display = showSelection ? '' : 'none';
+        agent.targetSelectEl.style.display = showSelection ? '' : 'none';
+      }
+    });
+  });
+
+  copyBtn.addEventListener('click', () => {
+    copyText(generatePogemaSnippet()).then(() => {
+      copyBtn.innerHTML = '&#10003; Copied';
+      setTimeout(() => { copyBtn.innerHTML = '&#128203; Copy Pogema Snippet'; }, 1400);
+    });
+  });
+
+  downloadSvgBtn.addEventListener('click', () => {
+    downloadCurrentSvg();
+    downloadSvgBtn.innerHTML = '&#10003; Downloaded';
+    setTimeout(() => { downloadSvgBtn.innerHTML = '&#10515; Download SVG'; }, 1400);
+  });
+
+  // Theme: sessionStorage overrides URL param
+  let saved = sessionStorage.getItem('pogema-editor-theme');
+  let nightMode = saved ? saved === 'night' : new URLSearchParams(window.location.search).get('theme') === 'slate';
+  function applyTheme() {
+    document.body.className = nightMode ? 'night' : 'day';
+    document.documentElement.classList.toggle('night', nightMode);
+    toggleBtn.innerHTML = nightMode ? '&#9788;' : '&#9790;';
+    toggleBtn.title = nightMode ? 'Switch to day mode' : 'Switch to night mode';
+  }
+
+  toggleBtn.addEventListener('click', () => {
+    nightMode = !nightMode;
+    sessionStorage.setItem('pogema-editor-theme', nightMode ? 'night' : 'day');
+    applyTheme();
+  });
+
+  window.grid = gridAPI; // expose the editing API globally as `grid`
+
+  applyTheme(); // apply the initial theme computed above
+  loadRandomMap(8, 8, 18, Math.floor(Math.random() * 0x100000000)); // initial 8x8 map, density 18 (percent), random seed
+  generateLocalAgents(); // populate the initial map using the agent-count input
+})();
+</script>
+</body>
+</html>

From 4fa8e631d16c364fbbc5d3959cc451023860be46 Mon Sep 17 00:00:00 2001
From: Alexey Skrynnik <Tviskaron@gmail.com>
Date: Sat, 11 Apr 2026 13:54:00 +0300
Subject: [PATCH 15/15] Update __init__.py

---
 pogema/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pogema/__init__.py b/pogema/__init__.py
index 9488aaf..ac26ddb 100644
--- a/pogema/__init__.py
+++ b/pogema/__init__.py
@@ -22,7 +22,7 @@
 from pogema.wrappers.multi_time_limit import MultiTimeLimit
 from pogema.wrappers.persistence import PersistentWrapper
 
-__version__ = '1.4.0'
+__version__ = '2.0.0a'
 
 __all__ = [
     'GridConfig',