Merge pull request #70 from strakam/restructure-files-update-readme

Restructure files update readme
strakam · Oct 2, 2024 · d7f9924 · d7f9924
2 parents f26eb44 + 8e93898
commit d7f9924
Show file tree

Hide file tree

Showing 26 changed files with 94 additions and 82 deletions.
diff --git a/Makefile b/Makefile
@@ -28,7 +28,7 @@ at:
 	python3 tests/sb3_check.py
 
 test_performance:
-	python3 -m tests.parallel_api_test
+	python3 -m tests.parallel_api_check
 
 pytest:
 	pytest

diff --git a/README.md b/README.md
@@ -13,7 +13,10 @@
 [Installation](#-installation) • [Getting Started](#-getting-started) • [Customization](#-custom-maps) • [Environment](#-environment)
 </div>
 
-[Generals.io](https://generals.io/) is a real-time strategy game where players compete to conquer their opponents' generals on a 2D grid. While the goal is simple — capture the enemy general — the gameplay involves a lot of depth. Players need to employ strategic planning, deception, and manage both micro and macro mechanics throughout the game. The combination of these elements makes the game highly engaging and complex.
+Generals-RL is a real-time strategy environment where players compete to conquer their opponents' generals on a 2D grid.
+While the goal is simple — capture the enemy general — the gameplay involves a lot of depth.
+Players need to employ strategic planning, deception, and manage both micro and macro mechanics throughout the game.
+The combination of these elements makes the game highly engaging and complex.
 
 This repository aims to make bot development more accessible, especially for Machine Learning based agents.
 
@@ -23,6 +26,10 @@ Highlights:
 * 🔧 Easy customization of environments
 * 🔬 Analysis tools such as replays
 
+> [!NOTE]
+> This repository is based on the [generals.io](https://generals.io) game.
+> Check it out, it's a lot of fun!
+
 ## 📦 Installation
 Stable release version is available through pip:
 ```bash
@@ -38,7 +45,7 @@ pip install -e .
 ## Usage example (🤸 Gymnasium)
 
 ```python
-from generals.env import gym_generals
+from generals import gym_generals
 from generals.agents import RandomAgent, ExpanderAgent
 
 # Initialize agents
@@ -73,44 +80,44 @@ Creating your first agent is very simple.
 > [!TIP]
 > Check out `Makefile` and run some examples to get a feel for the game 🤗.
 
-## 🎨 Custom maps
-Maps are handled via `Mapper` class. You can instantiate the class with desired map properties, and it will generate
-maps with these properties for each run.
+## 🎨 Custom grids
+Grids are generated via `GridFactory`. You can instantiate the class with the desired grid properties, and it will generate
+a grid with these properties for each run.
 ```python
-from generals.env import pz_generals
-from generals.map import Mapper
+from generals import pz_generals
+from generals import GridFactory
 
-mapper = Mapper(
+grid_factory = GridFactory(
     grid_dims=(10, 10),                    # Dimensions of the grid (height, width)
     mountain_density=0.2,                  # Probability of a mountain in a cell
     city_density=0.05,                     # Probability of a city in a cell
     general_positions=[(0,3),(5,7)],       # Positions of generals (i, j)
 )
 
 # Create environment
-env = pz_generals(mapper=mapper, ...)
+env = pz_generals(grid_factory=grid_factory, ...)
 ```
-You can also specify map manually, as a string via `options` dict:
+You can also specify grids manually, as a string via `options` dict:
 ```python
-from generals.env import pz_generals
-from generals.map import Mapper
+from generals import pz_generals
+from generals import GridFactory
 
-mapper = Mapper()
-env = pz_generals(mapper=mapper, ...)
+grid_factory = GridFactory()
+env = pz_generals(grid_factory=grid_factory, ...)
 
-map = """
+grid = """
 .3.#
 #..A
 #..#
 .#.B
 """
 
-options = {'map' : map}
+options = {"grid": grid}
 
-# Pass the new map to the environment (for the next game)
+# Pass the new grid to the environment (for the next game)
 env.reset(options=options)
 ```
-Maps are encoded using these symbols:
+Grids are encoded using these symbols:
 - `.` for cells where you can move your army
 - `#` for mountains (terrain that can not be passed)
 - `A,B` are positions of generals
@@ -120,7 +127,7 @@ Maps are encoded using these symbols:
 We can store replays and then analyze them. `Replay` class handles replay related functionality.
 ### Storing a replay
 ```python
-from generals.env import pz_generals
+from generals import pz_generals
 
 options = {"replay": "my_replay"}
 env = pz_generals(...)
@@ -130,7 +137,7 @@ env.reset(options=options) # The next game will be encoded in my_replay.pkl
 ### Loading a replay
 
 ```python
-from generals.replay import Replay
+from generals import Replay
 
 # Initialize Replay instance
 replay = Replay.load("my_replay")
@@ -189,6 +196,6 @@ def custom_reward_fn(observation, action, done, info):
     # Give agent a reward based on the number of cells they own
     return observation["observation"]["owned_land_count"]
 
-env = generals_v0(reward_fn=custom_reward_fn)
+env = pz_generals(reward_fn=custom_reward_fn)
 observations, info = env.reset()
 ```
diff --git a/examples/complete_example.py b/examples/complete_example.py
@@ -1,6 +1,6 @@
-from generals.env import pz_generals
+from generals import pz_generals
 from generals.agents import RandomAgent, ExpanderAgent
-from generals.grid import GridFactory
+from generals import GridFactory
 
 # Initialize agents - their names are then called for actions
 randomer = RandomAgent("Random1", color=(255, 125, 0))
@@ -18,7 +18,7 @@
     general_positions=[(0, 0), (3, 3)],
 )
 
-# Custom map that will override mapper's map for next game
+# Custom map that will override GridFactory for this game
 map = """
 A..#
 .#3#
@@ -30,7 +30,7 @@
 env = pz_generals(gf, agents, render_mode=None) # Disable rendering
 
 options = {
-    "map": map,
+    "grid": map,
     "replay_file": "replay",
 }
 

diff --git a/examples/gymnasium_example.py b/examples/gymnasium_example.py
@@ -1,4 +1,4 @@
-from generals.env import gym_generals
+from generals import gym_generals
 from generals.agents import RandomAgent, ExpanderAgent
 
 # Initialize agents

diff --git a/examples/pettingzoo_example.py b/examples/pettingzoo_example.py
@@ -1,4 +1,4 @@
-from generals.env import pz_generals
+from generals import pz_generals
 from generals.agents import ExpanderAgent, RandomAgent
 
 # Initialize agents

diff --git a/examples/replay_example.py b/examples/replay_example.py
@@ -1,4 +1,4 @@
-from generals.replay import Replay
+from generals import Replay
 
 replay = Replay.load("replay.pkl")
 replay.play()
diff --git a/generals/__init__.py b/generals/__init__.py
@@ -1,6 +1,6 @@
+from .core.grid import GridFactory, Grid
+from .envs.env import pz_generals, gym_generals
+from .core.replay import Replay
 
 
-__all__ = ['generals', 'generals_v0', 'game', 'game_config']
-
-__version__ = '0.0.1'
-__author__ = 'Matej Straka'
+__all__ = ['GridFactory', 'Grid', 'Replay', 'pz_generals', 'gym_generals']
diff --git a/generals/agents/expander_agent.py b/generals/agents/expander_agent.py
@@ -1,7 +1,7 @@
 import numpy as np
 from .agent import Agent
 
-from generals.config import DIRECTIONS
+from generals.core.config import DIRECTIONS
 
 
 class ExpanderAgent(Agent):

diff --git a/generals/integrations/__init__.py → generals/core/__init__.py b/generals/integrations/__init__.py → generals/core/__init__.py
diff --git a/generals/channels.py → generals/core/channels.py b/generals/channels.py → generals/core/channels.py
@@ -1,6 +1,6 @@
 import numpy as np
 
-from generals.config import MOUNTAIN, PASSABLE
+from .config import MOUNTAIN, PASSABLE
 
 valid_generals = ["A", "B"]  # Generals are represented by A and B
 

diff --git a/generals/config.py → generals/core/config.py b/generals/config.py → generals/core/config.py
@@ -19,7 +19,6 @@
 ##################
 # Game constants #
 ##################
-INCREMENT_RATE: int = 50 # every 50 ticks, number of units increases
 GAME_SPEED: float = 8 # by default, every 8 ticks, actions are processed
 
 ########################

diff --git a/generals/game.py → generals/core/game.py b/generals/game.py → generals/core/game.py
@@ -1,20 +1,22 @@
 import warnings
 from typing import Any
+from typing_extensions import TypeAlias
 
-from .channels import Channels
-from generals.grid import Grid
 import numpy as np
 import gymnasium as gym
-from typing_extensions import TypeAlias
 
-from generals.config import DIRECTIONS, PASSABLE, MOUNTAIN, INCREMENT_RATE
+from .channels import Channels
+from .grid import Grid
+from .config import DIRECTIONS
 
 from scipy.ndimage import maximum_filter
 
 Observation: TypeAlias = dict[str, gym.Space | dict[str, gym.Space]]
 Action: TypeAlias = gym.Space
 Info: TypeAlias = dict[str, Any]
 
+increment_rate = 50
+
 
 class Game:
     def __init__(self, grid: Grid, agents: list[str]):
@@ -138,7 +140,9 @@ def visibility_channel(self, ownership_channel: np.ndarray) -> np.ndarray:
         """
         return maximum_filter(ownership_channel, size=3)
 
-    def step(self, actions: dict[str, Action]) -> tuple[dict[str, Observation], dict[str, dict]]:
+    def step(
+        self, actions: dict[str, Action]
+    ) -> tuple[dict[str, Observation], dict[str, dict]]:
         """
         Perform one step of the game
 
@@ -242,18 +246,16 @@ def _global_game_update(self) -> None:
 
         owners = self.agents
 
-        # every TICK_RATE steps, increase army size in each cell
-        if self.time % INCREMENT_RATE == 0:
+        # every `increment_rate` steps, increase army size in each cell
+        if self.time % increment_rate == 0:
             for owner in owners:
                 self.channels.army += self.channels.ownership[owner]
 
         # Increment armies on general and city cells, but only if they are owned by player
         if self.time % 2 == 0 and self.time > 0:
             update_mask = self.channels.general + self.channels.city
             for owner in owners:
-                self.channels.army += (
-                    update_mask * self.channels.ownership[owner]
-                )
+                self.channels.army += update_mask * self.channels.ownership[owner]
 
     def is_done(self) -> bool:
         """

diff --git a/generals/grid.py → generals/core/grid.py b/generals/grid.py → generals/core/grid.py
@@ -1,5 +1,5 @@
 import numpy as np
-from generals.config import PASSABLE, MOUNTAIN
+from .config import PASSABLE, MOUNTAIN
 
 
 class Grid:

diff --git a/generals/replay.py → generals/core/replay.py b/generals/replay.py → generals/core/replay.py
@@ -1,9 +1,9 @@
 import pickle
 import time
 
-from generals.grid import Grid
+from generals.core.grid import Grid
+from generals.core.game import Game
 from generals.gui import GUI
-from generals.game import Game
 from copy import deepcopy
 
 

diff --git a/generals/envs/__init__.py b/generals/envs/__init__.py
diff --git a/generals/env.py → generals/envs/env.py b/generals/env.py → generals/envs/env.py
@@ -1,8 +1,9 @@
-from .agents import Agent
-from .integrations.gymnasium_integration import Gym_Generals, RewardFn
-from .integrations.pettingzoo_integration import PZ_Generals
+from generals.agents import Agent
+from .gymnasium_integration import Gym_Generals, RewardFn
+from .pettingzoo_integration import PZ_Generals
+
+from generals import GridFactory
 
-from .grid import GridFactory
 
 
 def pz_generals(

diff --git a/...als/integrations/gymnasium_integration.py → generals/envs/gymnasium_integration.py b/...als/integrations/gymnasium_integration.py → generals/envs/gymnasium_integration.py
@@ -5,14 +5,13 @@
 import functools
 from copy import deepcopy
 
-from ..agents import Agent
-from ..game import Game, Action, Observation
-from ..grid import GridFactory
-from ..gui import GUI
-from ..replay import Replay
+from generals.agents import Agent
+from generals.core.game import Game, Action, Observation, Info
+from generals.core.grid import GridFactory
+from generals.gui import GUI
+from generals.core.replay import Replay
 
 # Type aliases
-from generals.game import Info
 Reward: TypeAlias = float
 RewardFn: TypeAlias = Callable[[dict[str, Observation], Action, bool, Info], Reward]
 

diff --git a/...ls/integrations/pettingzoo_integration.py → generals/envs/pettingzoo_integration.py b/...ls/integrations/pettingzoo_integration.py → generals/envs/pettingzoo_integration.py
@@ -8,16 +8,14 @@
 
 from pettingzoo.utils.env import AgentID
 
-from ..game import Game, Action, Observation
-from ..grid import GridFactory
-from ..agents import Agent
-from ..gui import GUI
-from ..replay import Replay
+from generals.core.game import Game, Action, Observation, Info
+from generals.core.grid import GridFactory
+from generals.agents import Agent
+from generals.gui import GUI
+from generals.core.replay import Replay
 
 
 # Type aliases
-from generals.game import Info
-
 Reward: TypeAlias = float
 RewardFn: TypeAlias = Callable[[dict[str, Observation], Action, bool, Info], Reward]
 
@@ -63,9 +61,9 @@ def render(self, fps=6) -> None:
         if self.render_mode == "human":
             self.gui.tick(fps=fps)
 
-    def reset(self, seed: int | None = None, options: dict | None = None) -> tuple[
-        dict[AgentID, Observation], dict[AgentID, dict]
-    ]:
+    def reset(
+        self, seed: int | None = None, options: dict | None = None
+    ) -> tuple[dict[AgentID, Observation], dict[AgentID, dict]]:
         if options is None:
             options = {}
         self.agents = deepcopy(self.possible_agents)
@@ -94,8 +92,14 @@ def reset(self, seed: int | None = None, options: dict | None = None) -> tuple[
         infos = {agent: {} for agent in self.agents}
         return observations, infos
 
-    def step(self, actions: dict[AgentID, Action]) -> tuple[
-        dict[AgentID, Observation], dict[AgentID, float], dict[AgentID, bool], dict[AgentID, bool], dict[AgentID, Info]
+    def step(
+        self, actions: dict[AgentID, Action]
+    ) -> tuple[
+        dict[AgentID, Observation],
+        dict[AgentID, float],
+        dict[AgentID, bool],
+        dict[AgentID, bool],
+        dict[AgentID, Info],
     ]:
         observations, infos = self.game.step(actions)
 

diff --git a/generals/gui/gui.py b/generals/gui/gui.py
@@ -1,6 +1,6 @@
 from typing import Any
 
-from ..game import Game
+from generals.core.game import Game
 from .properties import Properties
 from .event_handler import EventHandler
 from .rendering import Renderer

diff --git a/generals/gui/properties.py b/generals/gui/properties.py
@@ -3,8 +3,8 @@
 
 from pygame.time import Clock
 
-from generals import config as c
-from generals.game import Game
+from generals.core import config as c
+from generals.core.game import Game
 
 
 @dataclass