Add registration functions for envs and intelligence backends (#115)

Farama-Foundation · Dec 19, 2023
commit 2dcaa08 · 1 parent 767ed20
Show file tree

Hide file tree

Showing 14 changed files with 131 additions and 42 deletions.
diff --git a/chatarena/backends/__init__.py b/chatarena/backends/__init__.py
@@ -1,21 +1,11 @@
 from ..config import BackendConfig
 from .anthropic import Claude
-from .base import IntelligenceBackend
+from .base import BACKEND_REGISTRY, IntelligenceBackend, register_backend
 from .cohere import CohereAIChat
 from .hf_transformers import TransformersConversational
 from .human import Human
 from .openai import OpenAIChat
 
-ALL_BACKENDS = [
-    Human,
-    OpenAIChat,
-    CohereAIChat,
-    TransformersConversational,
-    Claude,
-]
-
-BACKEND_REGISTRY = {backend.type_name: backend for backend in ALL_BACKENDS}
-
 
 # Load a backend from a config dictionary
 def load_backend(config: BackendConfig):

diff --git a/chatarena/backends/anthropic.py b/chatarena/backends/anthropic.py
@@ -6,7 +6,7 @@
 
 from ..message import SYSTEM_NAME as SYSTEM
 from ..message import Message
-from .base import IntelligenceBackend
+from .base import IntelligenceBackend, register_backend
 
 try:
     import anthropic
@@ -25,6 +25,7 @@
 DEFAULT_MODEL = "claude-v1"
 
 
+@register_backend
 class Claude(IntelligenceBackend):
     """Interface to the Claude offered by Anthropic."""
 

diff --git a/chatarena/backends/base.py b/chatarena/backends/base.py
@@ -1,5 +1,5 @@
 from abc import abstractmethod
-from typing import List
+from typing import Dict, List, Type
 
 from ..config import BackendConfig, Configurable
 from ..message import Message
@@ -64,3 +64,12 @@ def reset(self):
             raise NotImplementedError
         else:
             pass
+
+
+BACKEND_REGISTRY: Dict[str, Type[IntelligenceBackend]] = {}
+
+
+def register_backend(cls: Type[IntelligenceBackend]) -> Type[IntelligenceBackend]:
+    """Register a new backend."""
+    BACKEND_REGISTRY[cls.type_name] = cls
+    return cls
diff --git a/chatarena/backends/cohere.py b/chatarena/backends/cohere.py
@@ -4,7 +4,7 @@
 from tenacity import retry, stop_after_attempt, wait_random_exponential
 
 from ..message import Message
-from .base import IntelligenceBackend
+from .base import IntelligenceBackend, register_backend
 
 # Try to import the cohere package and check whether the API key is set
 try:
@@ -23,6 +23,7 @@
 DEFAULT_MODEL = "command-xlarge"
 
 
+@register_backend
 class CohereAIChat(IntelligenceBackend):
     """Interface to the Cohere API."""
 

diff --git a/chatarena/backends/hf_transformers.py b/chatarena/backends/hf_transformers.py
@@ -6,7 +6,7 @@
 
 from ..message import SYSTEM_NAME as SYSTEM
 from ..message import Message
-from .base import IntelligenceBackend
+from .base import IntelligenceBackend, register_backend
 
 
 @contextmanager
@@ -32,6 +32,7 @@ def suppress_stdout_stderr():
         is_transformers_available = True
 
 
+@register_backend
 class TransformersConversational(IntelligenceBackend):
     """Interface to the Transformers ConversationalPipeline."""
 

diff --git a/chatarena/backends/human.py b/chatarena/backends/human.py
@@ -1,5 +1,5 @@
 from ..config import BackendConfig
-from .base import IntelligenceBackend
+from .base import IntelligenceBackend, register_backend
 
 
 # An Error class for the human backend
@@ -9,6 +9,7 @@ def __init__(self, agent_name: str):
         super().__init__(f"Human backend requires a UI to get input from {agent_name}.")
 
 
+@register_backend
 class Human(IntelligenceBackend):
     stateful = False
     type_name = "human"

diff --git a/chatarena/backends/openai.py b/chatarena/backends/openai.py
@@ -5,7 +5,7 @@
 from tenacity import retry, stop_after_attempt, wait_random_exponential
 
 from ..message import SYSTEM_NAME, Message
-from .base import IntelligenceBackend
+from .base import IntelligenceBackend, register_backend
 
 try:
     import openai
@@ -31,6 +31,7 @@
 BASE_PROMPT = f"The messages always end with the token {END_OF_MESSAGE}."
 
 
+@register_backend
 class OpenAIChat(IntelligenceBackend):
     """Interface to the ChatGPT style model with system, user, assistant roles separation."""
 

diff --git a/chatarena/environments/__init__.py b/chatarena/environments/__init__.py
@@ -1,20 +1,10 @@
 from ..config import EnvironmentConfig
-from .base import Environment, TimeStep
+from .base import ENV_REGISTRY, Environment, TimeStep, register_env
 from .chameleon import Chameleon
 from .conversation import Conversation, ModeratedConversation
 from .pettingzoo_chess import PettingzooChess
 from .pettingzoo_tictactoe import PettingzooTicTacToe
 
-ALL_ENVIRONMENTS = [
-    Conversation,
-    ModeratedConversation,
-    Chameleon,
-    PettingzooChess,
-    PettingzooTicTacToe,
-]
-
-ENV_REGISTRY = {env.type_name: env for env in ALL_ENVIRONMENTS}
-
 
 # Load an environment from a config dictionary
 def load_environment(config: EnvironmentConfig):

diff --git a/chatarena/environments/base.py b/chatarena/environments/base.py
@@ -1,6 +1,6 @@
 from abc import abstractmethod
 from dataclasses import dataclass
-from typing import Dict, List
+from typing import Dict, List, Type
 
 from ..config import Configurable, EnvironmentConfig
 from ..message import Message
@@ -185,3 +185,20 @@ def get_one_rewards(self) -> Dict[str, float]:
             Dict[str, float]: A dictionary of players and their rewards (all one).
         """
         return {player_name: 1.0 for player_name in self.player_names}
+
+
+ENV_REGISTRY: Dict[str, Type[Environment]] = {}
+
+
+def register_env(cls: Type[Environment]) -> Type[Environment]:
+    """
+    Register an environment class.
+
+    Parameters:
+        cls (Type[Environment]): The class to register.
+
+    Returns:
+        Type[Environment]: The class that was registered.
+    """
+    ENV_REGISTRY[cls.type_name] = cls
+    return cls
diff --git a/chatarena/environments/chameleon.py b/chatarena/environments/chameleon.py
@@ -4,7 +4,7 @@
 
 from ..agent import SIGNAL_END_OF_CONVERSATION
 from ..message import Message, MessagePool
-from .base import Environment, TimeStep
+from .base import Environment, TimeStep, register_env
 
 DEFAULT_TOPIC_CODES = {
     "Fruits": [
@@ -50,6 +50,7 @@
 }
 
 
+@register_env
 class Chameleon(Environment):
     type_name = "chameleon"
 

diff --git a/chatarena/environments/conversation.py b/chatarena/environments/conversation.py
@@ -3,9 +3,10 @@
 from ..agent import SIGNAL_END_OF_CONVERSATION, Moderator
 from ..config import AgentConfig, EnvironmentConfig
 from ..message import Message, MessagePool
-from .base import Environment, TimeStep
+from .base import Environment, TimeStep, register_env
 
 
+@register_env
 class Conversation(Environment):
     """
     Turn-based fully observable conversation environment.
@@ -93,6 +94,7 @@ def step(self, player_name: str, action: str) -> TimeStep:
         return timestep
 
 
+@register_env
 class ModeratedConversation(Conversation):
     """
     Turn-based fully observable conversation environment.

diff --git a/chatarena/environments/pettingzoo_chess.py b/chatarena/environments/pettingzoo_chess.py
@@ -4,7 +4,7 @@
 from pettingzoo.classic import chess_v6
 from pettingzoo.classic.chess.chess_utils import chess, get_move_plane
 
-from chatarena.environments.base import Environment, TimeStep
+from chatarena.environments.base import Environment, TimeStep, register_env
 
 from ..message import Message, MessagePool
 
@@ -27,6 +27,7 @@ def action_string_to_alphazero_format(action: str, player_index: int) -> int:
     return x1 * 8 * 73 + y1 * 73 + move_plane
 
 
+@register_env
 class PettingzooChess(Environment):
     type_name = "pettingzoo:chess"
 

diff --git a/chatarena/environments/pettingzoo_tictactoe.py b/chatarena/environments/pettingzoo_tictactoe.py
@@ -3,7 +3,7 @@
 
 from pettingzoo.classic import tictactoe_v3
 
-from chatarena.environments.base import Environment, TimeStep
+from chatarena.environments.base import Environment, TimeStep, register_env
 
 from ..message import Message, MessagePool
 
@@ -27,6 +27,7 @@ def action_string_to_action(action: str) -> int:
     return row + column * 3
 
 
+@register_env
 class PettingzooTicTacToe(Environment):
     type_name = "pettingzoo:tictactoe"
 

diff --git a/tests/unit/test_environments.py b/tests/unit/test_environments.py
@@ -1,26 +1,99 @@
 import unittest
 from unittest import TestCase
 
-from chatarena.environments import PettingzooTicTacToe
+from chatarena.config import AgentConfig, BackendConfig, EnvironmentConfig
+from chatarena.environments import (
+    Chameleon,
+    Environment,
+    ModeratedConversation,
+    PettingzooChess,
+    PettingzooTicTacToe,
+    load_environment,
+    register_env,
+)
 
 
 class TestEnvironments(TestCase):
-    def test_chess_environment(self):
-        player_names = ["player1", "player2"]
-        env = PettingzooTicTacToe(player_names)
+    def test_env_registration(self):
+        @register_env
+        class TestEnv(Environment):
+            type_name = "test"
 
+            @classmethod
+            def from_config(cls, config: EnvironmentConfig):
+                return cls(player_names=config.player_names)
+
+        env_config = EnvironmentConfig(
+            env_type="test", player_names=["player1", "player2"]
+        )
+        env = load_environment(env_config)
+        assert isinstance(env, TestEnv)
+
+
+class TestTicTacToeEnvironment(TestCase):
+    def config(self):
+        return EnvironmentConfig(
+            env_type="pettingzoo:tictactoe", player_names=["player1", "player2"]
+        )
+
+    def test_registration_and_loading(self):
+        env = load_environment(self.config())
+        assert isinstance(env, PettingzooTicTacToe)
+
+    def test_game(self):
+        env = load_environment(self.config())
         env.reset()
         assert env.get_next_player() == "player1"
-        env.print()
 
         moves = ["X: (3, 1)", "O: (2, 2)", "X: (1, 2)", "O: (1, 1)"]
 
         for i, move in enumerate(moves):
             assert env.check_action(move, env.get_next_player())
-            timestep = env.step(env.get_next_player(), move)
-            print(timestep.reward)
-            print(timestep.terminal)
-            env.print()
+            env.step(env.get_next_player(), move)
+            assert not env.is_terminal()
+
+
+class TestChameleonEnvironment(TestCase):
+    def test_registration_and_loading(self):
+        config = EnvironmentConfig(
+            env_type="chameleon", player_names=["player1", "player2"]
+        )
+        env = load_environment(config)
+        assert isinstance(env, Chameleon)
+
+
+class TestConversationEnvironment(TestCase):
+    def test_registration_and_loading(self):
+        config = EnvironmentConfig(
+            env_type="conversation", player_names=["player1", "player2"]
+        )
+        env = load_environment(config)
+        assert isinstance(env, Environment)
+
+
+class TestModeratedConversationEnvironment(TestCase):
+    def test_registration_and_loading(self):
+        moderator = AgentConfig(
+            role_desc="moderator",
+            backend=BackendConfig(backend_type="human"),
+            terminal_condition="all_done",
+        )
+        config = EnvironmentConfig(
+            env_type="moderated_conversation",
+            player_names=["player1", "player2"],
+            moderator=moderator,
+        )
+        env = load_environment(config)
+        assert isinstance(env, ModeratedConversation)
+
+
+class TestPettingzooChessEnvironment(TestCase):
+    def test_registration_and_loading(self):
+        config = EnvironmentConfig(
+            env_type="pettingzoo:chess", player_names=["player1", "player2"]
+        )
+        env = load_environment(config)
+        assert isinstance(env, PettingzooChess)
 
 
 if __name__ == "__main__":