Spaces:

c-gohlke
/

LitRL-Inference

Build error

App Files Community

c-gohlke committed on Jan 23, 2024

Commit

5cd7fc9

verified ·

1 Parent(s): aba3e20

Upload folder using huggingface_hub

Browse files

Files changed (2) hide show

src/app.py +4 -4
src/app_state.py +31 -32

src/app.py CHANGED Viewed

@@ -67,7 +67,7 @@ def create_app() -> FastAPI:  # noqa: C901 # TODO move to routes
     @app.post(path="/connect_four/play", response_model=GridResponseType)
     def endpoint_play(
         action: int,
-        app_state: Annotated[AppState, Depends(dependency=AppState)],
     ) -> GridResponseType:
         response = step(app_state.env, action)
         app_state.inform_action(action=action)
@@ -75,7 +75,7 @@ def create_app() -> FastAPI:  # noqa: C901 # TODO move to routes
     @app.get(path="/connect_four/observe", response_model=GridResponseType)
     def endpoint_observe(
-        app_state: Annotated[AppState, Depends(dependency=AppState)],
     ) -> GridResponseType:
         return observe(app_state.env)
@@ -96,7 +96,7 @@ def create_app() -> FastAPI:  # noqa: C901 # TODO move to routes
     @app.get(path="/connect_four/bot_progress", response_model=float)
     def endpoint_bot_progress(
-        app_state: Annotated[AppState, Depends(dependency=AppState)],
     ) -> float:
         if isinstance(app_state.agent, MCTSAgent):
             if app_state.cpu_config.simulations is None:
@@ -110,7 +110,7 @@ def create_app() -> FastAPI:  # noqa: C901 # TODO move to routes
     @app.get(path="/connect_four/reset", response_model=GridResponseType)
     def endpoint_reset(
-        app_state: Annotated[AppState, Depends(dependency=AppState)],
     ) -> GridResponseType:
         app_state.env.reset()
         return observe(app_state.env)

     @app.post(path="/connect_four/play", response_model=GridResponseType)
     def endpoint_play(
         action: int,
+        app_state: Annotated[AppState, Depends(dependency=get_app_state)],
     ) -> GridResponseType:
         response = step(app_state.env, action)
         app_state.inform_action(action=action)
     @app.get(path="/connect_four/observe", response_model=GridResponseType)
     def endpoint_observe(
+        app_state: Annotated[AppState, Depends(dependency=get_app_state)],
     ) -> GridResponseType:
         return observe(app_state.env)
     @app.get(path="/connect_four/bot_progress", response_model=float)
     def endpoint_bot_progress(
+        app_state: Annotated[AppState, Depends(dependency=get_app_state)],
     ) -> float:
         if isinstance(app_state.agent, MCTSAgent):
             if app_state.cpu_config.simulations is None:
     @app.get(path="/connect_four/reset", response_model=GridResponseType)
     def endpoint_reset(
+        app_state: Annotated[AppState, Depends(dependency=get_app_state)],
     ) -> GridResponseType:
         app_state.env.reset()
         return observe(app_state.env)

src/app_state.py CHANGED Viewed

@@ -1,4 +1,11 @@
-from typing import Any, Self
 from loguru import logger
@@ -42,42 +49,34 @@ class AppState:
             logger.info("cpu_config unchanged")
     def create_rollout(self) -> Agent[Any, Any]:
-        match self.cpu_config.rollout_policy:
-            case None:
-                return RandomMultiAgent()
-            case RolloutPolicy.SAC:
-                return OnnxSacDeterministicMultiAgent()
-            case RolloutPolicy.RANDOM:
-                return RandomMultiAgent()
-            case _:
-                msg = f"cpu_config.rollout_policy: {self.cpu_config.rollout_policy}"
-                raise NotImplementedError(msg)
     def set_agent(self) -> None:
-        match self.cpu_config.agent_type.value:
-            case AgentType.MCTS.value:
-                rollout_agent = self.create_rollout()
-                # fmt: off
-                mcts_config = (
-                    MCTSConfigBuilder()
-                    .set_simulations(self.cpu_config.simulations or 50)
-                    .set_rollout_strategy(VanillaRollout(rollout_agent=rollout_agent))
-                ).build()
-                # fmt: on
-                self.agent = MCTSAgent(cfg=mcts_config)
-                logger.debug("set_agent: MCTSAgent")
-            case AgentType.RANDOM.value:
-                self.agent = RandomMultiAgent()
-            case AgentType.SAC.value:
-                self.agent = OnnxSacDeterministicMultiAgent()  # type: ignore[assignment]  # TODO
-            case _:
-                msg = f"cpu_config.name: {self.cpu_config.agent_type}"
-                raise NotImplementedError(msg)
     def get_action(self) -> int:
         return self.agent.get_action(env=self.env)
     def inform_action(self, action: int) -> None:
         """Update the agent's state as a result of external changes to the environment."""
-        if isinstance(self.agent, MCTSAgent) and self.agent.mcts is not None:
-            self.agent.mcts.update_root(action)

+from typing import Any
+import numpy as np
+try:
+    from typing import Self
+except ImportError:
+    from typing_extensions import Self
 from loguru import logger
             logger.info("cpu_config unchanged")
     def create_rollout(self) -> Agent[Any, Any]:
+        if self.cpu_config.rollout_policy == RolloutPolicy.SAC:
+            return OnnxSacDeterministicMultiAgent()
+        return RandomMultiAgent(np.random.default_rng(seed=123))
     def set_agent(self) -> None:
+        if self.cpu_config.agent_type.value == AgentType.MCTS.value:
+            rollout_agent = self.create_rollout()
+            # fmt: off
+            mcts_config = (
+                MCTSConfigBuilder()
+                .set_simulations(self.cpu_config.simulations or 50)
+                .set_rollout_strategy(VanillaRollout(rollout_agent=rollout_agent))
+            ).build()
+            # fmt: on
+            self.agent = MCTSAgent(cfg=mcts_config)
+            logger.debug("set_agent: MCTSAgent")
+        elif self.cpu_config.agent_type.value == AgentType.RANDOM.value:
+            self.agent = RandomMultiAgent()
+        elif self.cpu_config.agent_type.value == AgentType.SAC.value:
+            self.agent = OnnxSacDeterministicMultiAgent()  # type: ignore[assignment]  # TODO
+        else:
+            msg = f"cpu_config.name: {self.cpu_config.agent_type}"
+            raise NotImplementedError(msg)
     def get_action(self) -> int:
         return self.agent.get_action(env=self.env)
     def inform_action(self, action: int) -> None:
         """Update the agent's state as a result of external changes to the environment."""
+        if isinstance(self.agent, MCTSAgent):
+            self.agent.inform_action(action)