from causal_world.actors.base_policy import BaseActorPolicy
import numpy as np
[docs]class RandomActorPolicy(BaseActorPolicy):
"""
This is a policy wrapper for a random actor.
"""
[docs] def __init__(self, low_bound, upper_bound):
super(RandomActorPolicy, self).__init__(identifier="random_policy")
self._low_bound = low_bound
self._upper_bound = upper_bound
return
[docs] def act(self, obs):
"""
The function is called for the agent to act in the world.
:param obs: (nd.array) defines the observations received by the agent
at time step t
:return: (nd.array) defines the action to be executed at time step t
"""
return np.random.uniform(self._low_bound, self._upper_bound)