Source code for ddql_optimal_execution.agent._twap
from ._agent import Agent
from ddql_optimal_execution import State
# The TWAP class is an agent that calculates the action based on the budget and horizon.
[docs]class TWAP(Agent):
"""
The TWAP class inherits from the Agent class. It is an agent that calculates the action based on the budget and horizon.
It is used to compare the performance of the DDQL agent with the performance of a simple agent that uniformly distributes
its budget over the horizon.
Parameters
----------
initial_budget : int
The initial budget, by default 100
horizon : int
The horizon, by default 100
Attributes
----------
budget : int
The budget of the agent.
horizon : int
The horizon of the agent.
"""
[docs] def get_action(self, state: State) -> int:
"""
This function returns the action to take based on the budget and horizon values.
Args:
state (State): The "state" parameter is an instance of the "State" class, which represents the
current state of the environment in which the agent is operating. It contains information such
as the current time step, the agent's current position, and any other relevant information about
the environment. The "__get_action"
Returns:
an integer value which is the result of the division of the budget attribute of the object by
the horizon attribute of the object.
"""
return self.budget // self.horizon