memorax.algorithms.PQNState#

class memorax.algorithms.PQNState[source]#

Bases: object

PQNState(step: int, timestep: memorax.utils.timestep.Timestep, env_state: gymnax.environments.environment.EnvState, params: flax.core.frozen_dict.FrozenDict[str, typing.Any], hidden_state: jax.jaxlib._jax.Array, optimizer_state: Union[jax.jaxlib._jax.Array, numpy.ndarray, numpy.bool, numpy.number, Iterable[ForwardRef('ArrayTree')], Mapping[Any, ForwardRef('ArrayTree')]])

step: int#
timestep: Timestep#
env_state: EnvState#
params: FrozenDict[str, Any]#
hidden_state: Array#
optimizer_state: Array | ndarray | bool | number | Iterable[ArrayTree] | Mapping[Any, ArrayTree]#
__init__(step, timestep, env_state, params, hidden_state, optimizer_state)#
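Parameters:

step (int)
timestep (Timestep)
env_state (EnvState)
params (FrozenDict[str, Any])
hidden_state (Array)
optimizer_state (Array | ndarray | bool | number | Iterable[ArrayTree] | Mapping[Any, ArrayTree])

Return type:

None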

replace(**updates)#

Returns a new object replacing the specified fields with new values.