jax[cuda12]==0.5.3
flax==0.10.5
orbax-checkpoint==0.11.23
gymnasium
shimmy==1.3.0
Cython<3
six==1.17.0
tqdm
hydra-core
distrax
tensorboardX==2.6.2.2
scikit-learn==1.6.1
wandb
matplotlib
imageio[ffmpeg]

[humanoidbench]
dm_control==1.0.20
mujoco==3.1.6

[offline]
dm_control<=1.0.20
mujoco<=3.1.6

[online]
dm_control==1.0.27
mujoco==3.2.7
