# Python dependencies, installable with `pip install -r <this file>`.
# pip's requirements format expects one requirement specifier per line;
# several specifiers separated by spaces on one line are rejected as invalid.
# Each entry sets only a minimum version (>=); no upper bounds are pinned.

# Reinforcement-learning environments and algorithms
gymnasium>=0.29
stable-baselines3>=2.3

# Tensor / deep-learning library
torch>=2.2

# Numerics and plotting
numpy>=1.26
matplotlib>=3.8

# Metrics logging and visualisation
tensorboard>=2.16