# Environment settings, one key per line. The key names suggest a cart-pole
# task; the meanings noted below are inferred from those names and should be
# confirmed against the code that loads this file.

# Presumably the maximum number of steps per episode - TODO confirm.
max_steps: 500
# Location of the robot asset. NOTE(review): looks like a relative path;
# verify what base directory the loader resolves it against.
robot_path: assets/cartpole

# NOTE(review): presumably the pole-angle bound; units are not stated here
# (0.418 would be about 24 degrees if radians) - confirm.
angle_threshold: 0.418
# NOTE(review): presumably the bound on cart position; units not stated.
cart_limit: 2.4

# Reward terms. How these are combined is defined by the consuming code.
reward_alive: 1.0
reward_pole_upright_scale: 1.0
reward_action_penalty_scale: 0.01