# Environment and simulation-step settings.
num_envs: 64
device: auto  # auto = cuda if available, else cpu
# NOTE(review): dt * substeps = 0.02, which would match the ~50 Hz recordings
# cited below if dt is in seconds and one control step spans `substeps`
# physics steps — confirm against the consumer of this file.
dt: 0.002
substeps: 10
history_length: 10  # must match training.history_length (DR + embedding)
rma_mode: "none"  # "none" | "teacher" | "deploy"

# ── Domain randomization (sim-to-real) ──────────────────────────────
# Noise/delay levels anchored to the real recordings (~50 Hz, ~0.5 rad/s
# velocity noise, ≤1-step latency). Set domain_rand: {} to disable.
domain_rand:
  qpos_noise_std: 0.01  # rad — encoder angle noise
  qvel_noise_std: 0.5  # rad/s — velocity-estimate noise (measured)
  # NOTE(review): the upper bound (2 steps) exceeds the ≤1-step latency quoted
  # above; presumably deliberate safety margin — confirm.
  action_delay_steps: [0, 2]  # control-step latency (0–40 ms)
  friction_scale: [0.6, 1.6]  # Coulomb-friction multiplier
  damping_scale: [0.6, 1.6]  # viscous-damping multiplier
  torque_scale: [0.85, 1.15]  # motor-constant / battery-voltage variation