---
# NOTE(review): this file was previously collapsed onto a single line, which
# is not valid YAML (a plain scalar may not contain ": "). The nesting below
# is reconstructed from key order; confirm it against the consumer's schema,
# in particular that `seed` and the `reward_*` keys belong under `project`.

# Project identity plus seed and reward settings.
project:
  name: polyguard-rl
  # Integer seed; which RNGs consume it is not visible here.
  seed: 42
  # Lower and upper reward limits; presumably rewards are clamped to this
  # range. TODO confirm against the reward code.
  reward_min: 0.001
  reward_max: 0.999
  # Presumably the number of decimal places rewards are rounded to (matches
  # the three decimals used by the bounds above). TODO confirm.
  reward_precision: 3

# Execution settings.
runtime:
  # Named run profile; the set of accepted profile names is defined by the
  # consumer and is not visible in this file.
  profile: full
  # `auto` presumably lets the consumer pick the device itself. TODO confirm.
  device: auto
  # Real YAML boolean (not a string).
  deterministic: true