from app.common.normalization import clamp_reward


def test_reward_range_clamp() -> None:
    """Check that ``clamp_reward`` keeps its result within [0.001, 0.999].

    Asserts that an input far below the range yields exactly 0.001, that an
    input far above the range yields exactly 0.999, and that a mid-range
    input yields a value inside the closed interval.
    """
    # Out-of-range inputs are expected to land exactly on the bounds.
    assert clamp_reward(-10) == 0.001
    assert clamp_reward(10) == 0.999
    # For 0.55 only the range is checked; the exact output is not pinned here.
    assert 0.001 <= clamp_reward(0.55) <= 0.999