| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| import unittest |
|
|
| import torch |
|
|
| from verl.protocol import DataProto |
| from verl.utils.debug.metrics import calculate_debug_metrics |
|
|
|
|
| class TestMetrics(unittest.TestCase): |
| def test_calculate_debug_metrics(self): |
| data = DataProto.from_dict( |
| { |
| "rollout_log_probs": torch.tensor( |
| [ |
| [-1.5085, -0.1200, -0.6650, -0.4823, -0.1426, -1.5557, -2.8532, -0.3919, -0.4294, -0.4700], |
| [-0.0585, -0.0573, -0.4681, -0.5187, -0.7451, -1.2737, -0.0682, -0.4284, -0.5754, -0.0611], |
| ] |
| ), |
| "old_log_probs": torch.tensor( |
| [ |
| [-1.8636, -0.7863, -0.2136, -0.4376, -2.0257, -0.2579, -1.1547, -0.5203, -0.3802, -0.9872], |
| [-0.3507, -0.5426, -0.2725, -0.4637, -0.3577, -0.3733, -1.7560, -1.9542, -0.4229, -1.3098], |
| ] |
| ), |
| "loss_mask": torch.tensor([[1, 0, 0, 0, 1, 1, 0, 1, 1, 0], [1, 0, 1, 0, 1, 1, 1, 0, 1, 1]]), |
| "responses": torch.zeros((2, 10)), |
| } |
| ) |
| metrics = calculate_debug_metrics(data) |
| print(metrics) |
| assert metrics["training/rollout_probs_diff_valid"] == 1 |
|
|
|
|
| if __name__ == "__main__": |
| unittest.main() |
|
|