Spaces:
Running
Running
| { | |
| "status": "ok", | |
| "model_source": "merged", | |
| "model_load_error": "", | |
| "samples": 3, | |
| "valid_rate": 1.0, | |
| "avg_env_reward": 0.712333, | |
| "results": [ | |
| { | |
| "idx": 0, | |
| "prompt": "{\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_123\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}", | |
| "completion": "\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_123\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}atheratheratheratheratheratherather(cccccccccccccccccccccccccccccccccccccccccccccccccccccc\ufffd\ufffd\ufffdififififififififiriririririririr\ufffdissississississississississississississississississississississississississ", | |
| "candidate_id": "cand_01", | |
| "selected_candidate": "cand_01", | |
| "env_reward": 0.717, | |
| "done": true, | |
| "valid": true, | |
| "termination_reason": "exploit_detection" | |
| }, | |
| { | |
| "idx": 1, | |
| "prompt": "{\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_124\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}", | |
| "completion": "\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_124\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}FFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFF", | |
| "candidate_id": "cand_01", | |
| "selected_candidate": "cand_01", | |
| "env_reward": 0.703, | |
| "done": true, | |
| "valid": true, | |
| "termination_reason": "exploit_detection" | |
| }, | |
| { | |
| "idx": 2, | |
| "prompt": "{\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_125\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}", | |
| "completion": "\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_125\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}FFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFF", | |
| "candidate_id": "cand_01", | |
| "selected_candidate": "cand_01", | |
| "env_reward": 0.717, | |
| "done": true, | |
| "valid": true, | |
| "termination_reason": "exploit_detection" | |
| } | |
| ] | |
| } |