polyguard-openenv / docs /results /postsave_inference.json
TheJackBright's picture
Deploy PolyGuard OpenEnv Space
877add7 verified
{
"status": "ok",
"model_source": "merged",
"model_load_error": "",
"samples": 3,
"valid_rate": 1.0,
"avg_env_reward": 0.712333,
"results": [
{
"idx": 0,
"prompt": "{\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_123\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}",
"completion": "\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_123\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}atheratheratheratheratheratherather(cccccccccccccccccccccccccccccccccccccccccccccccccccccc\ufffd\ufffd\ufffdififififififififiriririririririr\ufffdissississississississississississississississississississississississississ",
"candidate_id": "cand_01",
"selected_candidate": "cand_01",
"env_reward": 0.717,
"done": true,
"valid": true,
"termination_reason": "exploit_detection"
},
{
"idx": 1,
"prompt": "{\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_124\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}",
"completion": "\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_124\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}FFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFF",
"candidate_id": "cand_01",
"selected_candidate": "cand_01",
"env_reward": 0.703,
"done": true,
"valid": true,
"termination_reason": "exploit_detection"
},
{
"idx": 2,
"prompt": "{\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_125\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}",
"completion": "\"instruction\": \"Choose one candidate_id and justify briefly.\", \"patient_id\": \"patient_125\", \"candidate_ids\": [\"cand_01\", \"cand_02\", \"cand_03\", \"cand_04\", \"cand_05\", \"cand_08\", \"cand_09\", \"cand_10\"], \"format\": \"candidate_id=<cand_xx>; rationale=<text>\"}FFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFF",
"candidate_id": "cand_01",
"selected_candidate": "cand_01",
"env_reward": 0.717,
"done": true,
"valid": true,
"termination_reason": "exploit_detection"
}
]
}