ghostexec / outputs /training /episode_returns.jsonl
modelbuilderhq's picture
Upload folder using huggingface_hub
ff293b1 verified
{"episode": 0, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 1, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 2, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 3, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 4, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 0, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 1, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 2, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 3, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}
{"episode": 4, "scenario": "phase2_core.json", "backend": "local", "agent": "smart", "return": -6.347039999999998, "length": 12, "mean_step_reward": -0.5289199999999998}