Spaces:
Sleeping
Sleeping
Upload server/redveil_environment.py with huggingface_hub
Browse files
server/redveil_environment.py
CHANGED
|
@@ -20,10 +20,6 @@ from uuid import uuid4
|
|
| 20 |
from openenv.core.env_server.interfaces import Environment
|
| 21 |
from openenv.core.env_server.types import State
|
| 22 |
|
| 23 |
-
import sys as _sys
|
| 24 |
-
import os as _os
|
| 25 |
-
_sys.path.insert(0, _os.path.dirname(_os.path.dirname(_os.path.abspath(__file__))))
|
| 26 |
-
|
| 27 |
try:
|
| 28 |
from ..models import ActionType, RedVeilAction, RedVeilObservation
|
| 29 |
from ..noise import DeceptionEngine, NoiseEngine
|
|
@@ -31,11 +27,11 @@ try:
|
|
| 31 |
from ..grader import grade_task
|
| 32 |
from ..vulnerable_app import create_vulnerable_app
|
| 33 |
except (ImportError, ModuleNotFoundError):
|
| 34 |
-
from
|
| 35 |
-
from
|
| 36 |
-
from
|
| 37 |
-
from
|
| 38 |
-
from
|
| 39 |
|
| 40 |
|
| 41 |
# ---------------------------------------------------------------------------
|
|
@@ -216,7 +212,7 @@ class RedVeilEnvironment(Environment):
|
|
| 216 |
task_description=self._task.description,
|
| 217 |
milestones_reached=[],
|
| 218 |
done=False,
|
| 219 |
-
reward=0.
|
| 220 |
)
|
| 221 |
|
| 222 |
def step(
|
|
@@ -661,15 +657,15 @@ class RedVeilEnvironment(Environment):
|
|
| 661 |
def _compute_reward(self) -> float:
|
| 662 |
milestones = self._get_reached_milestones()
|
| 663 |
if not milestones or not self._task:
|
| 664 |
-
return 0.
|
| 665 |
|
| 666 |
-
reward = 0.
|
| 667 |
milestone_rewards = {name: val for name, val in self._task.milestones}
|
| 668 |
for m in milestones:
|
| 669 |
if m in milestone_rewards:
|
| 670 |
reward = max(reward, milestone_rewards[m])
|
| 671 |
|
| 672 |
-
return round(reward, 2)
|
| 673 |
|
| 674 |
@property
|
| 675 |
def state(self) -> State:
|
|
|
|
| 20 |
from openenv.core.env_server.interfaces import Environment
|
| 21 |
from openenv.core.env_server.types import State
|
| 22 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
try:
|
| 24 |
from ..models import ActionType, RedVeilAction, RedVeilObservation
|
| 25 |
from ..noise import DeceptionEngine, NoiseEngine
|
|
|
|
| 27 |
from ..grader import grade_task
|
| 28 |
from ..vulnerable_app import create_vulnerable_app
|
| 29 |
except (ImportError, ModuleNotFoundError):
|
| 30 |
+
from models import ActionType, RedVeilAction, RedVeilObservation
|
| 31 |
+
from noise import DeceptionEngine, NoiseEngine
|
| 32 |
+
from tasks import ALL_TASKS, TaskConfig
|
| 33 |
+
from grader import grade_task
|
| 34 |
+
from vulnerable_app import create_vulnerable_app
|
| 35 |
|
| 36 |
|
| 37 |
# ---------------------------------------------------------------------------
|
|
|
|
| 212 |
task_description=self._task.description,
|
| 213 |
milestones_reached=[],
|
| 214 |
done=False,
|
| 215 |
+
reward=0.01,
|
| 216 |
)
|
| 217 |
|
| 218 |
def step(
|
|
|
|
| 657 |
def _compute_reward(self) -> float:
|
| 658 |
milestones = self._get_reached_milestones()
|
| 659 |
if not milestones or not self._task:
|
| 660 |
+
return 0.01
|
| 661 |
|
| 662 |
+
reward = 0.01
|
| 663 |
milestone_rewards = {name: val for name, val in self._task.milestones}
|
| 664 |
for m in milestones:
|
| 665 |
if m in milestone_rewards:
|
| 666 |
reward = max(reward, milestone_rewards[m])
|
| 667 |
|
| 668 |
+
return max(0.01, min(0.99, round(reward, 2)))
|
| 669 |
|
| 670 |
@property
|
| 671 |
def state(self) -> State:
|