Spaces:
Sleeping
Sleeping
| name: focusflow-env | |
| version: "2.0.0" | |
| description: > | |
| LLM-hard RL environment for student focus and distraction management. | |
| Agent must handle natural language distraction events, manage cognitive load, | |
| track multi-day deadlines, and justify every decision with graded reasoning. | |
| author: Abdul Hannan | |
| theme: "Theme 3.2 - Personalized Tasks" | |
| hackathon: "Meta x Scaler OpenEnv Hackathon 2026" | |
| license: MIT | |
| environment: | |
| base_url: https://YOUR-HF-SPACE-NAME.hf.space | |
| framework: openenv | |
| language: python | |
| python_version: "3.11" | |
| # OpenEnv HTTP API endpoints | |
| api: | |
| reset: | |
| method: POST | |
| path: /reset | |
| params: | |
| - name: task_id | |
| type: string | |
| default: task_1 | |
| description: Which task to load (task_1, task_2, task_3) | |
| - name: seed | |
| type: integer | |
| default: 42 | |
| - name: session_id | |
| type: string | |
| default: default | |
| description: Unique ID for multi-agent parallel training | |
| step: | |
| method: POST | |
| path: /step | |
| params: | |
| - name: session_id | |
| type: string | |
| default: default | |
| body: FocusAction | |
| state: | |
| method: GET | |
| path: /state | |
| params: | |
| - name: session_id | |
| type: string | |
| default: default | |
| health: | |
| method: GET | |
| path: /health | |
| tasks: | |
| method: GET | |
| path: /tasks | |
| metrics: | |
| method: GET | |
| path: /metrics | |
| # Tasks | |
| tasks: | |
| - id: task_1 | |
| description: Single focused session. Complete one 25-min Pomodoro with zero app checks and handle NL events correctly. | |
| max_steps: 60 | |
| days: 1 | |
| - id: task_2 | |
| description: Multi-session day. Manage cognitive load and defer low-urgency events across 2 sessions. | |
| max_steps: 120 | |
| days: 1 | |
| - id: task_3 | |
| description: Week planner. Plan a 3-day schedule, handle shifting deadlines, and maintain energy levels. | |
| max_steps: 240 | |
| days: 3 | |
| # Action space | |
| actions: | |
| - focus | |
| - block_app | |
| - take_break | |
| - defer_event | |
| - respond_to_event | |
| - plan_day | |
| - adjust_energy | |
| - check_app | |
| - quit_session | |
| # Observation fields | |
| observation: | |
| - time_remaining_seconds | |
| - current_phase | |
| - sessions_completed | |
| - focus_score | |
| - active_distractions | |
| - blocked_apps | |
| - pending_event | |
| - day_context | |
| - cognitive_load | |
| - deadline_pressure | |
| - last_action_feedback | |
| - reasoning_quality_score | |
| # Reward range | |
| reward: | |
| min: -0.60 | |
| max: 0.60 | |
| shaped: true | |
| reasoning_graded: true | |
| # Training | |
| training: | |
| frameworks: [trl, unsloth] | |
| algorithm: GRPO | |
| model: unsloth/Llama-3.2-1B-Instruct | |
| colab_notebook: training_colab.py | |
| tags: | |
| - productivity | |
| - student | |
| - llm-hard | |
| - natural-language-rl | |
| - pomodoro | |
| - llm-agent | |
| - openenv | |
| - meta-hackathon-2026 | |